diff --git "a/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" --- "a/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" +++ "b/wandb/run-20220228_163348-20lja62k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.555, "train/learning_rate": 2.801161103047896e-06, "train/epoch": 0.84, "train/global_step": 1000, "_runtime": 5844, "_timestamp": 1646071873, "_step": 1001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 222.0, 793.0, 2.0, 1.0], "bins": [-997.938720703125, -981.618896484375, -965.2991333007812, -948.9793090820312, -932.6594848632812, -916.3397216796875, -900.0198974609375, -883.7000732421875, -867.3803100585938, -851.0604858398438, -834.74072265625, -818.4208984375, -802.10107421875, -785.7813110351562, -769.4614868164062, -753.1416625976562, -736.8218994140625, -720.5020751953125, -704.1823120117188, -687.8624877929688, -671.5426635742188, -655.222900390625, -638.903076171875, -622.583251953125, -606.263427734375, -589.943603515625, -573.6238403320312, -557.3040161132812, -540.9841918945312, -524.6644287109375, -508.3446044921875, -492.0248107910156, -475.705078125, -459.3852844238281, -443.0654602050781, -426.74566650390625, -410.4258728027344, -394.1060791015625, -377.7862548828125, -361.4664611816406, -345.1466369628906, -328.82684326171875, -312.50701904296875, -296.1872253417969, -279.867431640625, -263.547607421875, -247.22781372070312, -230.90802001953125, -214.5882110595703, -198.26840209960938, -181.9486083984375, -165.62879943847656, -149.30899047851562, -132.98919677734375, -116.66938781738281, -100.3495864868164, -84.02978515625, -67.7099838256836, -51.39017868041992, -35.07037353515625, -18.750572204589844, -2.4307708740234375, 13.8890380859375, 30.208839416503906, 46.52863693237305]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 7.0, 6.0, 6.0, 22.0, 16.0, 24.0, 32.0, 36.0, 44.0, 52.0, 62.0, 60.0, 60.0, 75.0, 54.0, 73.0, 67.0, 75.0, 61.0, 44.0, 31.0, 33.0, 16.0, 13.0, 8.0, 12.0, 7.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.51752471923828, -85.005126953125, -82.49272918701172, -79.98033142089844, -77.46794128417969, -74.9555435180664, -72.44314575195312, -69.93074798583984, -67.41835021972656, -64.90595245361328, -62.3935546875, -59.881160736083984, -57.3687629699707, -54.85636520385742, -52.343971252441406, -49.831573486328125, -47.319175720214844, -44.80677795410156, -42.29438018798828, -39.781986236572266, -37.269588470458984, -34.7571907043457, -32.24479675292969, -29.732398986816406, -27.220001220703125, -24.707603454589844, -22.195207595825195, -19.682811737060547, -17.170413970947266, -14.6580171585083, -12.145620346069336, -9.633224487304688, -7.1208343505859375, -4.608437538146973, -2.096040725708008, 0.41635608673095703, 2.928752899169922, 5.441149711608887, 7.953546524047852, 10.4659423828125, 12.978340148925781, 15.490736961364746, 18.00313377380371, 20.51552963256836, 23.02792739868164, 25.540325164794922, 28.05272102355957, 30.56511688232422, 33.0775146484375, 35.58991241455078, 38.10231018066406, 40.61470413208008, 43.12710189819336, 45.63949966430664, 48.151893615722656, 50.66429138183594, 53.17668914794922, 55.6890869140625, 58.20148468017578, 60.7138786315918, 63.22627639770508, 65.7386703491211, 68.25106811523438, 70.76346588134766, 73.27586364746094]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 7.0, 0.0, 4.0, 7.0, 8.0, 11.0, 11.0, 13.0, 14.0, 26.0, 21.0, 21.0, 34.0, 28.0, 28.0, 28.0, 31.0, 39.0, 43.0, 34.0, 46.0, 40.0, 44.0, 32.0, 43.0, 43.0, 45.0, 45.0, 36.0, 30.0, 26.0, 30.0, 23.0, 24.0, 14.0, 16.0, 10.0, 13.0, 13.0, 6.0, 4.0, 8.0, 5.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.15234375, -4.03729248046875, -3.9222412109375, -3.80718994140625, -3.692138671875, -3.57708740234375, -3.4620361328125, -3.34698486328125, -3.23193359375, -3.11688232421875, -3.0018310546875, -2.88677978515625, -2.771728515625, -2.65667724609375, -2.5416259765625, -2.42657470703125, -2.3115234375, -2.19647216796875, -2.0814208984375, -1.96636962890625, -1.851318359375, -1.73626708984375, -1.6212158203125, -1.50616455078125, -1.39111328125, -1.27606201171875, -1.1610107421875, -1.04595947265625, -0.930908203125, -0.81585693359375, -0.7008056640625, -0.58575439453125, -0.470703125, -0.35565185546875, -0.2406005859375, -0.12554931640625, -0.010498046875, 0.10455322265625, 0.2196044921875, 0.33465576171875, 0.44970703125, 0.56475830078125, 0.6798095703125, 0.79486083984375, 0.909912109375, 1.02496337890625, 1.1400146484375, 1.25506591796875, 1.3701171875, 1.48516845703125, 1.6002197265625, 1.71527099609375, 1.830322265625, 1.94537353515625, 2.0604248046875, 2.17547607421875, 2.29052734375, 2.40557861328125, 2.5206298828125, 2.63568115234375, 2.750732421875, 2.86578369140625, 2.9808349609375, 3.09588623046875, 3.2109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 15.0, 13.0, 12.0, 26.0, 40.0, 39.0, 46.0, 71.0, 93.0, 117.0, 168.0, 223.0, 289.0, 415.0, 618.0, 1045.0, 1504.0, 2588.0, 5207.0, 12011.0, 37021.0, 198837.0, 1465609.0, 2033232.0, 349805.0, 55069.0, 15510.0, 6386.0, 3118.0, 1729.0, 1032.0, 712.0, 455.0, 357.0, 210.0, 151.0, 115.0, 87.0, 72.0, 46.0, 40.0, 36.0, 43.0, 24.0, 11.0, 9.0, 14.0, 3.0, 1.0, 2.0, 3.0], "bins": [-10.859375, -10.558837890625, -10.25830078125, -9.957763671875, -9.6572265625, -9.356689453125, -9.05615234375, -8.755615234375, -8.455078125, -8.154541015625, -7.85400390625, -7.553466796875, -7.2529296875, -6.952392578125, -6.65185546875, -6.351318359375, -6.05078125, -5.750244140625, -5.44970703125, -5.149169921875, -4.8486328125, -4.548095703125, -4.24755859375, -3.947021484375, -3.646484375, -3.345947265625, -3.04541015625, -2.744873046875, -2.4443359375, -2.143798828125, -1.84326171875, -1.542724609375, -1.2421875, -0.941650390625, -0.64111328125, -0.340576171875, -0.0400390625, 0.260498046875, 0.56103515625, 0.861572265625, 1.162109375, 1.462646484375, 1.76318359375, 2.063720703125, 2.3642578125, 2.664794921875, 2.96533203125, 3.265869140625, 3.56640625, 3.866943359375, 4.16748046875, 4.468017578125, 4.7685546875, 5.069091796875, 5.36962890625, 5.670166015625, 5.970703125, 6.271240234375, 6.57177734375, 6.872314453125, 7.1728515625, 7.473388671875, 7.77392578125, 8.074462890625, 8.375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 7.0, 8.0, 8.0, 19.0, 31.0, 49.0, 116.0, 174.0, 329.0, 576.0, 932.0, 817.0, 483.0, 247.0, 112.0, 75.0, 43.0, 18.0, 13.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.328125, -28.53173828125, -27.7353515625, -26.93896484375, -26.142578125, -25.34619140625, -24.5498046875, -23.75341796875, -22.95703125, -22.16064453125, -21.3642578125, -20.56787109375, -19.771484375, -18.97509765625, -18.1787109375, -17.38232421875, -16.5859375, -15.78955078125, -14.9931640625, -14.19677734375, -13.400390625, -12.60400390625, -11.8076171875, -11.01123046875, -10.21484375, -9.41845703125, -8.6220703125, -7.82568359375, -7.029296875, -6.23291015625, -5.4365234375, -4.64013671875, -3.84375, -3.04736328125, -2.2509765625, -1.45458984375, -0.658203125, 0.13818359375, 0.9345703125, 1.73095703125, 2.52734375, 3.32373046875, 4.1201171875, 4.91650390625, 5.712890625, 6.50927734375, 7.3056640625, 8.10205078125, 8.8984375, 9.69482421875, 10.4912109375, 11.28759765625, 12.083984375, 12.88037109375, 13.6767578125, 14.47314453125, 15.26953125, 16.06591796875, 16.8623046875, 17.65869140625, 18.455078125, 19.25146484375, 20.0478515625, 20.84423828125, 21.640625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 7.0, 11.0, 17.0, 25.0, 42.0, 68.0, 127.0, 283.0, 561.0, 1238.0, 6056.0, 3853586.0, 327561.0, 2995.0, 878.0, 408.0, 182.0, 97.0, 52.0, 29.0, 17.0, 14.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.375, -84.7138671875, -82.052734375, -79.3916015625, -76.73046875, -74.0693359375, -71.408203125, -68.7470703125, -66.0859375, -63.4248046875, -60.763671875, -58.1025390625, -55.44140625, -52.7802734375, -50.119140625, -47.4580078125, -44.796875, -42.1357421875, -39.474609375, -36.8134765625, -34.15234375, -31.4912109375, -28.830078125, -26.1689453125, -23.5078125, -20.8466796875, -18.185546875, -15.5244140625, -12.86328125, -10.2021484375, -7.541015625, -4.8798828125, -2.21875, 0.4423828125, 3.103515625, 5.7646484375, 8.42578125, 11.0869140625, 13.748046875, 16.4091796875, 19.0703125, 21.7314453125, 24.392578125, 27.0537109375, 29.71484375, 32.3759765625, 35.037109375, 37.6982421875, 40.359375, 43.0205078125, 45.681640625, 48.3427734375, 51.00390625, 53.6650390625, 56.326171875, 58.9873046875, 61.6484375, 64.3095703125, 66.970703125, 69.6318359375, 72.29296875, 74.9541015625, 77.615234375, 80.2763671875, 82.9375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 124.0, 879.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.61348342895508, -30.83932876586914, -18.065176010131836, -5.291023254394531, 7.483131408691406, 20.257286071777344, 33.031436920166016, 45.80559158325195, 58.57974624633789, 71.35389709472656, 84.1280517578125, 96.90220642089844, 109.67636108398438, 122.45051574707031, 135.22467041015625, 147.9988250732422, 160.77297973632812, 173.54713439941406, 186.3212890625, 199.09544372558594, 211.86959838867188, 224.6437530517578, 237.41790771484375, 250.19204711914062, 262.9662170410156, 275.7403564453125, 288.5145263671875, 301.2886657714844, 314.0628356933594, 326.83697509765625, 339.61114501953125, 352.3852844238281, 365.1594543457031, 377.93359375, 390.707763671875, 403.4819030761719, 416.2560729980469, 429.03021240234375, 441.80438232421875, 454.5785217285156, 467.3526916503906, 480.1268310546875, 492.9010009765625, 505.6751403808594, 518.4492797851562, 531.2234497070312, 543.9976196289062, 556.7717895507812, 569.5458984375, 582.320068359375, 595.0941772460938, 607.8683471679688, 620.6425170898438, 633.4166870117188, 646.1907958984375, 658.9649658203125, 671.7391357421875, 684.5133056640625, 697.2874145507812, 710.0615844726562, 722.8357543945312, 735.6099243164062, 748.384033203125, 761.158203125, 773.932373046875]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 8.0, 15.0, 14.0, 19.0, 21.0, 25.0, 31.0, 29.0, 40.0, 46.0, 33.0, 41.0, 46.0, 44.0, 55.0, 58.0, 37.0, 44.0, 47.0, 37.0, 41.0, 27.0, 32.0, 35.0, 21.0, 29.0, 15.0, 21.0, 16.0, 10.0, 14.0, 9.0, 7.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.82135009765625, -55.056297302246094, -53.29124450683594, -51.52619171142578, -49.761138916015625, -47.99608612060547, -46.23102951049805, -44.46597671508789, -42.700923919677734, -40.93587112426758, -39.17081832885742, -37.405765533447266, -35.640708923339844, -33.87565612792969, -32.11060333251953, -30.345550537109375, -28.58049774169922, -26.815444946289062, -25.050392150878906, -23.285337448120117, -21.52028465270996, -19.755231857299805, -17.990177154541016, -16.22512435913086, -14.460071563720703, -12.695018768310547, -10.929965019226074, -9.164911270141602, -7.399858474731445, -5.634805679321289, -3.8697519302368164, -2.1046981811523438, -0.3396453857421875, 1.425407886505127, 3.1904611587524414, 4.955514430999756, 6.72056770324707, 8.485620498657227, 10.2506742477417, 12.015727996826172, 13.780780792236328, 15.545833587646484, 17.31088638305664, 19.07594108581543, 20.840993881225586, 22.606046676635742, 24.37110137939453, 26.136154174804688, 27.901206970214844, 29.666259765625, 31.431312561035156, 33.19636535644531, 34.96141815185547, 36.726470947265625, 38.49152755737305, 40.2565803527832, 42.02163314819336, 43.786685943603516, 45.55173873901367, 47.31679153442383, 49.08184814453125, 50.846900939941406, 52.61195373535156, 54.37700653076172, 56.142059326171875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 11.0, 10.0, 12.0, 15.0, 15.0, 16.0, 24.0, 23.0, 23.0, 30.0, 27.0, 29.0, 37.0, 31.0, 36.0, 52.0, 45.0, 50.0, 33.0, 41.0, 45.0, 39.0, 28.0, 37.0, 39.0, 33.0, 30.0, 24.0, 23.0, 15.0, 19.0, 14.0, 16.0, 10.0, 8.0, 20.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.44921875, -4.3258056640625, -4.202392578125, -4.0789794921875, -3.95556640625, -3.8321533203125, -3.708740234375, -3.5853271484375, -3.4619140625, -3.3385009765625, -3.215087890625, -3.0916748046875, -2.96826171875, -2.8448486328125, -2.721435546875, -2.5980224609375, -2.474609375, -2.3511962890625, -2.227783203125, -2.1043701171875, -1.98095703125, -1.8575439453125, -1.734130859375, -1.6107177734375, -1.4873046875, -1.3638916015625, -1.240478515625, -1.1170654296875, -0.99365234375, -0.8702392578125, -0.746826171875, -0.6234130859375, -0.5, -0.3765869140625, -0.253173828125, -0.1297607421875, -0.00634765625, 0.1170654296875, 0.240478515625, 0.3638916015625, 0.4873046875, 0.6107177734375, 0.734130859375, 0.8575439453125, 0.98095703125, 1.1043701171875, 1.227783203125, 1.3511962890625, 1.474609375, 1.5980224609375, 1.721435546875, 1.8448486328125, 1.96826171875, 2.0916748046875, 2.215087890625, 2.3385009765625, 2.4619140625, 2.5853271484375, 2.708740234375, 2.8321533203125, 2.95556640625, 3.0789794921875, 3.202392578125, 3.3258056640625, 3.44921875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 13.0, 23.0, 27.0, 36.0, 68.0, 94.0, 109.0, 178.0, 280.0, 378.0, 574.0, 827.0, 1245.0, 1806.0, 2588.0, 3828.0, 5682.0, 8442.0, 12824.0, 19129.0, 30210.0, 46890.0, 75127.0, 122378.0, 204956.0, 194205.0, 115956.0, 71225.0, 44968.0, 28780.0, 18232.0, 12263.0, 8164.0, 5440.0, 3637.0, 2511.0, 1717.0, 1201.0, 780.0, 603.0, 346.0, 243.0, 184.0, 135.0, 87.0, 47.0, 32.0, 29.0, 21.0, 15.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0], "bins": [-0.54345703125, -0.5269622802734375, -0.510467529296875, -0.4939727783203125, -0.47747802734375, -0.4609832763671875, -0.444488525390625, -0.4279937744140625, -0.4114990234375, -0.3950042724609375, -0.378509521484375, -0.3620147705078125, -0.34552001953125, -0.3290252685546875, -0.312530517578125, -0.2960357666015625, -0.279541015625, -0.2630462646484375, -0.246551513671875, -0.2300567626953125, -0.21356201171875, -0.1970672607421875, -0.180572509765625, -0.1640777587890625, -0.1475830078125, -0.1310882568359375, -0.114593505859375, -0.0980987548828125, -0.08160400390625, -0.0651092529296875, -0.048614501953125, -0.0321197509765625, -0.015625, 0.0008697509765625, 0.017364501953125, 0.0338592529296875, 0.05035400390625, 0.0668487548828125, 0.083343505859375, 0.0998382568359375, 0.1163330078125, 0.1328277587890625, 0.149322509765625, 0.1658172607421875, 0.18231201171875, 0.1988067626953125, 0.215301513671875, 0.2317962646484375, 0.248291015625, 0.2647857666015625, 0.281280517578125, 0.2977752685546875, 0.31427001953125, 0.3307647705078125, 0.347259521484375, 0.3637542724609375, 0.3802490234375, 0.3967437744140625, 0.413238525390625, 0.4297332763671875, 0.44622802734375, 0.4627227783203125, 0.479217529296875, 0.4957122802734375, 0.51220703125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 7.0, 2.0, 5.0, 13.0, 8.0, 14.0, 14.0, 20.0, 18.0, 20.0, 25.0, 34.0, 49.0, 36.0, 35.0, 34.0, 49.0, 51.0, 40.0, 1064.0, 48.0, 48.0, 37.0, 36.0, 38.0, 28.0, 24.0, 46.0, 26.0, 23.0, 20.0, 21.0, 18.0, 9.0, 15.0, 9.0, 7.0, 6.0, 8.0, 8.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.135223388671875, -2.05169677734375, -1.968170166015625, -1.8846435546875, -1.801116943359375, -1.71759033203125, -1.634063720703125, -1.550537109375, -1.467010498046875, -1.38348388671875, -1.299957275390625, -1.2164306640625, -1.132904052734375, -1.04937744140625, -0.965850830078125, -0.88232421875, -0.798797607421875, -0.71527099609375, -0.631744384765625, -0.5482177734375, -0.464691162109375, -0.38116455078125, -0.297637939453125, -0.214111328125, -0.130584716796875, -0.04705810546875, 0.036468505859375, 0.1199951171875, 0.203521728515625, 0.28704833984375, 0.370574951171875, 0.4541015625, 0.537628173828125, 0.62115478515625, 0.704681396484375, 0.7882080078125, 0.871734619140625, 0.95526123046875, 1.038787841796875, 1.122314453125, 1.205841064453125, 1.28936767578125, 1.372894287109375, 1.4564208984375, 1.539947509765625, 1.62347412109375, 1.707000732421875, 1.79052734375, 1.874053955078125, 1.95758056640625, 2.041107177734375, 2.1246337890625, 2.208160400390625, 2.29168701171875, 2.375213623046875, 2.458740234375, 2.542266845703125, 2.62579345703125, 2.709320068359375, 2.7928466796875, 2.876373291015625, 2.95989990234375, 3.043426513671875, 3.126953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 13.0, 18.0, 28.0, 35.0, 66.0, 117.0, 118.0, 223.0, 287.0, 447.0, 712.0, 1014.0, 1555.0, 2518.0, 3847.0, 5808.0, 9262.0, 14358.0, 23662.0, 38844.0, 66718.0, 117951.0, 223409.0, 1283368.0, 124935.0, 69955.0, 40919.0, 24445.0, 15249.0, 9563.0, 6089.0, 3925.0, 2720.0, 1582.0, 1168.0, 756.0, 468.0, 318.0, 222.0, 164.0, 103.0, 49.0, 41.0, 25.0, 20.0, 15.0, 3.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.591796875, -0.5738906860351562, -0.5559844970703125, -0.5380783081054688, -0.520172119140625, -0.5022659301757812, -0.4843597412109375, -0.46645355224609375, -0.44854736328125, -0.43064117431640625, -0.4127349853515625, -0.39482879638671875, -0.376922607421875, -0.35901641845703125, -0.3411102294921875, -0.32320404052734375, -0.3052978515625, -0.28739166259765625, -0.2694854736328125, -0.25157928466796875, -0.233673095703125, -0.21576690673828125, -0.1978607177734375, -0.17995452880859375, -0.16204833984375, -0.14414215087890625, -0.1262359619140625, -0.10832977294921875, -0.090423583984375, -0.07251739501953125, -0.0546112060546875, -0.03670501708984375, -0.018798828125, -0.00089263916015625, 0.0170135498046875, 0.03491973876953125, 0.052825927734375, 0.07073211669921875, 0.0886383056640625, 0.10654449462890625, 0.12445068359375, 0.14235687255859375, 0.1602630615234375, 0.17816925048828125, 0.196075439453125, 0.21398162841796875, 0.2318878173828125, 0.24979400634765625, 0.2677001953125, 0.28560638427734375, 0.3035125732421875, 0.32141876220703125, 0.339324951171875, 0.35723114013671875, 0.3751373291015625, 0.39304351806640625, 0.41094970703125, 0.42885589599609375, 0.4467620849609375, 0.46466827392578125, 0.482574462890625, 0.5004806518554688, 0.5183868408203125, 0.5362930297851562, 0.55419921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 14.0, 8.0, 9.0, 25.0, 30.0, 33.0, 57.0, 54.0, 61.0, 76.0, 76.0, 72.0, 94.0, 57.0, 62.0, 66.0, 42.0, 42.0, 38.0, 28.0, 10.0, 9.0, 7.0, 7.0, 1.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009570121765136719, -0.0009286552667617798, -0.0009002983570098877, -0.0008719414472579956, -0.0008435845375061035, -0.0008152276277542114, -0.0007868707180023193, -0.0007585138082504272, -0.0007301568984985352, -0.0007017999887466431, -0.000673443078994751, -0.0006450861692428589, -0.0006167292594909668, -0.0005883723497390747, -0.0005600154399871826, -0.0005316585302352905, -0.0005033016204833984, -0.00047494471073150635, -0.00044658780097961426, -0.00041823089122772217, -0.0003898739814758301, -0.000361517071723938, -0.0003331601619720459, -0.0003048032522201538, -0.0002764463424682617, -0.00024808943271636963, -0.00021973252296447754, -0.00019137561321258545, -0.00016301870346069336, -0.00013466179370880127, -0.00010630488395690918, -7.794797420501709e-05, -4.9591064453125e-05, -2.123415470123291e-05, 7.12275505065918e-06, 3.547966480255127e-05, 6.383657455444336e-05, 9.219348430633545e-05, 0.00012055039405822754, 0.00014890730381011963, 0.00017726421356201172, 0.0002056211233139038, 0.0002339780330657959, 0.000262334942817688, 0.0002906918525695801, 0.00031904876232147217, 0.00034740567207336426, 0.00037576258182525635, 0.00040411949157714844, 0.00043247640132904053, 0.0004608333110809326, 0.0004891902208328247, 0.0005175471305847168, 0.0005459040403366089, 0.000574260950088501, 0.0006026178598403931, 0.0006309747695922852, 0.0006593316793441772, 0.0006876885890960693, 0.0007160454988479614, 0.0007444024085998535, 0.0007727593183517456, 0.0008011162281036377, 0.0008294731378555298, 0.0008578300476074219]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 11.0, 17.0, 8.0, 25.0, 31.0, 56.0, 82.0, 117.0, 180.0, 290.0, 356.0, 633.0, 9574.0, 1034878.0, 869.0, 475.0, 308.0, 207.0, 162.0, 79.0, 56.0, 27.0, 28.0, 24.0, 13.0, 13.0, 9.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01702880859375, -0.016445636749267578, -0.015862464904785156, -0.015279293060302734, -0.014696121215820312, -0.01411294937133789, -0.013529777526855469, -0.012946605682373047, -0.012363433837890625, -0.011780261993408203, -0.011197090148925781, -0.01061391830444336, -0.010030746459960938, -0.009447574615478516, -0.008864402770996094, -0.008281230926513672, -0.00769805908203125, -0.007114887237548828, -0.006531715393066406, -0.005948543548583984, -0.0053653717041015625, -0.004782199859619141, -0.004199028015136719, -0.003615856170654297, -0.003032684326171875, -0.002449512481689453, -0.0018663406372070312, -0.0012831687927246094, -0.0006999969482421875, -0.00011682510375976562, 0.00046634674072265625, 0.0010495185852050781, 0.0016326904296875, 0.002215862274169922, 0.0027990341186523438, 0.0033822059631347656, 0.0039653778076171875, 0.004548549652099609, 0.005131721496582031, 0.005714893341064453, 0.006298065185546875, 0.006881237030029297, 0.007464408874511719, 0.00804758071899414, 0.008630752563476562, 0.009213924407958984, 0.009797096252441406, 0.010380268096923828, 0.01096343994140625, 0.011546611785888672, 0.012129783630371094, 0.012712955474853516, 0.013296127319335938, 0.01387929916381836, 0.014462471008300781, 0.015045642852783203, 0.015628814697265625, 0.016211986541748047, 0.01679515838623047, 0.01737833023071289, 0.017961502075195312, 0.018544673919677734, 0.019127845764160156, 0.019711017608642578, 0.020294189453125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 22.0, 491.0, 475.0, 22.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011437686625868082, -0.0010979968355968595, -0.0010522250086069107, -0.0010064532980322838, -0.000960681471042335, -0.0009149096440523863, -0.0008691378170624375, -0.0008233659900724888, -0.000777594221290201, -0.0007318223943002522, -0.0006860506255179644, -0.0006402787985280156, -0.0005945069715380669, -0.000548735202755779, -0.0005029633757658303, -0.000457191577879712, -0.0004114197799935937, -0.0003656479821074754, -0.0003198761842213571, -0.00027410435723140836, -0.00022833255934529006, -0.00018256076145917177, -0.00013678893446922302, -9.101713658310473e-05, -4.524533869698644e-05, 5.264664650894701e-07, 4.629827162716538e-05, 9.20700840651989e-05, 0.0001378418819513172, 0.00018361367983743548, 0.00022938550682738423, 0.0002751573047135025, 0.00032092921901494265, 0.00036670101690106094, 0.00041247281478717923, 0.000458244641777128, 0.0005040164105594158, 0.0005497882375493646, 0.0005955600645393133, 0.0006413318915292621, 0.0006871036603115499, 0.0007328754873014987, 0.0007786472560837865, 0.0008244190830737352, 0.000870190910063684, 0.0009159626788459718, 0.0009617345058359206, 0.0010075062746182084, 0.0010532781016081572, 0.001099049928598106, 0.0011448217555880547, 0.0011905934661626816, 0.0012363652931526303, 0.001282137120142579, 0.0013279089471325278, 0.0013736807741224766, 0.0014194524846971035, 0.0014652243116870522, 0.001510996138677001, 0.001556767849251628, 0.0016025396762415767, 0.0016483115032315254, 0.0016940833302214742, 0.001739855157211423, 0.0017856269842013717]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 10.0, 7.0, 12.0, 15.0, 24.0, 17.0, 19.0, 28.0, 26.0, 32.0, 51.0, 30.0, 46.0, 44.0, 52.0, 56.0, 49.0, 64.0, 60.0, 47.0, 46.0, 42.0, 38.0, 35.0, 22.0, 24.0, 26.0, 19.0, 12.0, 10.0, 13.0, 8.0, 7.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004139542579650879, -0.0004001632332801819, -0.0003863722085952759, -0.0003725811839103699, -0.00035879015922546387, -0.00034499913454055786, -0.00033120810985565186, -0.00031741708517074585, -0.00030362606048583984, -0.00028983503580093384, -0.00027604401111602783, -0.0002622529864311218, -0.0002484619617462158, -0.00023467093706130981, -0.0002208799123764038, -0.0002070888876914978, -0.0001932978630065918, -0.0001795068383216858, -0.00016571581363677979, -0.00015192478895187378, -0.00013813376426696777, -0.00012434273958206177, -0.00011055171489715576, -9.676069021224976e-05, -8.296966552734375e-05, -6.917864084243774e-05, -5.538761615753174e-05, -4.159659147262573e-05, -2.7805566787719727e-05, -1.401454210281372e-05, -2.2351741790771484e-07, 1.3567507266998291e-05, 2.7358531951904297e-05, 4.11495566368103e-05, 5.494058132171631e-05, 6.873160600662231e-05, 8.252263069152832e-05, 9.631365537643433e-05, 0.00011010468006134033, 0.00012389570474624634, 0.00013768672943115234, 0.00015147775411605835, 0.00016526877880096436, 0.00017905980348587036, 0.00019285082817077637, 0.00020664185285568237, 0.00022043287754058838, 0.00023422390222549438, 0.0002480149269104004, 0.0002618059515953064, 0.0002755969762802124, 0.0002893880009651184, 0.0003031790256500244, 0.0003169700503349304, 0.0003307610750198364, 0.00034455209970474243, 0.00035834312438964844, 0.00037213414907455444, 0.00038592517375946045, 0.00039971619844436646, 0.00041350722312927246, 0.00042729824781417847, 0.00044108927249908447, 0.0004548802971839905, 0.0004686713218688965]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 11.0, 10.0, 12.0, 15.0, 15.0, 16.0, 24.0, 23.0, 23.0, 30.0, 27.0, 29.0, 37.0, 31.0, 36.0, 52.0, 45.0, 50.0, 33.0, 41.0, 45.0, 39.0, 28.0, 37.0, 39.0, 33.0, 30.0, 24.0, 23.0, 15.0, 19.0, 14.0, 16.0, 10.0, 8.0, 20.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.44921875, -4.3258056640625, -4.202392578125, -4.0789794921875, -3.95556640625, -3.8321533203125, -3.708740234375, -3.5853271484375, -3.4619140625, -3.3385009765625, -3.215087890625, -3.0916748046875, -2.96826171875, -2.8448486328125, -2.721435546875, -2.5980224609375, -2.474609375, -2.3511962890625, -2.227783203125, -2.1043701171875, -1.98095703125, -1.8575439453125, -1.734130859375, -1.6107177734375, -1.4873046875, -1.3638916015625, -1.240478515625, -1.1170654296875, -0.99365234375, -0.8702392578125, -0.746826171875, -0.6234130859375, -0.5, -0.3765869140625, -0.253173828125, -0.1297607421875, -0.00634765625, 0.1170654296875, 0.240478515625, 0.3638916015625, 0.4873046875, 0.6107177734375, 0.734130859375, 0.8575439453125, 0.98095703125, 1.1043701171875, 1.227783203125, 1.3511962890625, 1.474609375, 1.5980224609375, 1.721435546875, 1.8448486328125, 1.96826171875, 2.0916748046875, 2.215087890625, 2.3385009765625, 2.4619140625, 2.5853271484375, 2.708740234375, 2.8321533203125, 2.95556640625, 3.0789794921875, 3.202392578125, 3.3258056640625, 3.44921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 0.0, 6.0, 6.0, 4.0, 15.0, 12.0, 21.0, 26.0, 31.0, 42.0, 52.0, 77.0, 98.0, 127.0, 178.0, 224.0, 295.0, 438.0, 588.0, 731.0, 1106.0, 1519.0, 2284.0, 3523.0, 5911.0, 11831.0, 37362.0, 816093.0, 126570.0, 17726.0, 7965.0, 4360.0, 2768.0, 1859.0, 1272.0, 900.0, 657.0, 478.0, 363.0, 270.0, 180.0, 159.0, 111.0, 74.0, 60.0, 44.0, 42.0, 25.0, 29.0, 12.0, 13.0, 10.0, 7.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-26.25, -25.422607421875, -24.59521484375, -23.767822265625, -22.9404296875, -22.113037109375, -21.28564453125, -20.458251953125, -19.630859375, -18.803466796875, -17.97607421875, -17.148681640625, -16.3212890625, -15.493896484375, -14.66650390625, -13.839111328125, -13.01171875, -12.184326171875, -11.35693359375, -10.529541015625, -9.7021484375, -8.874755859375, -8.04736328125, -7.219970703125, -6.392578125, -5.565185546875, -4.73779296875, -3.910400390625, -3.0830078125, -2.255615234375, -1.42822265625, -0.600830078125, 0.2265625, 1.053955078125, 1.88134765625, 2.708740234375, 3.5361328125, 4.363525390625, 5.19091796875, 6.018310546875, 6.845703125, 7.673095703125, 8.50048828125, 9.327880859375, 10.1552734375, 10.982666015625, 11.81005859375, 12.637451171875, 13.46484375, 14.292236328125, 15.11962890625, 15.947021484375, 16.7744140625, 17.601806640625, 18.42919921875, 19.256591796875, 20.083984375, 20.911376953125, 21.73876953125, 22.566162109375, 23.3935546875, 24.220947265625, 25.04833984375, 25.875732421875, 26.703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 6.0, 9.0, 10.0, 17.0, 13.0, 24.0, 21.0, 26.0, 29.0, 32.0, 25.0, 30.0, 41.0, 38.0, 42.0, 47.0, 76.0, 204.0, 1655.0, 221.0, 80.0, 45.0, 44.0, 39.0, 32.0, 35.0, 33.0, 26.0, 27.0, 14.0, 19.0, 18.0, 14.0, 13.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6328125, -11.2386474609375, -10.844482421875, -10.4503173828125, -10.05615234375, -9.6619873046875, -9.267822265625, -8.8736572265625, -8.4794921875, -8.0853271484375, -7.691162109375, -7.2969970703125, -6.90283203125, -6.5086669921875, -6.114501953125, -5.7203369140625, -5.326171875, -4.9320068359375, -4.537841796875, -4.1436767578125, -3.74951171875, -3.3553466796875, -2.961181640625, -2.5670166015625, -2.1728515625, -1.7786865234375, -1.384521484375, -0.9903564453125, -0.59619140625, -0.2020263671875, 0.192138671875, 0.5863037109375, 0.98046875, 1.3746337890625, 1.768798828125, 2.1629638671875, 2.55712890625, 2.9512939453125, 3.345458984375, 3.7396240234375, 4.1337890625, 4.5279541015625, 4.922119140625, 5.3162841796875, 5.71044921875, 6.1046142578125, 6.498779296875, 6.8929443359375, 7.287109375, 7.6812744140625, 8.075439453125, 8.4696044921875, 8.86376953125, 9.2579345703125, 9.652099609375, 10.0462646484375, 10.4404296875, 10.8345947265625, 11.228759765625, 11.6229248046875, 12.01708984375, 12.4112548828125, 12.805419921875, 13.1995849609375, 13.59375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 12.0, 15.0, 22.0, 20.0, 24.0, 26.0, 31.0, 34.0, 38.0, 45.0, 77.0, 149.0, 415.0, 1683.0, 2897714.0, 243207.0, 1294.0, 342.0, 123.0, 74.0, 52.0, 49.0, 30.0, 30.0, 25.0, 26.0, 21.0, 20.0, 18.0, 18.0, 11.0, 9.0, 8.0, 3.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-61.75, -59.9287109375, -58.107421875, -56.2861328125, -54.46484375, -52.6435546875, -50.822265625, -49.0009765625, -47.1796875, -45.3583984375, -43.537109375, -41.7158203125, -39.89453125, -38.0732421875, -36.251953125, -34.4306640625, -32.609375, -30.7880859375, -28.966796875, -27.1455078125, -25.32421875, -23.5029296875, -21.681640625, -19.8603515625, -18.0390625, -16.2177734375, -14.396484375, -12.5751953125, -10.75390625, -8.9326171875, -7.111328125, -5.2900390625, -3.46875, -1.6474609375, 0.173828125, 1.9951171875, 3.81640625, 5.6376953125, 7.458984375, 9.2802734375, 11.1015625, 12.9228515625, 14.744140625, 16.5654296875, 18.38671875, 20.2080078125, 22.029296875, 23.8505859375, 25.671875, 27.4931640625, 29.314453125, 31.1357421875, 32.95703125, 34.7783203125, 36.599609375, 38.4208984375, 40.2421875, 42.0634765625, 43.884765625, 45.7060546875, 47.52734375, 49.3486328125, 51.169921875, 52.9912109375, 54.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1013.0, 4.0, 0.0, 2.0, 1.0], "bins": [-919.3739624023438, -903.9884033203125, -888.6028442382812, -873.2173461914062, -857.831787109375, -842.4462280273438, -827.0606689453125, -811.6751708984375, -796.2896118164062, -780.904052734375, -765.5184936523438, -750.1329956054688, -734.7474365234375, -719.3618774414062, -703.976318359375, -688.5908203125, -673.2052612304688, -657.8197021484375, -642.4341430664062, -627.0486450195312, -611.6630859375, -596.2775268554688, -580.8919677734375, -565.5064697265625, -550.1209106445312, -534.7353515625, -519.3497924804688, -503.9642639160156, -488.5787353515625, -473.19317626953125, -457.8076477050781, -442.4220886230469, -427.0365295410156, -411.6509704589844, -396.26544189453125, -380.8798828125, -365.4943542480469, -350.1087951660156, -334.7232666015625, -319.33770751953125, -303.9521789550781, -288.5666198730469, -273.18109130859375, -257.7955322265625, -242.41000366210938, -227.02444458007812, -211.638916015625, -196.25335693359375, -180.86782836914062, -165.48228454589844, -150.09674072265625, -134.71119689941406, -119.32565307617188, -103.94010162353516, -88.55455780029297, -73.16901397705078, -57.78346252441406, -42.397918701171875, -27.012372970581055, -11.626827239990234, 3.758716583251953, 19.144264221191406, 34.529808044433594, 49.91535186767578, 65.30089569091797]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 16.0, 8.0, 7.0, 13.0, 12.0, 10.0, 21.0, 19.0, 24.0, 25.0, 26.0, 26.0, 24.0, 40.0, 30.0, 41.0, 33.0, 28.0, 41.0, 45.0, 36.0, 30.0, 48.0, 34.0, 35.0, 37.0, 19.0, 33.0, 22.0, 32.0, 23.0, 20.0, 25.0, 22.0, 12.0, 9.0, 19.0, 13.0, 5.0, 9.0, 7.0, 7.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.865394592285156, -40.73388671875, -39.602378845214844, -38.47086715698242, -37.339359283447266, -36.20785140991211, -35.07633972167969, -33.94483184814453, -32.813323974609375, -31.68181610107422, -30.55030632019043, -29.41879653930664, -28.287288665771484, -27.155780792236328, -26.02427101135254, -24.89276123046875, -23.761253356933594, -22.629745483398438, -21.49823570251465, -20.36672592163086, -19.235218048095703, -18.103710174560547, -16.972200393676758, -15.840691566467285, -14.709182739257812, -13.57767391204834, -12.446165084838867, -11.314656257629395, -10.183147430419922, -9.05163860321045, -7.920129776000977, -6.788620948791504, -5.657112121582031, -4.525603294372559, -3.394094467163086, -2.2625856399536133, -1.1310768127441406, 0.00043201446533203125, 1.1319408416748047, 2.2634496688842773, 3.39495849609375, 4.526467323303223, 5.657976150512695, 6.789484977722168, 7.920993804931641, 9.052502632141113, 10.184011459350586, 11.315520286560059, 12.447029113769531, 13.578537940979004, 14.710046768188477, 15.84155559539795, 16.973064422607422, 18.104572296142578, 19.236082077026367, 20.367591857910156, 21.499099731445312, 22.63060760498047, 23.762117385864258, 24.893627166748047, 26.025135040283203, 27.15664291381836, 28.28815269470215, 29.419662475585938, 30.551170349121094]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 6.0, 11.0, 10.0, 14.0, 13.0, 12.0, 14.0, 26.0, 25.0, 23.0, 27.0, 24.0, 35.0, 34.0, 29.0, 40.0, 45.0, 47.0, 39.0, 50.0, 50.0, 39.0, 32.0, 29.0, 47.0, 33.0, 39.0, 22.0, 27.0, 18.0, 22.0, 18.0, 15.0, 17.0, 13.0, 9.0, 10.0, 12.0, 7.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.74609375, -4.6148681640625, -4.483642578125, -4.3524169921875, -4.22119140625, -4.0899658203125, -3.958740234375, -3.8275146484375, -3.6962890625, -3.5650634765625, -3.433837890625, -3.3026123046875, -3.17138671875, -3.0401611328125, -2.908935546875, -2.7777099609375, -2.646484375, -2.5152587890625, -2.384033203125, -2.2528076171875, -2.12158203125, -1.9903564453125, -1.859130859375, -1.7279052734375, -1.5966796875, -1.4654541015625, -1.334228515625, -1.2030029296875, -1.07177734375, -0.9405517578125, -0.809326171875, -0.6781005859375, -0.546875, -0.4156494140625, -0.284423828125, -0.1531982421875, -0.02197265625, 0.1092529296875, 0.240478515625, 0.3717041015625, 0.5029296875, 0.6341552734375, 0.765380859375, 0.8966064453125, 1.02783203125, 1.1590576171875, 1.290283203125, 1.4215087890625, 1.552734375, 1.6839599609375, 1.815185546875, 1.9464111328125, 2.07763671875, 2.2088623046875, 2.340087890625, 2.4713134765625, 2.6025390625, 2.7337646484375, 2.864990234375, 2.9962158203125, 3.12744140625, 3.2586669921875, 3.389892578125, 3.5211181640625, 3.65234375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 6.0, 10.0, 10.0, 11.0, 15.0, 18.0, 32.0, 48.0, 60.0, 86.0, 128.0, 215.0, 310.0, 558.0, 1065.0, 1905.0, 3922.0, 8387.0, 21535.0, 89816.0, 2610630.0, 1363771.0, 60730.0, 16873.0, 6986.0, 3329.0, 1673.0, 873.0, 492.0, 251.0, 150.0, 107.0, 77.0, 51.0, 45.0, 23.0, 14.0, 11.0, 9.0, 8.0, 10.0, 6.0, 11.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-28.25, -27.4404296875, -26.630859375, -25.8212890625, -25.01171875, -24.2021484375, -23.392578125, -22.5830078125, -21.7734375, -20.9638671875, -20.154296875, -19.3447265625, -18.53515625, -17.7255859375, -16.916015625, -16.1064453125, -15.296875, -14.4873046875, -13.677734375, -12.8681640625, -12.05859375, -11.2490234375, -10.439453125, -9.6298828125, -8.8203125, -8.0107421875, -7.201171875, -6.3916015625, -5.58203125, -4.7724609375, -3.962890625, -3.1533203125, -2.34375, -1.5341796875, -0.724609375, 0.0849609375, 0.89453125, 1.7041015625, 2.513671875, 3.3232421875, 4.1328125, 4.9423828125, 5.751953125, 6.5615234375, 7.37109375, 8.1806640625, 8.990234375, 9.7998046875, 10.609375, 11.4189453125, 12.228515625, 13.0380859375, 13.84765625, 14.6572265625, 15.466796875, 16.2763671875, 17.0859375, 17.8955078125, 18.705078125, 19.5146484375, 20.32421875, 21.1337890625, 21.943359375, 22.7529296875, 23.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 5.0, 2.0, 6.0, 13.0, 14.0, 23.0, 35.0, 37.0, 50.0, 72.0, 97.0, 166.0, 240.0, 372.0, 582.0, 698.0, 587.0, 400.0, 229.0, 142.0, 100.0, 70.0, 37.0, 27.0, 23.0, 18.0, 13.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.814453125, -23.03515625, -22.255859375, -21.4765625, -20.697265625, -19.91796875, -19.138671875, -18.359375, -17.580078125, -16.80078125, -16.021484375, -15.2421875, -14.462890625, -13.68359375, -12.904296875, -12.125, -11.345703125, -10.56640625, -9.787109375, -9.0078125, -8.228515625, -7.44921875, -6.669921875, -5.890625, -5.111328125, -4.33203125, -3.552734375, -2.7734375, -1.994140625, -1.21484375, -0.435546875, 0.34375, 1.123046875, 1.90234375, 2.681640625, 3.4609375, 4.240234375, 5.01953125, 5.798828125, 6.578125, 7.357421875, 8.13671875, 8.916015625, 9.6953125, 10.474609375, 11.25390625, 12.033203125, 12.8125, 13.591796875, 14.37109375, 15.150390625, 15.9296875, 16.708984375, 17.48828125, 18.267578125, 19.046875, 19.826171875, 20.60546875, 21.384765625, 22.1640625, 22.943359375, 23.72265625, 24.501953125, 25.28125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 6.0, 7.0, 18.0, 15.0, 29.0, 39.0, 62.0, 102.0, 166.0, 315.0, 813.0, 48934.0, 4140416.0, 2087.0, 506.0, 283.0, 158.0, 108.0, 69.0, 43.0, 34.0, 22.0, 20.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.625, -134.455078125, -130.28515625, -126.115234375, -121.9453125, -117.775390625, -113.60546875, -109.435546875, -105.265625, -101.095703125, -96.92578125, -92.755859375, -88.5859375, -84.416015625, -80.24609375, -76.076171875, -71.90625, -67.736328125, -63.56640625, -59.396484375, -55.2265625, -51.056640625, -46.88671875, -42.716796875, -38.546875, -34.376953125, -30.20703125, -26.037109375, -21.8671875, -17.697265625, -13.52734375, -9.357421875, -5.1875, -1.017578125, 3.15234375, 7.322265625, 11.4921875, 15.662109375, 19.83203125, 24.001953125, 28.171875, 32.341796875, 36.51171875, 40.681640625, 44.8515625, 49.021484375, 53.19140625, 57.361328125, 61.53125, 65.701171875, 69.87109375, 74.041015625, 78.2109375, 82.380859375, 86.55078125, 90.720703125, 94.890625, 99.060546875, 103.23046875, 107.400390625, 111.5703125, 115.740234375, 119.91015625, 124.080078125, 128.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 57.0, 621.0, 325.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-439.4454650878906, -431.275390625, -423.1053466796875, -414.9352722167969, -406.7652282714844, -398.59515380859375, -390.42510986328125, -382.2550354003906, -374.0849609375, -365.9148864746094, -357.7448425292969, -349.57476806640625, -341.40472412109375, -333.2346496582031, -325.0646057128906, -316.89453125, -308.7244873046875, -300.5544128417969, -292.3843688964844, -284.21429443359375, -276.04425048828125, -267.8741760253906, -259.7041320800781, -251.5340576171875, -243.36399841308594, -235.19393920898438, -227.0238800048828, -218.85382080078125, -210.68374633789062, -202.51370239257812, -194.3436279296875, -186.17356872558594, -178.0034942626953, -169.83343505859375, -161.6633758544922, -153.49331665039062, -145.3232421875, -137.1531982421875, -128.98312377929688, -120.81306457519531, -112.64300537109375, -104.47294616699219, -96.30288696289062, -88.13282012939453, -79.96276092529297, -71.7927017211914, -63.62263870239258, -55.45257568359375, -47.28251647949219, -39.112457275390625, -30.942394256591797, -22.7723331451416, -14.602272033691406, -6.432212829589844, 1.7378501892089844, 9.907913208007812, 18.077972412109375, 26.24803352355957, 34.418094635009766, 42.588157653808594, 50.758216857910156, 58.92827606201172, 67.09834289550781, 75.26840209960938, 83.43846130371094]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 5.0, 2.0, 3.0, 12.0, 6.0, 9.0, 22.0, 18.0, 20.0, 22.0, 18.0, 32.0, 29.0, 25.0, 33.0, 21.0, 36.0, 40.0, 38.0, 37.0, 37.0, 49.0, 44.0, 50.0, 35.0, 37.0, 39.0, 33.0, 34.0, 23.0, 33.0, 15.0, 21.0, 23.0, 17.0, 24.0, 8.0, 10.0, 11.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.48123168945312, -74.95472717285156, -72.42822265625, -69.90171813964844, -67.3752212524414, -64.84871673583984, -62.32221221923828, -59.79570770263672, -57.269203186035156, -54.742698669433594, -52.2161979675293, -49.689693450927734, -47.16318893432617, -44.636688232421875, -42.11018371582031, -39.58367919921875, -37.05717849731445, -34.53067398071289, -32.004173278808594, -29.47766876220703, -26.95116424560547, -24.42466163635254, -21.89815902709961, -19.371654510498047, -16.845151901245117, -14.318648338317871, -11.792144775390625, -9.265642166137695, -6.739138603210449, -4.212635040283203, -1.6861324310302734, 0.8403720855712891, 3.3668746948242188, 5.893378257751465, 8.419881820678711, 10.94638442993164, 13.472887992858887, 15.999391555786133, 18.525894165039062, 21.052398681640625, 23.578901290893555, 26.105403900146484, 28.631908416748047, 31.158411026000977, 33.684913635253906, 36.21141815185547, 38.73792266845703, 41.264427185058594, 43.79092788696289, 46.31743240356445, 48.84393310546875, 51.37043762207031, 53.896942138671875, 56.42344665527344, 58.949947357177734, 61.4764518737793, 64.0029525756836, 66.52945709228516, 69.05596160888672, 71.58245849609375, 74.10896301269531, 76.63546752929688, 79.16197204589844, 81.6884765625, 84.21498107910156]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 25.0, 12.0, 15.0, 20.0, 21.0, 20.0, 31.0, 30.0, 34.0, 30.0, 26.0, 35.0, 39.0, 41.0, 41.0, 41.0, 46.0, 37.0, 31.0, 40.0, 35.0, 34.0, 47.0, 31.0, 27.0, 21.0, 22.0, 21.0, 14.0, 18.0, 13.0, 17.0, 6.0, 9.0, 6.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.546875, -4.41815185546875, -4.2894287109375, -4.16070556640625, -4.031982421875, -3.90325927734375, -3.7745361328125, -3.64581298828125, -3.51708984375, -3.38836669921875, -3.2596435546875, -3.13092041015625, -3.002197265625, -2.87347412109375, -2.7447509765625, -2.61602783203125, -2.4873046875, -2.35858154296875, -2.2298583984375, -2.10113525390625, -1.972412109375, -1.84368896484375, -1.7149658203125, -1.58624267578125, -1.45751953125, -1.32879638671875, -1.2000732421875, -1.07135009765625, -0.942626953125, -0.81390380859375, -0.6851806640625, -0.55645751953125, -0.427734375, -0.29901123046875, -0.1702880859375, -0.04156494140625, 0.087158203125, 0.21588134765625, 0.3446044921875, 0.47332763671875, 0.60205078125, 0.73077392578125, 0.8594970703125, 0.98822021484375, 1.116943359375, 1.24566650390625, 1.3743896484375, 1.50311279296875, 1.6318359375, 1.76055908203125, 1.8892822265625, 2.01800537109375, 2.146728515625, 2.27545166015625, 2.4041748046875, 2.53289794921875, 2.66162109375, 2.79034423828125, 2.9190673828125, 3.04779052734375, 3.176513671875, 3.30523681640625, 3.4339599609375, 3.56268310546875, 3.69140625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 7.0, 21.0, 24.0, 37.0, 53.0, 88.0, 144.0, 181.0, 319.0, 397.0, 692.0, 1083.0, 1566.0, 2501.0, 3705.0, 5812.0, 9114.0, 13650.0, 21259.0, 33058.0, 51968.0, 83724.0, 141470.0, 234639.0, 171736.0, 100676.0, 61439.0, 38688.0, 24831.0, 15927.0, 10349.0, 6741.0, 4387.0, 2834.0, 1912.0, 1189.0, 774.0, 555.0, 315.0, 247.0, 149.0, 111.0, 61.0, 40.0, 27.0, 20.0, 7.0, 17.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61962890625, -0.600067138671875, -0.58050537109375, -0.560943603515625, -0.5413818359375, -0.521820068359375, -0.50225830078125, -0.482696533203125, -0.463134765625, -0.443572998046875, -0.42401123046875, -0.404449462890625, -0.3848876953125, -0.365325927734375, -0.34576416015625, -0.326202392578125, -0.306640625, -0.287078857421875, -0.26751708984375, -0.247955322265625, -0.2283935546875, -0.208831787109375, -0.18927001953125, -0.169708251953125, -0.150146484375, -0.130584716796875, -0.11102294921875, -0.091461181640625, -0.0718994140625, -0.052337646484375, -0.03277587890625, -0.013214111328125, 0.00634765625, 0.025909423828125, 0.04547119140625, 0.065032958984375, 0.0845947265625, 0.104156494140625, 0.12371826171875, 0.143280029296875, 0.162841796875, 0.182403564453125, 0.20196533203125, 0.221527099609375, 0.2410888671875, 0.260650634765625, 0.28021240234375, 0.299774169921875, 0.3193359375, 0.338897705078125, 0.35845947265625, 0.378021240234375, 0.3975830078125, 0.417144775390625, 0.43670654296875, 0.456268310546875, 0.475830078125, 0.495391845703125, 0.51495361328125, 0.534515380859375, 0.5540771484375, 0.573638916015625, 0.59320068359375, 0.612762451171875, 0.63232421875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 1.0, 1.0, 1.0, 5.0, 4.0, 8.0, 6.0, 10.0, 12.0, 7.0, 15.0, 15.0, 23.0, 14.0, 17.0, 30.0, 39.0, 27.0, 31.0, 35.0, 29.0, 41.0, 40.0, 33.0, 26.0, 1061.0, 36.0, 28.0, 26.0, 40.0, 37.0, 27.0, 34.0, 23.0, 35.0, 28.0, 33.0, 17.0, 12.0, 22.0, 13.0, 10.0, 14.0, 15.0, 7.0, 8.0, 4.0, 9.0, 1.0, 7.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.427734375, -2.351715087890625, -2.27569580078125, -2.199676513671875, -2.1236572265625, -2.047637939453125, -1.97161865234375, -1.895599365234375, -1.819580078125, -1.743560791015625, -1.66754150390625, -1.591522216796875, -1.5155029296875, -1.439483642578125, -1.36346435546875, -1.287445068359375, -1.21142578125, -1.135406494140625, -1.05938720703125, -0.983367919921875, -0.9073486328125, -0.831329345703125, -0.75531005859375, -0.679290771484375, -0.603271484375, -0.527252197265625, -0.45123291015625, -0.375213623046875, -0.2991943359375, -0.223175048828125, -0.14715576171875, -0.071136474609375, 0.0048828125, 0.080902099609375, 0.15692138671875, 0.232940673828125, 0.3089599609375, 0.384979248046875, 0.46099853515625, 0.537017822265625, 0.613037109375, 0.689056396484375, 0.76507568359375, 0.841094970703125, 0.9171142578125, 0.993133544921875, 1.06915283203125, 1.145172119140625, 1.22119140625, 1.297210693359375, 1.37322998046875, 1.449249267578125, 1.5252685546875, 1.601287841796875, 1.67730712890625, 1.753326416015625, 1.829345703125, 1.905364990234375, 1.98138427734375, 2.057403564453125, 2.1334228515625, 2.209442138671875, 2.28546142578125, 2.361480712890625, 2.4375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 8.0, 14.0, 22.0, 33.0, 58.0, 79.0, 108.0, 141.0, 244.0, 304.0, 474.0, 621.0, 959.0, 1414.0, 2004.0, 3005.0, 4442.0, 6431.0, 9726.0, 15061.0, 23695.0, 37501.0, 61461.0, 102666.0, 171980.0, 1276914.0, 145864.0, 87129.0, 52612.0, 32062.0, 20406.0, 13155.0, 8525.0, 5773.0, 3885.0, 2691.0, 1747.0, 1210.0, 843.0, 582.0, 405.0, 266.0, 169.0, 146.0, 90.0, 75.0, 54.0, 31.0, 22.0, 12.0, 11.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.48720550537109375, -0.4700164794921875, -0.45282745361328125, -0.435638427734375, -0.41844940185546875, -0.4012603759765625, -0.38407135009765625, -0.36688232421875, -0.34969329833984375, -0.3325042724609375, -0.31531524658203125, -0.298126220703125, -0.28093719482421875, -0.2637481689453125, -0.24655914306640625, -0.2293701171875, -0.21218109130859375, -0.1949920654296875, -0.17780303955078125, -0.160614013671875, -0.14342498779296875, -0.1262359619140625, -0.10904693603515625, -0.09185791015625, -0.07466888427734375, -0.0574798583984375, -0.04029083251953125, -0.023101806640625, -0.00591278076171875, 0.0112762451171875, 0.02846527099609375, 0.045654296875, 0.06284332275390625, 0.0800323486328125, 0.09722137451171875, 0.114410400390625, 0.13159942626953125, 0.1487884521484375, 0.16597747802734375, 0.18316650390625, 0.20035552978515625, 0.2175445556640625, 0.23473358154296875, 0.251922607421875, 0.26911163330078125, 0.2863006591796875, 0.30348968505859375, 0.3206787109375, 0.33786773681640625, 0.3550567626953125, 0.37224578857421875, 0.389434814453125, 0.40662384033203125, 0.4238128662109375, 0.44100189208984375, 0.45819091796875, 0.47537994384765625, 0.4925689697265625, 0.5097579956054688, 0.526947021484375, 0.5441360473632812, 0.5613250732421875, 0.5785140991210938, 0.595703125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 4.0, 4.0, 5.0, 7.0, 5.0, 10.0, 12.0, 10.0, 16.0, 15.0, 19.0, 18.0, 28.0, 32.0, 50.0, 56.0, 67.0, 71.0, 106.0, 92.0, 80.0, 51.0, 57.0, 39.0, 32.0, 25.0, 15.0, 11.0, 10.0, 8.0, 15.0, 9.0, 7.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0010843276977539062, -0.0010530203580856323, -0.0010217130184173584, -0.0009904056787490845, -0.0009590983390808105, -0.0009277909994125366, -0.0008964836597442627, -0.0008651763200759888, -0.0008338689804077148, -0.0008025616407394409, -0.000771254301071167, -0.0007399469614028931, -0.0007086396217346191, -0.0006773322820663452, -0.0006460249423980713, -0.0006147176027297974, -0.0005834102630615234, -0.0005521029233932495, -0.0005207955837249756, -0.0004894882440567017, -0.00045818090438842773, -0.0004268735647201538, -0.0003955662250518799, -0.00036425888538360596, -0.00033295154571533203, -0.0003016442060470581, -0.0002703368663787842, -0.00023902952671051025, -0.00020772218704223633, -0.0001764148473739624, -0.00014510750770568848, -0.00011380016803741455, -8.249282836914062e-05, -5.11854887008667e-05, -1.9878149032592773e-05, 1.1429190635681152e-05, 4.273653030395508e-05, 7.4043869972229e-05, 0.00010535120964050293, 0.00013665854930877686, 0.00016796588897705078, 0.0001992732286453247, 0.00023058056831359863, 0.00026188790798187256, 0.0002931952476501465, 0.0003245025873184204, 0.00035580992698669434, 0.00038711726665496826, 0.0004184246063232422, 0.0004497319459915161, 0.00048103928565979004, 0.000512346625328064, 0.0005436539649963379, 0.0005749613046646118, 0.0006062686443328857, 0.0006375759840011597, 0.0006688833236694336, 0.0007001906633377075, 0.0007314980030059814, 0.0007628053426742554, 0.0007941126823425293, 0.0008254200220108032, 0.0008567273616790771, 0.0008880347013473511, 0.000919342041015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 11.0, 10.0, 14.0, 16.0, 14.0, 25.0, 38.0, 50.0, 78.0, 90.0, 127.0, 236.0, 667.0, 603967.0, 441786.0, 650.0, 254.0, 149.0, 83.0, 67.0, 38.0, 31.0, 21.0, 19.0, 18.0, 9.0, 13.0, 9.0, 10.0, 8.0, 5.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025115966796875, -0.02435469627380371, -0.023593425750732422, -0.022832155227661133, -0.022070884704589844, -0.021309614181518555, -0.020548343658447266, -0.019787073135375977, -0.019025802612304688, -0.0182645320892334, -0.01750326156616211, -0.01674199104309082, -0.01598072052001953, -0.015219449996948242, -0.014458179473876953, -0.013696908950805664, -0.012935638427734375, -0.012174367904663086, -0.011413097381591797, -0.010651826858520508, -0.009890556335449219, -0.00912928581237793, -0.00836801528930664, -0.0076067447662353516, -0.0068454742431640625, -0.0060842037200927734, -0.005322933197021484, -0.004561662673950195, -0.0038003921508789062, -0.003039121627807617, -0.002277851104736328, -0.001516580581665039, -0.00075531005859375, 5.9604644775390625e-06, 0.0007672309875488281, 0.0015285015106201172, 0.0022897720336914062, 0.0030510425567626953, 0.0038123130798339844, 0.0045735836029052734, 0.0053348541259765625, 0.0060961246490478516, 0.006857395172119141, 0.00761866569519043, 0.008379936218261719, 0.009141206741333008, 0.009902477264404297, 0.010663747787475586, 0.011425018310546875, 0.012186288833618164, 0.012947559356689453, 0.013708829879760742, 0.014470100402832031, 0.01523137092590332, 0.01599264144897461, 0.0167539119720459, 0.017515182495117188, 0.018276453018188477, 0.019037723541259766, 0.019798994064331055, 0.020560264587402344, 0.021321535110473633, 0.022082805633544922, 0.02284407615661621, 0.0236053466796875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 372.0, 641.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001021572737954557, -0.0009201943757943809, -0.0008188160718418658, -0.0007174377096816897, -0.0006160594057291746, -0.0005146810435689986, -0.00041330268140882254, -0.0003119243774563074, -0.00021054601529613137, -0.00010916767496382818, -7.78933463152498e-06, 9.358901297673583e-05, 0.0001949673460330814, 0.000296345679089427, 0.00039772404124960303, 0.0004991023452021182, 0.0006004807073622942, 0.0007018590695224702, 0.0008032373734749854, 0.0009046157356351614, 0.0010059940395876765, 0.0011073723435401917, 0.0012087507639080286, 0.0013101290678605437, 0.0014115073718130589, 0.001512885675765574, 0.001614264096133411, 0.001715642400085926, 0.0018170207040384412, 0.0019183990079909563, 0.0020197774283587933, 0.0021211556158959866, 0.0022225340362638235, 0.0023239124566316605, 0.0024252906441688538, 0.0025266690645366907, 0.0026280474849045277, 0.002729425672441721, 0.002830804092809558, 0.002932182513177395, 0.003033560700714588, 0.003134939121082425, 0.0032363173086196184, 0.0033376957289874554, 0.0034390741493552923, 0.0035404523368924856, 0.0036418307572603226, 0.003743208944797516, 0.0038445875979959965, 0.00394596578553319, 0.00404734443873167, 0.004148722626268864, 0.004250100813806057, 0.004351479467004538, 0.004452857654541731, 0.004554235842078924, 0.0046556140296161175, 0.004756992217153311, 0.004858370870351791, 0.004959749057888985, 0.005061127245426178, 0.005162505898624659, 0.005263884086161852, 0.005365262273699045, 0.005466640926897526]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 6.0, 7.0, 9.0, 16.0, 15.0, 22.0, 14.0, 19.0, 24.0, 23.0, 32.0, 43.0, 31.0, 36.0, 45.0, 40.0, 37.0, 41.0, 44.0, 39.0, 43.0, 46.0, 43.0, 44.0, 29.0, 31.0, 33.0, 25.0, 24.0, 23.0, 24.0, 10.0, 20.0, 14.0, 10.0, 10.0, 9.0, 5.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045174360275268555, -0.00043627992272377014, -0.00042081624269485474, -0.00040535256266593933, -0.0003898888826370239, -0.0003744252026081085, -0.0003589615225791931, -0.0003434978425502777, -0.0003280341625213623, -0.0003125704824924469, -0.0002971068024635315, -0.0002816431224346161, -0.0002661794424057007, -0.0002507157623767853, -0.00023525208234786987, -0.00021978840231895447, -0.00020432472229003906, -0.00018886104226112366, -0.00017339736223220825, -0.00015793368220329285, -0.00014247000217437744, -0.00012700632214546204, -0.00011154264211654663, -9.607896208763123e-05, -8.061528205871582e-05, -6.515160202980042e-05, -4.968792200088501e-05, -3.4224241971969604e-05, -1.87605619430542e-05, -3.296881914138794e-06, 1.2166798114776611e-05, 2.7630478143692017e-05, 4.309415817260742e-05, 5.855783820152283e-05, 7.402151823043823e-05, 8.948519825935364e-05, 0.00010494887828826904, 0.00012041255831718445, 0.00013587623834609985, 0.00015133991837501526, 0.00016680359840393066, 0.00018226727843284607, 0.00019773095846176147, 0.00021319463849067688, 0.00022865831851959229, 0.0002441219985485077, 0.0002595856785774231, 0.0002750493586063385, 0.0002905130386352539, 0.0003059767186641693, 0.0003214403986930847, 0.0003369040787220001, 0.00035236775875091553, 0.00036783143877983093, 0.00038329511880874634, 0.00039875879883766174, 0.00041422247886657715, 0.00042968615889549255, 0.00044514983892440796, 0.00046061351895332336, 0.00047607719898223877, 0.0004915408790111542, 0.0005070045590400696, 0.000522468239068985, 0.0005379319190979004]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 9.0, 3.0, 7.0, 9.0, 5.0, 7.0, 12.0, 25.0, 12.0, 15.0, 20.0, 21.0, 20.0, 31.0, 30.0, 34.0, 30.0, 26.0, 35.0, 39.0, 41.0, 41.0, 41.0, 46.0, 37.0, 31.0, 40.0, 35.0, 35.0, 46.0, 31.0, 27.0, 21.0, 22.0, 21.0, 14.0, 18.0, 13.0, 17.0, 6.0, 9.0, 6.0, 3.0, 1.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.546875, -4.41815185546875, -4.2894287109375, -4.16070556640625, -4.031982421875, -3.90325927734375, -3.7745361328125, -3.64581298828125, -3.51708984375, -3.38836669921875, -3.2596435546875, -3.13092041015625, -3.002197265625, -2.87347412109375, -2.7447509765625, -2.61602783203125, -2.4873046875, -2.35858154296875, -2.2298583984375, -2.10113525390625, -1.972412109375, -1.84368896484375, -1.7149658203125, -1.58624267578125, -1.45751953125, -1.32879638671875, -1.2000732421875, -1.07135009765625, -0.942626953125, -0.81390380859375, -0.6851806640625, -0.55645751953125, -0.427734375, -0.29901123046875, -0.1702880859375, -0.04156494140625, 0.087158203125, 0.21588134765625, 0.3446044921875, 0.47332763671875, 0.60205078125, 0.73077392578125, 0.8594970703125, 0.98822021484375, 1.116943359375, 1.24566650390625, 1.3743896484375, 1.50311279296875, 1.6318359375, 1.76055908203125, 1.8892822265625, 2.01800537109375, 2.146728515625, 2.27545166015625, 2.4041748046875, 2.53289794921875, 2.66162109375, 2.79034423828125, 2.9190673828125, 3.04779052734375, 3.176513671875, 3.30523681640625, 3.4339599609375, 3.56268310546875, 3.69140625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 12.0, 7.0, 6.0, 7.0, 10.0, 16.0, 28.0, 32.0, 41.0, 74.0, 86.0, 114.0, 149.0, 217.0, 283.0, 457.0, 742.0, 1307.0, 2664.0, 6005.0, 15517.0, 48317.0, 171727.0, 463162.0, 236807.0, 65320.0, 20462.0, 7508.0, 3300.0, 1590.0, 857.0, 514.0, 381.0, 221.0, 157.0, 128.0, 99.0, 62.0, 48.0, 35.0, 16.0, 15.0, 23.0, 10.0, 9.0, 8.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.36328125, -4.2335205078125, -4.103759765625, -3.9739990234375, -3.84423828125, -3.7144775390625, -3.584716796875, -3.4549560546875, -3.3251953125, -3.1954345703125, -3.065673828125, -2.9359130859375, -2.80615234375, -2.6763916015625, -2.546630859375, -2.4168701171875, -2.287109375, -2.1573486328125, -2.027587890625, -1.8978271484375, -1.76806640625, -1.6383056640625, -1.508544921875, -1.3787841796875, -1.2490234375, -1.1192626953125, -0.989501953125, -0.8597412109375, -0.72998046875, -0.6002197265625, -0.470458984375, -0.3406982421875, -0.2109375, -0.0811767578125, 0.048583984375, 0.1783447265625, 0.30810546875, 0.4378662109375, 0.567626953125, 0.6973876953125, 0.8271484375, 0.9569091796875, 1.086669921875, 1.2164306640625, 1.34619140625, 1.4759521484375, 1.605712890625, 1.7354736328125, 1.865234375, 1.9949951171875, 2.124755859375, 2.2545166015625, 2.38427734375, 2.5140380859375, 2.643798828125, 2.7735595703125, 2.9033203125, 3.0330810546875, 3.162841796875, 3.2926025390625, 3.42236328125, 3.5521240234375, 3.681884765625, 3.8116455078125, 3.94140625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 4.0, 7.0, 6.0, 9.0, 11.0, 23.0, 24.0, 16.0, 21.0, 18.0, 28.0, 22.0, 37.0, 31.0, 31.0, 46.0, 57.0, 75.0, 296.0, 1687.0, 150.0, 54.0, 44.0, 49.0, 44.0, 39.0, 27.0, 29.0, 26.0, 34.0, 16.0, 17.0, 9.0, 13.0, 12.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.171875, -13.687744140625, -13.20361328125, -12.719482421875, -12.2353515625, -11.751220703125, -11.26708984375, -10.782958984375, -10.298828125, -9.814697265625, -9.33056640625, -8.846435546875, -8.3623046875, -7.878173828125, -7.39404296875, -6.909912109375, -6.42578125, -5.941650390625, -5.45751953125, -4.973388671875, -4.4892578125, -4.005126953125, -3.52099609375, -3.036865234375, -2.552734375, -2.068603515625, -1.58447265625, -1.100341796875, -0.6162109375, -0.132080078125, 0.35205078125, 0.836181640625, 1.3203125, 1.804443359375, 2.28857421875, 2.772705078125, 3.2568359375, 3.740966796875, 4.22509765625, 4.709228515625, 5.193359375, 5.677490234375, 6.16162109375, 6.645751953125, 7.1298828125, 7.614013671875, 8.09814453125, 8.582275390625, 9.06640625, 9.550537109375, 10.03466796875, 10.518798828125, 11.0029296875, 11.487060546875, 11.97119140625, 12.455322265625, 12.939453125, 13.423583984375, 13.90771484375, 14.391845703125, 14.8759765625, 15.360107421875, 15.84423828125, 16.328369140625, 16.8125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 6.0, 10.0, 14.0, 9.0, 16.0, 14.0, 27.0, 32.0, 43.0, 35.0, 63.0, 74.0, 126.0, 248.0, 618.0, 3664.0, 3078906.0, 59542.0, 1226.0, 420.0, 160.0, 95.0, 68.0, 43.0, 37.0, 33.0, 22.0, 25.0, 18.0, 18.0, 22.0, 13.0, 8.0, 9.0, 7.0, 2.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-38.875, -37.75634765625, -36.6376953125, -35.51904296875, -34.400390625, -33.28173828125, -32.1630859375, -31.04443359375, -29.92578125, -28.80712890625, -27.6884765625, -26.56982421875, -25.451171875, -24.33251953125, -23.2138671875, -22.09521484375, -20.9765625, -19.85791015625, -18.7392578125, -17.62060546875, -16.501953125, -15.38330078125, -14.2646484375, -13.14599609375, -12.02734375, -10.90869140625, -9.7900390625, -8.67138671875, -7.552734375, -6.43408203125, -5.3154296875, -4.19677734375, -3.078125, -1.95947265625, -0.8408203125, 0.27783203125, 1.396484375, 2.51513671875, 3.6337890625, 4.75244140625, 5.87109375, 6.98974609375, 8.1083984375, 9.22705078125, 10.345703125, 11.46435546875, 12.5830078125, 13.70166015625, 14.8203125, 15.93896484375, 17.0576171875, 18.17626953125, 19.294921875, 20.41357421875, 21.5322265625, 22.65087890625, 23.76953125, 24.88818359375, 26.0068359375, 27.12548828125, 28.244140625, 29.36279296875, 30.4814453125, 31.60009765625, 32.71875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [101.0, 917.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12860631942749, -1.2157740592956543, 3.6970582008361816, 8.60988998413086, 13.522722244262695, 18.43555450439453, 23.348386764526367, 28.26121711730957, 33.17405319213867, 38.086883544921875, 42.999717712402344, 47.91255187988281, 52.825382232666016, 57.73821258544922, 62.65104675292969, 67.56387329101562, 72.4767074584961, 77.38954162597656, 82.3023681640625, 87.21520233154297, 92.12803649902344, 97.0408706665039, 101.95370483398438, 106.86653137207031, 111.77936553955078, 116.69219970703125, 121.60502624511719, 126.51786041259766, 131.43069458007812, 136.34352111816406, 141.25636291503906, 146.169189453125, 151.08203125, 155.99485778808594, 160.90769958496094, 165.82052612304688, 170.73336791992188, 175.6461944580078, 180.55902099609375, 185.47186279296875, 190.3846893310547, 195.29751586914062, 200.21035766601562, 205.12318420410156, 210.0360107421875, 214.9488525390625, 219.86167907714844, 224.77450561523438, 229.68734741210938, 234.6001739501953, 239.5130157470703, 244.42584228515625, 249.33868408203125, 254.2515106201172, 259.1643371582031, 264.0771789550781, 268.989990234375, 273.90283203125, 278.8156433105469, 283.7284851074219, 288.6413269042969, 293.55413818359375, 298.46697998046875, 303.37982177734375, 308.29266357421875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 14.0, 12.0, 16.0, 7.0, 17.0, 20.0, 27.0, 30.0, 27.0, 20.0, 27.0, 36.0, 33.0, 41.0, 44.0, 34.0, 40.0, 63.0, 52.0, 47.0, 48.0, 39.0, 36.0, 41.0, 31.0, 22.0, 29.0, 23.0, 19.0, 26.0, 8.0, 8.0, 9.0, 9.0, 6.0, 4.0, 7.0, 4.0, 1.0, 5.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-47.761878967285156, -46.26251983642578, -44.763160705566406, -43.26380157470703, -41.764442443847656, -40.265079498291016, -38.76572036743164, -37.266361236572266, -35.76700210571289, -34.267642974853516, -32.76828384399414, -31.268922805786133, -29.769563674926758, -28.270204544067383, -26.770843505859375, -25.271484375, -23.772125244140625, -22.27276611328125, -20.773406982421875, -19.274045944213867, -17.774686813354492, -16.275327682495117, -14.775967597961426, -13.276607513427734, -11.77724838256836, -10.277889251708984, -8.778529167175293, -7.27916955947876, -5.779809951782227, -4.280450344085693, -2.78109073638916, -1.2817306518554688, 0.21762847900390625, 1.7169880867004395, 3.2163476943969727, 4.715707302093506, 6.215066909790039, 7.714426517486572, 9.213786125183105, 10.713146209716797, 12.212505340576172, 13.711864471435547, 15.211224555969238, 16.71058464050293, 18.209943771362305, 19.70930290222168, 21.208663940429688, 22.708023071289062, 24.207382202148438, 25.706741333007812, 27.206100463867188, 28.705461502075195, 30.20482063293457, 31.704179763793945, 33.20354080200195, 34.70289993286133, 36.2022590637207, 37.70161819458008, 39.20097732543945, 40.70033645629883, 42.19969940185547, 43.699058532714844, 45.19841766357422, 46.697776794433594, 48.19713592529297]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 9.0, 3.0, 9.0, 7.0, 9.0, 22.0, 17.0, 12.0, 17.0, 17.0, 25.0, 21.0, 34.0, 34.0, 36.0, 27.0, 27.0, 47.0, 45.0, 34.0, 49.0, 44.0, 43.0, 40.0, 40.0, 34.0, 38.0, 41.0, 33.0, 28.0, 21.0, 26.0, 20.0, 16.0, 15.0, 16.0, 13.0, 6.0, 7.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.62005615234375, -4.4822998046875, -4.34454345703125, -4.206787109375, -4.06903076171875, -3.9312744140625, -3.79351806640625, -3.65576171875, -3.51800537109375, -3.3802490234375, -3.24249267578125, -3.104736328125, -2.96697998046875, -2.8292236328125, -2.69146728515625, -2.5537109375, -2.41595458984375, -2.2781982421875, -2.14044189453125, -2.002685546875, -1.86492919921875, -1.7271728515625, -1.58941650390625, -1.45166015625, -1.31390380859375, -1.1761474609375, -1.03839111328125, -0.900634765625, -0.76287841796875, -0.6251220703125, -0.48736572265625, -0.349609375, -0.21185302734375, -0.0740966796875, 0.06365966796875, 0.201416015625, 0.33917236328125, 0.4769287109375, 0.61468505859375, 0.75244140625, 0.89019775390625, 1.0279541015625, 1.16571044921875, 1.303466796875, 1.44122314453125, 1.5789794921875, 1.71673583984375, 1.8544921875, 1.99224853515625, 2.1300048828125, 2.26776123046875, 2.405517578125, 2.54327392578125, 2.6810302734375, 2.81878662109375, 2.95654296875, 3.09429931640625, 3.2320556640625, 3.36981201171875, 3.507568359375, 3.64532470703125, 3.7830810546875, 3.92083740234375, 4.05859375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 11.0, 6.0, 8.0, 10.0, 18.0, 10.0, 19.0, 20.0, 26.0, 36.0, 48.0, 54.0, 77.0, 116.0, 191.0, 316.0, 763.0, 3034.0, 22387.0, 341478.0, 2853152.0, 912369.0, 52262.0, 5555.0, 1160.0, 458.0, 195.0, 129.0, 80.0, 66.0, 36.0, 24.0, 33.0, 25.0, 26.0, 10.0, 11.0, 11.0, 7.0, 8.0, 8.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.8819580078125, -13.443603515625, -13.0052490234375, -12.56689453125, -12.1285400390625, -11.690185546875, -11.2518310546875, -10.8134765625, -10.3751220703125, -9.936767578125, -9.4984130859375, -9.06005859375, -8.6217041015625, -8.183349609375, -7.7449951171875, -7.306640625, -6.8682861328125, -6.429931640625, -5.9915771484375, -5.55322265625, -5.1148681640625, -4.676513671875, -4.2381591796875, -3.7998046875, -3.3614501953125, -2.923095703125, -2.4847412109375, -2.04638671875, -1.6080322265625, -1.169677734375, -0.7313232421875, -0.29296875, 0.1453857421875, 0.583740234375, 1.0220947265625, 1.46044921875, 1.8988037109375, 2.337158203125, 2.7755126953125, 3.2138671875, 3.6522216796875, 4.090576171875, 4.5289306640625, 4.96728515625, 5.4056396484375, 5.843994140625, 6.2823486328125, 6.720703125, 7.1590576171875, 7.597412109375, 8.0357666015625, 8.47412109375, 8.9124755859375, 9.350830078125, 9.7891845703125, 10.2275390625, 10.6658935546875, 11.104248046875, 11.5426025390625, 11.98095703125, 12.4193115234375, 12.857666015625, 13.2960205078125, 13.734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 6.0, 9.0, 9.0, 8.0, 15.0, 21.0, 33.0, 41.0, 55.0, 66.0, 94.0, 131.0, 197.0, 271.0, 333.0, 476.0, 518.0, 432.0, 369.0, 265.0, 209.0, 116.0, 94.0, 66.0, 65.0, 58.0, 33.0, 24.0, 11.0, 10.0, 11.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.28125, -14.764404296875, -14.24755859375, -13.730712890625, -13.2138671875, -12.697021484375, -12.18017578125, -11.663330078125, -11.146484375, -10.629638671875, -10.11279296875, -9.595947265625, -9.0791015625, -8.562255859375, -8.04541015625, -7.528564453125, -7.01171875, -6.494873046875, -5.97802734375, -5.461181640625, -4.9443359375, -4.427490234375, -3.91064453125, -3.393798828125, -2.876953125, -2.360107421875, -1.84326171875, -1.326416015625, -0.8095703125, -0.292724609375, 0.22412109375, 0.740966796875, 1.2578125, 1.774658203125, 2.29150390625, 2.808349609375, 3.3251953125, 3.842041015625, 4.35888671875, 4.875732421875, 5.392578125, 5.909423828125, 6.42626953125, 6.943115234375, 7.4599609375, 7.976806640625, 8.49365234375, 9.010498046875, 9.52734375, 10.044189453125, 10.56103515625, 11.077880859375, 11.5947265625, 12.111572265625, 12.62841796875, 13.145263671875, 13.662109375, 14.178955078125, 14.69580078125, 15.212646484375, 15.7294921875, 16.246337890625, 16.76318359375, 17.280029296875, 17.796875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 5.0, 11.0, 13.0, 27.0, 45.0, 36.0, 77.0, 80.0, 116.0, 165.0, 296.0, 663.0, 3808.0, 1427524.0, 2754667.0, 4977.0, 751.0, 335.0, 194.0, 137.0, 98.0, 69.0, 43.0, 39.0, 23.0, 23.0, 4.0, 10.0, 9.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-61.28125, -59.24169921875, -57.2021484375, -55.16259765625, -53.123046875, -51.08349609375, -49.0439453125, -47.00439453125, -44.96484375, -42.92529296875, -40.8857421875, -38.84619140625, -36.806640625, -34.76708984375, -32.7275390625, -30.68798828125, -28.6484375, -26.60888671875, -24.5693359375, -22.52978515625, -20.490234375, -18.45068359375, -16.4111328125, -14.37158203125, -12.33203125, -10.29248046875, -8.2529296875, -6.21337890625, -4.173828125, -2.13427734375, -0.0947265625, 1.94482421875, 3.984375, 6.02392578125, 8.0634765625, 10.10302734375, 12.142578125, 14.18212890625, 16.2216796875, 18.26123046875, 20.30078125, 22.34033203125, 24.3798828125, 26.41943359375, 28.458984375, 30.49853515625, 32.5380859375, 34.57763671875, 36.6171875, 38.65673828125, 40.6962890625, 42.73583984375, 44.775390625, 46.81494140625, 48.8544921875, 50.89404296875, 52.93359375, 54.97314453125, 57.0126953125, 59.05224609375, 61.091796875, 63.13134765625, 65.1708984375, 67.21044921875, 69.25]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 11.0, 244.0, 677.0, 82.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.37440490722656, -65.42137908935547, -56.46834945678711, -47.51531982421875, -38.562294006347656, -29.609268188476562, -20.656238555908203, -11.703208923339844, -2.75018310546875, 6.202844619750977, 15.155872344970703, 24.10890007019043, 33.061927795410156, 42.01495361328125, 50.96798324584961, 59.92101287841797, 68.87403869628906, 77.82706451416016, 86.78009033203125, 95.73312377929688, 104.68614959716797, 113.63917541503906, 122.59220886230469, 131.54522705078125, 140.49826049804688, 149.4512939453125, 158.40431213378906, 167.3573455810547, 176.31036376953125, 185.26339721679688, 194.2164306640625, 203.16946411132812, 212.12246704101562, 221.07550048828125, 230.0285186767578, 238.98155212402344, 247.9345703125, 256.8876037597656, 265.84063720703125, 274.7936706542969, 283.7467041015625, 292.6997375488281, 301.65277099609375, 310.60577392578125, 319.5588073730469, 328.5118408203125, 337.4648742675781, 346.41790771484375, 355.37091064453125, 364.3239440917969, 373.2769775390625, 382.22998046875, 391.1830139160156, 400.13604736328125, 409.0890808105469, 418.0421142578125, 426.9951171875, 435.9481506347656, 444.90118408203125, 453.85418701171875, 462.8072204589844, 471.76025390625, 480.7132873535156, 489.66632080078125, 498.6193542480469]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 11.0, 11.0, 16.0, 19.0, 26.0, 15.0, 23.0, 20.0, 35.0, 26.0, 51.0, 30.0, 37.0, 30.0, 32.0, 33.0, 30.0, 51.0, 42.0, 34.0, 44.0, 28.0, 39.0, 28.0, 30.0, 25.0, 28.0, 25.0, 15.0, 21.0, 24.0, 16.0, 17.0, 13.0, 5.0, 4.0, 10.0, 8.0, 7.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-49.354095458984375, -47.81196212768555, -46.26982879638672, -44.727691650390625, -43.1855583190918, -41.64342498779297, -40.101287841796875, -38.55915451049805, -37.01702117919922, -35.47488784790039, -33.93275451660156, -32.39061737060547, -30.84848403930664, -29.306350708007812, -27.76421546936035, -26.22208023071289, -24.679946899414062, -23.137813568115234, -21.595678329467773, -20.053543090820312, -18.511409759521484, -16.969276428222656, -15.427141189575195, -13.88500690460205, -12.342872619628906, -10.800738334655762, -9.258604049682617, -7.716469764709473, -6.174335479736328, -4.632201194763184, -3.090066909790039, -1.5479326248168945, -0.00579833984375, 1.5363359451293945, 3.078470230102539, 4.620604515075684, 6.162738800048828, 7.704873085021973, 9.247007369995117, 10.789141654968262, 12.331275939941406, 13.87341022491455, 15.415544509887695, 16.957679748535156, 18.499813079833984, 20.041946411132812, 21.584081649780273, 23.126216888427734, 24.668350219726562, 26.21048355102539, 27.75261878967285, 29.294754028320312, 30.83688735961914, 32.37902069091797, 33.92115783691406, 35.46329116821289, 37.00542449951172, 38.54755783081055, 40.089691162109375, 41.63182830810547, 43.1739616394043, 44.716094970703125, 46.25823211669922, 47.80036544799805, 49.342498779296875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 6.0, 5.0, 11.0, 13.0, 14.0, 12.0, 20.0, 20.0, 13.0, 17.0, 25.0, 23.0, 35.0, 43.0, 32.0, 30.0, 36.0, 45.0, 49.0, 29.0, 47.0, 52.0, 37.0, 36.0, 34.0, 33.0, 42.0, 26.0, 29.0, 30.0, 21.0, 26.0, 16.0, 12.0, 18.0, 14.0, 6.0, 13.0, 8.0, 4.0, 9.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.15234375, -5.01275634765625, -4.8731689453125, -4.73358154296875, -4.593994140625, -4.45440673828125, -4.3148193359375, -4.17523193359375, -4.03564453125, -3.89605712890625, -3.7564697265625, -3.61688232421875, -3.477294921875, -3.33770751953125, -3.1981201171875, -3.05853271484375, -2.9189453125, -2.77935791015625, -2.6397705078125, -2.50018310546875, -2.360595703125, -2.22100830078125, -2.0814208984375, -1.94183349609375, -1.80224609375, -1.66265869140625, -1.5230712890625, -1.38348388671875, -1.243896484375, -1.10430908203125, -0.9647216796875, -0.82513427734375, -0.685546875, -0.54595947265625, -0.4063720703125, -0.26678466796875, -0.127197265625, 0.01239013671875, 0.1519775390625, 0.29156494140625, 0.43115234375, 0.57073974609375, 0.7103271484375, 0.84991455078125, 0.989501953125, 1.12908935546875, 1.2686767578125, 1.40826416015625, 1.5478515625, 1.68743896484375, 1.8270263671875, 1.96661376953125, 2.106201171875, 2.24578857421875, 2.3853759765625, 2.52496337890625, 2.66455078125, 2.80413818359375, 2.9437255859375, 3.08331298828125, 3.222900390625, 3.36248779296875, 3.5020751953125, 3.64166259765625, 3.78125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 18.0, 22.0, 24.0, 38.0, 62.0, 65.0, 126.0, 194.0, 288.0, 491.0, 661.0, 993.0, 1618.0, 2449.0, 3735.0, 5908.0, 9201.0, 14916.0, 23924.0, 39022.0, 66318.0, 114308.0, 208217.0, 236112.0, 129984.0, 74762.0, 43620.0, 26289.0, 16518.0, 10235.0, 6534.0, 4132.0, 2706.0, 1687.0, 1172.0, 759.0, 482.0, 297.0, 233.0, 128.0, 99.0, 67.0, 48.0, 31.0, 20.0, 12.0, 8.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.67431640625, -0.6526412963867188, -0.6309661865234375, -0.6092910766601562, -0.587615966796875, -0.5659408569335938, -0.5442657470703125, -0.5225906372070312, -0.50091552734375, -0.47924041748046875, -0.4575653076171875, -0.43589019775390625, -0.414215087890625, -0.39253997802734375, -0.3708648681640625, -0.34918975830078125, -0.3275146484375, -0.30583953857421875, -0.2841644287109375, -0.26248931884765625, -0.240814208984375, -0.21913909912109375, -0.1974639892578125, -0.17578887939453125, -0.15411376953125, -0.13243865966796875, -0.1107635498046875, -0.08908843994140625, -0.067413330078125, -0.04573822021484375, -0.0240631103515625, -0.00238800048828125, 0.019287109375, 0.04096221923828125, 0.0626373291015625, 0.08431243896484375, 0.105987548828125, 0.12766265869140625, 0.1493377685546875, 0.17101287841796875, 0.19268798828125, 0.21436309814453125, 0.2360382080078125, 0.25771331787109375, 0.279388427734375, 0.30106353759765625, 0.3227386474609375, 0.34441375732421875, 0.3660888671875, 0.38776397705078125, 0.4094390869140625, 0.43111419677734375, 0.452789306640625, 0.47446441650390625, 0.4961395263671875, 0.5178146362304688, 0.53948974609375, 0.5611648559570312, 0.5828399658203125, 0.6045150756835938, 0.626190185546875, 0.6478652954101562, 0.6695404052734375, 0.6912155151367188, 0.712890625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 5.0, 6.0, 8.0, 11.0, 8.0, 20.0, 21.0, 25.0, 27.0, 23.0, 25.0, 37.0, 33.0, 39.0, 35.0, 53.0, 35.0, 38.0, 1068.0, 42.0, 43.0, 48.0, 40.0, 34.0, 42.0, 27.0, 25.0, 35.0, 23.0, 18.0, 17.0, 9.0, 11.0, 17.0, 10.0, 13.0, 8.0, 6.0, 6.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.91796875, -2.82733154296875, -2.7366943359375, -2.64605712890625, -2.555419921875, -2.46478271484375, -2.3741455078125, -2.28350830078125, -2.19287109375, -2.10223388671875, -2.0115966796875, -1.92095947265625, -1.830322265625, -1.73968505859375, -1.6490478515625, -1.55841064453125, -1.4677734375, -1.37713623046875, -1.2864990234375, -1.19586181640625, -1.105224609375, -1.01458740234375, -0.9239501953125, -0.83331298828125, -0.74267578125, -0.65203857421875, -0.5614013671875, -0.47076416015625, -0.380126953125, -0.28948974609375, -0.1988525390625, -0.10821533203125, -0.017578125, 0.07305908203125, 0.1636962890625, 0.25433349609375, 0.344970703125, 0.43560791015625, 0.5262451171875, 0.61688232421875, 0.70751953125, 0.79815673828125, 0.8887939453125, 0.97943115234375, 1.070068359375, 1.16070556640625, 1.2513427734375, 1.34197998046875, 1.4326171875, 1.52325439453125, 1.6138916015625, 1.70452880859375, 1.795166015625, 1.88580322265625, 1.9764404296875, 2.06707763671875, 2.15771484375, 2.24835205078125, 2.3389892578125, 2.42962646484375, 2.520263671875, 2.61090087890625, 2.7015380859375, 2.79217529296875, 2.8828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 5.0, 9.0, 6.0, 12.0, 22.0, 36.0, 45.0, 70.0, 90.0, 133.0, 204.0, 292.0, 404.0, 572.0, 812.0, 1132.0, 1597.0, 2409.0, 3393.0, 4996.0, 7500.0, 11086.0, 17128.0, 27106.0, 43970.0, 73510.0, 125723.0, 1265682.0, 206493.0, 117523.0, 69105.0, 41080.0, 25648.0, 16125.0, 10622.0, 7077.0, 4783.0, 3293.0, 2324.0, 1529.0, 1105.0, 727.0, 530.0, 364.0, 255.0, 190.0, 129.0, 66.0, 75.0, 45.0, 38.0, 25.0, 11.0, 12.0, 10.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5458984375, -0.5276641845703125, -0.509429931640625, -0.4911956787109375, -0.47296142578125, -0.4547271728515625, -0.436492919921875, -0.4182586669921875, -0.4000244140625, -0.3817901611328125, -0.363555908203125, -0.3453216552734375, -0.32708740234375, -0.3088531494140625, -0.290618896484375, -0.2723846435546875, -0.254150390625, -0.2359161376953125, -0.217681884765625, -0.1994476318359375, -0.18121337890625, -0.1629791259765625, -0.144744873046875, -0.1265106201171875, -0.1082763671875, -0.0900421142578125, -0.071807861328125, -0.0535736083984375, -0.03533935546875, -0.0171051025390625, 0.001129150390625, 0.0193634033203125, 0.03759765625, 0.0558319091796875, 0.074066162109375, 0.0923004150390625, 0.11053466796875, 0.1287689208984375, 0.147003173828125, 0.1652374267578125, 0.1834716796875, 0.2017059326171875, 0.219940185546875, 0.2381744384765625, 0.25640869140625, 0.2746429443359375, 0.292877197265625, 0.3111114501953125, 0.329345703125, 0.3475799560546875, 0.365814208984375, 0.3840484619140625, 0.40228271484375, 0.4205169677734375, 0.438751220703125, 0.4569854736328125, 0.4752197265625, 0.4934539794921875, 0.511688232421875, 0.5299224853515625, 0.54815673828125, 0.5663909912109375, 0.584625244140625, 0.6028594970703125, 0.62109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 7.0, 6.0, 8.0, 14.0, 21.0, 33.0, 40.0, 48.0, 83.0, 91.0, 126.0, 117.0, 119.0, 68.0, 39.0, 41.0, 34.0, 23.0, 24.0, 10.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012760162353515625, -0.0012321621179580688, -0.0011883080005645752, -0.0011444538831710815, -0.0011005997657775879, -0.0010567456483840942, -0.0010128915309906006, -0.0009690374135971069, -0.0009251832962036133, -0.0008813291788101196, -0.000837475061416626, -0.0007936209440231323, -0.0007497668266296387, -0.000705912709236145, -0.0006620585918426514, -0.0006182044744491577, -0.0005743503570556641, -0.0005304962396621704, -0.00048664212226867676, -0.0004427880048751831, -0.00039893388748168945, -0.0003550797700881958, -0.00031122565269470215, -0.0002673715353012085, -0.00022351741790771484, -0.0001796633005142212, -0.00013580918312072754, -9.195506572723389e-05, -4.8100948333740234e-05, -4.246830940246582e-06, 3.960728645324707e-05, 8.346140384674072e-05, 0.00012731552124023438, 0.00017116963863372803, 0.00021502375602722168, 0.00025887787342071533, 0.000302731990814209, 0.00034658610820770264, 0.0003904402256011963, 0.00043429434299468994, 0.0004781484603881836, 0.0005220025777816772, 0.0005658566951751709, 0.0006097108125686646, 0.0006535649299621582, 0.0006974190473556519, 0.0007412731647491455, 0.0007851272821426392, 0.0008289813995361328, 0.0008728355169296265, 0.0009166896343231201, 0.0009605437517166138, 0.0010043978691101074, 0.001048251986503601, 0.0010921061038970947, 0.0011359602212905884, 0.001179814338684082, 0.0012236684560775757, 0.0012675225734710693, 0.001311376690864563, 0.0013552308082580566, 0.0013990849256515503, 0.001442939043045044, 0.0014867931604385376, 0.0015306472778320312]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 4.0, 11.0, 13.0, 30.0, 41.0, 47.0, 87.0, 142.0, 279.0, 1165.0, 1044982.0, 1102.0, 284.0, 122.0, 73.0, 56.0, 25.0, 26.0, 6.0, 10.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04071044921875, -0.039530277252197266, -0.03835010528564453, -0.0371699333190918, -0.03598976135253906, -0.03480958938598633, -0.033629417419433594, -0.03244924545288086, -0.031269073486328125, -0.03008890151977539, -0.028908729553222656, -0.027728557586669922, -0.026548385620117188, -0.025368213653564453, -0.02418804168701172, -0.023007869720458984, -0.02182769775390625, -0.020647525787353516, -0.01946735382080078, -0.018287181854248047, -0.017107009887695312, -0.015926837921142578, -0.014746665954589844, -0.01356649398803711, -0.012386322021484375, -0.01120615005493164, -0.010025978088378906, -0.008845806121826172, -0.0076656341552734375, -0.006485462188720703, -0.005305290222167969, -0.004125118255615234, -0.0029449462890625, -0.0017647743225097656, -0.0005846023559570312, 0.0005955696105957031, 0.0017757415771484375, 0.002955913543701172, 0.004136085510253906, 0.005316257476806641, 0.006496429443359375, 0.007676601409912109, 0.008856773376464844, 0.010036945343017578, 0.011217117309570312, 0.012397289276123047, 0.013577461242675781, 0.014757633209228516, 0.01593780517578125, 0.017117977142333984, 0.01829814910888672, 0.019478321075439453, 0.020658493041992188, 0.021838665008544922, 0.023018836975097656, 0.02419900894165039, 0.025379180908203125, 0.02655935287475586, 0.027739524841308594, 0.028919696807861328, 0.030099868774414062, 0.0312800407409668, 0.03246021270751953, 0.033640384674072266, 0.034820556640625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 565.0, 431.0, 14.0, 2.0, 0.0, 1.0], "bins": [-0.0048218173906207085, -0.004739995580166578, -0.004658174235373735, -0.004576352424919605, -0.004494530614465475, -0.004412709269672632, -0.004330887459218502, -0.004249066114425659, -0.004167244303971529, -0.004085422493517399, -0.004003601148724556, -0.003921779338270426, -0.0038399577606469393, -0.0037581361830234528, -0.0036763143725693226, -0.003594492794945836, -0.0035126712173223495, -0.003430849639698863, -0.003349027829244733, -0.0032672062516212463, -0.00318538467399776, -0.0031035630963742733, -0.003021741285920143, -0.0029399197082966566, -0.0028580978978425264, -0.00277627632021904, -0.0026944545097649097, -0.0026126329321414232, -0.0025308113545179367, -0.00244898977689445, -0.00236716796644032, -0.0022853463888168335, -0.002203524811193347, -0.0021217032335698605, -0.0020398814231157303, -0.0019580598454922438, -0.0018762382678687572, -0.001794416573829949, -0.0017125948797911406, -0.001630773302167654, -0.0015489516081288457, -0.0014671299140900373, -0.0013853083364665508, -0.0013034866424277425, -0.001221665064804256, -0.0011398433707654476, -0.001058021793141961, -0.0009762000991031528, -0.0008943785214796662, -0.0008125568856485188, -0.0007307352498173714, -0.000648913555778563, -0.0005670919781550765, -0.0004852703132200986, -0.0004034486482851207, -0.0003216270124539733, -0.0002398053475189954, -0.00015798371168784797, -7.616206130478531e-05, 5.6595890782773495e-06, 8.748122490942478e-05, 0.00016930286074057221, 0.0002511245256755501, 0.00033294616150669754, 0.00041476779733784497]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 12.0, 10.0, 15.0, 19.0, 19.0, 28.0, 32.0, 31.0, 36.0, 37.0, 31.0, 33.0, 46.0, 37.0, 44.0, 60.0, 42.0, 45.0, 39.0, 36.0, 37.0, 35.0, 28.0, 44.0, 33.0, 15.0, 25.0, 16.0, 15.0, 13.0, 10.0, 10.0, 9.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0004946589469909668, -0.0004779137670993805, -0.0004611685872077942, -0.0004444234073162079, -0.0004276782274246216, -0.0004109330475330353, -0.000394187867641449, -0.00037744268774986267, -0.00036069750785827637, -0.00034395232796669006, -0.00032720714807510376, -0.00031046196818351746, -0.00029371678829193115, -0.00027697160840034485, -0.00026022642850875854, -0.00024348124861717224, -0.00022673606872558594, -0.00020999088883399963, -0.00019324570894241333, -0.00017650052905082703, -0.00015975534915924072, -0.00014301016926765442, -0.00012626498937606812, -0.00010951980948448181, -9.277462959289551e-05, -7.60294497013092e-05, -5.92842698097229e-05, -4.25390899181366e-05, -2.5793910026550293e-05, -9.04873013496399e-06, 7.696449756622314e-06, 2.4441629648208618e-05, 4.118680953979492e-05, 5.7931989431381226e-05, 7.467716932296753e-05, 9.142234921455383e-05, 0.00010816752910614014, 0.00012491270899772644, 0.00014165788888931274, 0.00015840306878089905, 0.00017514824867248535, 0.00019189342856407166, 0.00020863860845565796, 0.00022538378834724426, 0.00024212896823883057, 0.00025887414813041687, 0.0002756193280220032, 0.0002923645079135895, 0.0003091096878051758, 0.0003258548676967621, 0.0003426000475883484, 0.0003593452274799347, 0.000376090407371521, 0.0003928355872631073, 0.0004095807671546936, 0.0004263259470462799, 0.0004430711269378662, 0.0004598163068294525, 0.0004765614867210388, 0.0004933066666126251, 0.0005100518465042114, 0.0005267970263957977, 0.000543542206287384, 0.0005602873861789703, 0.0005770325660705566]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 6.0, 5.0, 11.0, 13.0, 14.0, 12.0, 20.0, 20.0, 13.0, 17.0, 25.0, 23.0, 35.0, 43.0, 32.0, 30.0, 36.0, 45.0, 49.0, 29.0, 47.0, 52.0, 37.0, 36.0, 34.0, 33.0, 42.0, 26.0, 29.0, 30.0, 21.0, 26.0, 16.0, 12.0, 18.0, 14.0, 6.0, 13.0, 8.0, 4.0, 9.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.15234375, -5.01275634765625, -4.8731689453125, -4.73358154296875, -4.593994140625, -4.45440673828125, -4.3148193359375, -4.17523193359375, -4.03564453125, -3.89605712890625, -3.7564697265625, -3.61688232421875, -3.477294921875, -3.33770751953125, -3.1981201171875, -3.05853271484375, -2.9189453125, -2.77935791015625, -2.6397705078125, -2.50018310546875, -2.360595703125, -2.22100830078125, -2.0814208984375, -1.94183349609375, -1.80224609375, -1.66265869140625, -1.5230712890625, -1.38348388671875, -1.243896484375, -1.10430908203125, -0.9647216796875, -0.82513427734375, -0.685546875, -0.54595947265625, -0.4063720703125, -0.26678466796875, -0.127197265625, 0.01239013671875, 0.1519775390625, 0.29156494140625, 0.43115234375, 0.57073974609375, 0.7103271484375, 0.84991455078125, 0.989501953125, 1.12908935546875, 1.2686767578125, 1.40826416015625, 1.5478515625, 1.68743896484375, 1.8270263671875, 1.96661376953125, 2.106201171875, 2.24578857421875, 2.3853759765625, 2.52496337890625, 2.66455078125, 2.80413818359375, 2.9437255859375, 3.08331298828125, 3.222900390625, 3.36248779296875, 3.5020751953125, 3.64166259765625, 3.78125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 11.0, 12.0, 15.0, 20.0, 28.0, 36.0, 49.0, 76.0, 81.0, 131.0, 174.0, 235.0, 391.0, 559.0, 898.0, 1344.0, 2350.0, 4068.0, 7436.0, 14965.0, 31298.0, 74489.0, 199622.0, 410383.0, 174548.0, 66306.0, 28499.0, 13661.0, 6889.0, 3746.0, 2211.0, 1309.0, 876.0, 582.0, 385.0, 235.0, 197.0, 109.0, 88.0, 71.0, 36.0, 37.0, 28.0, 17.0, 17.0, 11.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0], "bins": [-3.2109375, -3.120330810546875, -3.02972412109375, -2.939117431640625, -2.8485107421875, -2.757904052734375, -2.66729736328125, -2.576690673828125, -2.486083984375, -2.395477294921875, -2.30487060546875, -2.214263916015625, -2.1236572265625, -2.033050537109375, -1.94244384765625, -1.851837158203125, -1.76123046875, -1.670623779296875, -1.58001708984375, -1.489410400390625, -1.3988037109375, -1.308197021484375, -1.21759033203125, -1.126983642578125, -1.036376953125, -0.945770263671875, -0.85516357421875, -0.764556884765625, -0.6739501953125, -0.583343505859375, -0.49273681640625, -0.402130126953125, -0.3115234375, -0.220916748046875, -0.13031005859375, -0.039703369140625, 0.0509033203125, 0.141510009765625, 0.23211669921875, 0.322723388671875, 0.413330078125, 0.503936767578125, 0.59454345703125, 0.685150146484375, 0.7757568359375, 0.866363525390625, 0.95697021484375, 1.047576904296875, 1.13818359375, 1.228790283203125, 1.31939697265625, 1.410003662109375, 1.5006103515625, 1.591217041015625, 1.68182373046875, 1.772430419921875, 1.863037109375, 1.953643798828125, 2.04425048828125, 2.134857177734375, 2.2254638671875, 2.316070556640625, 2.40667724609375, 2.497283935546875, 2.587890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 14.0, 12.0, 18.0, 15.0, 24.0, 20.0, 25.0, 31.0, 37.0, 42.0, 36.0, 51.0, 49.0, 60.0, 126.0, 1792.0, 212.0, 83.0, 43.0, 30.0, 45.0, 33.0, 35.0, 26.0, 32.0, 27.0, 20.0, 14.0, 12.0, 13.0, 8.0, 11.0, 7.0, 4.0, 4.0, 7.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-19.328125, -18.78662109375, -18.2451171875, -17.70361328125, -17.162109375, -16.62060546875, -16.0791015625, -15.53759765625, -14.99609375, -14.45458984375, -13.9130859375, -13.37158203125, -12.830078125, -12.28857421875, -11.7470703125, -11.20556640625, -10.6640625, -10.12255859375, -9.5810546875, -9.03955078125, -8.498046875, -7.95654296875, -7.4150390625, -6.87353515625, -6.33203125, -5.79052734375, -5.2490234375, -4.70751953125, -4.166015625, -3.62451171875, -3.0830078125, -2.54150390625, -2.0, -1.45849609375, -0.9169921875, -0.37548828125, 0.166015625, 0.70751953125, 1.2490234375, 1.79052734375, 2.33203125, 2.87353515625, 3.4150390625, 3.95654296875, 4.498046875, 5.03955078125, 5.5810546875, 6.12255859375, 6.6640625, 7.20556640625, 7.7470703125, 8.28857421875, 8.830078125, 9.37158203125, 9.9130859375, 10.45458984375, 10.99609375, 11.53759765625, 12.0791015625, 12.62060546875, 13.162109375, 13.70361328125, 14.2451171875, 14.78662109375, 15.328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 2.0, 4.0, 11.0, 12.0, 7.0, 13.0, 19.0, 25.0, 24.0, 33.0, 44.0, 71.0, 82.0, 110.0, 197.0, 458.0, 1362.0, 28614.0, 3077900.0, 34100.0, 1427.0, 446.0, 208.0, 132.0, 84.0, 67.0, 48.0, 38.0, 25.0, 27.0, 25.0, 15.0, 16.0, 9.0, 12.0, 9.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.984375, -24.076416015625, -23.16845703125, -22.260498046875, -21.3525390625, -20.444580078125, -19.53662109375, -18.628662109375, -17.720703125, -16.812744140625, -15.90478515625, -14.996826171875, -14.0888671875, -13.180908203125, -12.27294921875, -11.364990234375, -10.45703125, -9.549072265625, -8.64111328125, -7.733154296875, -6.8251953125, -5.917236328125, -5.00927734375, -4.101318359375, -3.193359375, -2.285400390625, -1.37744140625, -0.469482421875, 0.4384765625, 1.346435546875, 2.25439453125, 3.162353515625, 4.0703125, 4.978271484375, 5.88623046875, 6.794189453125, 7.7021484375, 8.610107421875, 9.51806640625, 10.426025390625, 11.333984375, 12.241943359375, 13.14990234375, 14.057861328125, 14.9658203125, 15.873779296875, 16.78173828125, 17.689697265625, 18.59765625, 19.505615234375, 20.41357421875, 21.321533203125, 22.2294921875, 23.137451171875, 24.04541015625, 24.953369140625, 25.861328125, 26.769287109375, 27.67724609375, 28.585205078125, 29.4931640625, 30.401123046875, 31.30908203125, 32.217041015625, 33.125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 136.0, 732.0, 138.0, 4.0, 1.0, 2.0], "bins": [-185.34841918945312, -182.23292541503906, -179.11744689941406, -176.001953125, -172.88645935058594, -169.77098083496094, -166.65548706054688, -163.5399932861328, -160.4245147705078, -157.30902099609375, -154.19354248046875, -151.0780487060547, -147.96255493164062, -144.84707641601562, -141.73158264160156, -138.6160888671875, -135.5006103515625, -132.38511657714844, -129.26963806152344, -126.15414428710938, -123.03865814208984, -119.92317199707031, -116.80767822265625, -113.69219207763672, -110.57669067382812, -107.4612045288086, -104.34571075439453, -101.230224609375, -98.11473846435547, -94.99925231933594, -91.88375854492188, -88.76827239990234, -85.65279388427734, -82.53730773925781, -79.42181396484375, -76.30632781982422, -73.19084167480469, -70.07534790039062, -66.9598617553711, -63.84437561035156, -60.728885650634766, -57.61339569091797, -54.49790954589844, -51.38241958618164, -48.266929626464844, -45.15144348144531, -42.035953521728516, -38.92046356201172, -35.80497741699219, -32.68948745727539, -29.57400131225586, -26.458511352539062, -23.3430233001709, -20.227535247802734, -17.112045288085938, -13.996557235717773, -10.88106918334961, -7.765580654144287, -4.650092124938965, -1.5346031188964844, 1.5808849334716797, 4.696372985839844, 7.811862945556641, 10.927350997924805, 14.042839050292969]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 5.0, 6.0, 5.0, 7.0, 11.0, 19.0, 24.0, 15.0, 23.0, 40.0, 35.0, 33.0, 29.0, 42.0, 43.0, 40.0, 44.0, 39.0, 48.0, 57.0, 36.0, 46.0, 38.0, 47.0, 35.0, 30.0, 26.0, 26.0, 28.0, 21.0, 16.0, 16.0, 14.0, 10.0, 10.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.50587463378906, -45.75878143310547, -44.01169204711914, -42.26459884643555, -40.51750946044922, -38.770416259765625, -37.02332305908203, -35.2762336730957, -33.529144287109375, -31.782052993774414, -30.034961700439453, -28.28786849975586, -26.54077911376953, -24.793685913085938, -23.046594619750977, -21.299503326416016, -19.552410125732422, -17.80531883239746, -16.0582275390625, -14.311135292053223, -12.564043998718262, -10.8169527053833, -9.069860458374023, -7.3227691650390625, -5.575677871704102, -3.8285863399505615, -2.0814948081970215, -0.33440303802490234, 1.4126882553100586, 3.1597795486450195, 4.906871795654297, 6.653963088989258, 8.401054382324219, 10.14814567565918, 11.89523696899414, 13.642329216003418, 15.389420509338379, 17.136512756347656, 18.883604049682617, 20.630695343017578, 22.37778663635254, 24.1248779296875, 25.87196922302246, 27.619060516357422, 29.366153717041016, 31.113243103027344, 32.86033630371094, 34.60742950439453, 36.35451889038086, 38.10161209106445, 39.84870147705078, 41.595794677734375, 43.3428840637207, 45.0899772644043, 46.837066650390625, 48.58415985107422, 50.33125305175781, 52.078346252441406, 53.825435638427734, 55.57252883911133, 57.319618225097656, 59.06671142578125, 60.813804626464844, 62.56089401245117, 64.3079833984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 4.0, 9.0, 10.0, 13.0, 18.0, 12.0, 21.0, 20.0, 19.0, 23.0, 30.0, 34.0, 34.0, 32.0, 27.0, 38.0, 50.0, 46.0, 43.0, 47.0, 45.0, 43.0, 40.0, 21.0, 40.0, 37.0, 39.0, 24.0, 23.0, 21.0, 27.0, 17.0, 20.0, 13.0, 9.0, 16.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3203125, -5.17193603515625, -5.0235595703125, -4.87518310546875, -4.726806640625, -4.57843017578125, -4.4300537109375, -4.28167724609375, -4.13330078125, -3.98492431640625, -3.8365478515625, -3.68817138671875, -3.539794921875, -3.39141845703125, -3.2430419921875, -3.09466552734375, -2.9462890625, -2.79791259765625, -2.6495361328125, -2.50115966796875, -2.352783203125, -2.20440673828125, -2.0560302734375, -1.90765380859375, -1.75927734375, -1.61090087890625, -1.4625244140625, -1.31414794921875, -1.165771484375, -1.01739501953125, -0.8690185546875, -0.72064208984375, -0.572265625, -0.42388916015625, -0.2755126953125, -0.12713623046875, 0.021240234375, 0.16961669921875, 0.3179931640625, 0.46636962890625, 0.61474609375, 0.76312255859375, 0.9114990234375, 1.05987548828125, 1.208251953125, 1.35662841796875, 1.5050048828125, 1.65338134765625, 1.8017578125, 1.95013427734375, 2.0985107421875, 2.24688720703125, 2.395263671875, 2.54364013671875, 2.6920166015625, 2.84039306640625, 2.98876953125, 3.13714599609375, 3.2855224609375, 3.43389892578125, 3.582275390625, 3.73065185546875, 3.8790283203125, 4.02740478515625, 4.17578125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 6.0, 8.0, 10.0, 10.0, 11.0, 9.0, 9.0, 18.0, 19.0, 24.0, 18.0, 19.0, 18.0, 40.0, 33.0, 47.0, 74.0, 169.0, 691.0, 21952.0, 3468749.0, 697897.0, 3704.0, 309.0, 96.0, 41.0, 46.0, 32.0, 35.0, 27.0, 23.0, 21.0, 17.0, 25.0, 17.0, 14.0, 10.0, 12.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-35.15625, -34.20068359375, -33.2451171875, -32.28955078125, -31.333984375, -30.37841796875, -29.4228515625, -28.46728515625, -27.51171875, -26.55615234375, -25.6005859375, -24.64501953125, -23.689453125, -22.73388671875, -21.7783203125, -20.82275390625, -19.8671875, -18.91162109375, -17.9560546875, -17.00048828125, -16.044921875, -15.08935546875, -14.1337890625, -13.17822265625, -12.22265625, -11.26708984375, -10.3115234375, -9.35595703125, -8.400390625, -7.44482421875, -6.4892578125, -5.53369140625, -4.578125, -3.62255859375, -2.6669921875, -1.71142578125, -0.755859375, 0.19970703125, 1.1552734375, 2.11083984375, 3.06640625, 4.02197265625, 4.9775390625, 5.93310546875, 6.888671875, 7.84423828125, 8.7998046875, 9.75537109375, 10.7109375, 11.66650390625, 12.6220703125, 13.57763671875, 14.533203125, 15.48876953125, 16.4443359375, 17.39990234375, 18.35546875, 19.31103515625, 20.2666015625, 21.22216796875, 22.177734375, 23.13330078125, 24.0888671875, 25.04443359375, 26.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 14.0, 14.0, 24.0, 38.0, 40.0, 58.0, 97.0, 129.0, 213.0, 324.0, 436.0, 551.0, 573.0, 503.0, 333.0, 245.0, 163.0, 115.0, 62.0, 40.0, 25.0, 12.0, 24.0, 14.0, 4.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.21875, -21.6370849609375, -21.055419921875, -20.4737548828125, -19.89208984375, -19.3104248046875, -18.728759765625, -18.1470947265625, -17.5654296875, -16.9837646484375, -16.402099609375, -15.8204345703125, -15.23876953125, -14.6571044921875, -14.075439453125, -13.4937744140625, -12.912109375, -12.3304443359375, -11.748779296875, -11.1671142578125, -10.58544921875, -10.0037841796875, -9.422119140625, -8.8404541015625, -8.2587890625, -7.6771240234375, -7.095458984375, -6.5137939453125, -5.93212890625, -5.3504638671875, -4.768798828125, -4.1871337890625, -3.60546875, -3.0238037109375, -2.442138671875, -1.8604736328125, -1.27880859375, -0.6971435546875, -0.115478515625, 0.4661865234375, 1.0478515625, 1.6295166015625, 2.211181640625, 2.7928466796875, 3.37451171875, 3.9561767578125, 4.537841796875, 5.1195068359375, 5.701171875, 6.2828369140625, 6.864501953125, 7.4461669921875, 8.02783203125, 8.6094970703125, 9.191162109375, 9.7728271484375, 10.3544921875, 10.9361572265625, 11.517822265625, 12.0994873046875, 12.68115234375, 13.2628173828125, 13.844482421875, 14.4261474609375, 15.0078125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 13.0, 11.0, 11.0, 21.0, 42.0, 34.0, 50.0, 77.0, 143.0, 239.0, 394.0, 1065.0, 47171.0, 4133826.0, 9301.0, 841.0, 386.0, 198.0, 158.0, 91.0, 41.0, 39.0, 47.0, 35.0, 19.0, 8.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.9375, -74.4052734375, -71.873046875, -69.3408203125, -66.80859375, -64.2763671875, -61.744140625, -59.2119140625, -56.6796875, -54.1474609375, -51.615234375, -49.0830078125, -46.55078125, -44.0185546875, -41.486328125, -38.9541015625, -36.421875, -33.8896484375, -31.357421875, -28.8251953125, -26.29296875, -23.7607421875, -21.228515625, -18.6962890625, -16.1640625, -13.6318359375, -11.099609375, -8.5673828125, -6.03515625, -3.5029296875, -0.970703125, 1.5615234375, 4.09375, 6.6259765625, 9.158203125, 11.6904296875, 14.22265625, 16.7548828125, 19.287109375, 21.8193359375, 24.3515625, 26.8837890625, 29.416015625, 31.9482421875, 34.48046875, 37.0126953125, 39.544921875, 42.0771484375, 44.609375, 47.1416015625, 49.673828125, 52.2060546875, 54.73828125, 57.2705078125, 59.802734375, 62.3349609375, 64.8671875, 67.3994140625, 69.931640625, 72.4638671875, 74.99609375, 77.5283203125, 80.060546875, 82.5927734375, 85.125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 13.0, 221.0, 609.0, 162.0, 10.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.762542724609375, -45.41909408569336, -37.075645446777344, -28.732196807861328, -20.388748168945312, -12.045299530029297, -3.7018508911132812, 4.641597747802734, 12.98504638671875, 21.328495025634766, 29.67194366455078, 38.0153923034668, 46.35884094238281, 54.70228958129883, 63.045738220214844, 71.38919067382812, 79.73263549804688, 88.07608032226562, 96.4195327758789, 104.76298522949219, 113.10643005371094, 121.44987487792969, 129.7933349609375, 138.13677978515625, 146.480224609375, 154.82366943359375, 163.1671142578125, 171.5105743408203, 179.85401916503906, 188.1974639892578, 196.54092407226562, 204.88436889648438, 213.227783203125, 221.57122802734375, 229.9146728515625, 238.2581329345703, 246.60157775878906, 254.9450225830078, 263.2884826660156, 271.6319274902344, 279.9753723144531, 288.3188171386719, 296.6622619628906, 305.0057067871094, 313.34918212890625, 321.692626953125, 330.03607177734375, 338.3795166015625, 346.72296142578125, 355.06640625, 363.40985107421875, 371.7532958984375, 380.09674072265625, 388.4402160644531, 396.7836608886719, 405.1271057128906, 413.4705505371094, 421.8139953613281, 430.1574401855469, 438.5008850097656, 446.8443603515625, 455.18780517578125, 463.53125, 471.87469482421875, 480.2181396484375]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 9.0, 10.0, 9.0, 13.0, 17.0, 13.0, 17.0, 12.0, 16.0, 19.0, 25.0, 33.0, 25.0, 23.0, 34.0, 37.0, 37.0, 38.0, 34.0, 37.0, 41.0, 40.0, 51.0, 44.0, 35.0, 23.0, 36.0, 24.0, 26.0, 32.0, 20.0, 20.0, 22.0, 14.0, 24.0, 12.0, 9.0, 7.0, 10.0, 9.0, 5.0, 8.0, 2.0, 9.0, 1.0, 7.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-50.975921630859375, -49.38608169555664, -47.796241760253906, -46.20640182495117, -44.61656188964844, -43.02672576904297, -41.436885833740234, -39.8470458984375, -38.257205963134766, -36.66736602783203, -35.0775260925293, -33.48768615722656, -31.89784812927246, -30.308008193969727, -28.718170166015625, -27.12833023071289, -25.538490295410156, -23.948650360107422, -22.358810424804688, -20.768972396850586, -19.17913246154785, -17.589292526245117, -15.9994535446167, -14.409614562988281, -12.819774627685547, -11.229934692382812, -9.640095710754395, -8.050256729125977, -6.460416793823242, -4.870577335357666, -3.28073787689209, -1.6908988952636719, -0.1010589599609375, 1.4887804985046387, 3.078619956970215, 4.668459415435791, 6.258298873901367, 7.848138332366943, 9.43797779083252, 11.027816772460938, 12.617656707763672, 14.207496643066406, 15.797335624694824, 17.387174606323242, 18.977014541625977, 20.56685447692871, 22.156692504882812, 23.746532440185547, 25.33637237548828, 26.926212310791016, 28.51605224609375, 30.10589027404785, 31.695730209350586, 33.28556823730469, 34.87540817260742, 36.465248107910156, 38.05508804321289, 39.644927978515625, 41.23476791381836, 42.824607849121094, 44.41444396972656, 46.0042839050293, 47.59412384033203, 49.183963775634766, 50.7738037109375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 5.0, 13.0, 13.0, 13.0, 14.0, 13.0, 13.0, 16.0, 20.0, 20.0, 24.0, 25.0, 22.0, 35.0, 42.0, 35.0, 35.0, 41.0, 49.0, 42.0, 47.0, 30.0, 41.0, 31.0, 35.0, 33.0, 28.0, 29.0, 14.0, 23.0, 33.0, 31.0, 19.0, 17.0, 15.0, 17.0, 11.0, 3.0, 13.0, 12.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.859375, -4.71978759765625, -4.5802001953125, -4.44061279296875, -4.301025390625, -4.16143798828125, -4.0218505859375, -3.88226318359375, -3.74267578125, -3.60308837890625, -3.4635009765625, -3.32391357421875, -3.184326171875, -3.04473876953125, -2.9051513671875, -2.76556396484375, -2.6259765625, -2.48638916015625, -2.3468017578125, -2.20721435546875, -2.067626953125, -1.92803955078125, -1.7884521484375, -1.64886474609375, -1.50927734375, -1.36968994140625, -1.2301025390625, -1.09051513671875, -0.950927734375, -0.81134033203125, -0.6717529296875, -0.53216552734375, -0.392578125, -0.25299072265625, -0.1134033203125, 0.02618408203125, 0.165771484375, 0.30535888671875, 0.4449462890625, 0.58453369140625, 0.72412109375, 0.86370849609375, 1.0032958984375, 1.14288330078125, 1.282470703125, 1.42205810546875, 1.5616455078125, 1.70123291015625, 1.8408203125, 1.98040771484375, 2.1199951171875, 2.25958251953125, 2.399169921875, 2.53875732421875, 2.6783447265625, 2.81793212890625, 2.95751953125, 3.09710693359375, 3.2366943359375, 3.37628173828125, 3.515869140625, 3.65545654296875, 3.7950439453125, 3.93463134765625, 4.07421875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 9.0, 20.0, 20.0, 32.0, 45.0, 72.0, 90.0, 134.0, 225.0, 327.0, 486.0, 684.0, 1056.0, 1654.0, 2551.0, 3883.0, 5908.0, 9044.0, 13835.0, 21819.0, 34248.0, 54716.0, 90383.0, 158177.0, 253131.0, 156424.0, 90370.0, 53991.0, 33738.0, 21580.0, 13971.0, 8928.0, 5803.0, 3841.0, 2491.0, 1693.0, 1050.0, 702.0, 482.0, 302.0, 204.0, 134.0, 113.0, 65.0, 36.0, 32.0, 17.0, 13.0, 5.0, 9.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.72705078125, -0.7059707641601562, -0.6848907470703125, -0.6638107299804688, -0.642730712890625, -0.6216506958007812, -0.6005706787109375, -0.5794906616210938, -0.55841064453125, -0.5373306274414062, -0.5162506103515625, -0.49517059326171875, -0.474090576171875, -0.45301055908203125, -0.4319305419921875, -0.41085052490234375, -0.3897705078125, -0.36869049072265625, -0.3476104736328125, -0.32653045654296875, -0.305450439453125, -0.28437042236328125, -0.2632904052734375, -0.24221038818359375, -0.22113037109375, -0.20005035400390625, -0.1789703369140625, -0.15789031982421875, -0.136810302734375, -0.11573028564453125, -0.0946502685546875, -0.07357025146484375, -0.052490234375, -0.03141021728515625, -0.0103302001953125, 0.01074981689453125, 0.031829833984375, 0.05290985107421875, 0.0739898681640625, 0.09506988525390625, 0.11614990234375, 0.13722991943359375, 0.1583099365234375, 0.17938995361328125, 0.200469970703125, 0.22154998779296875, 0.2426300048828125, 0.26371002197265625, 0.2847900390625, 0.30587005615234375, 0.3269500732421875, 0.34803009033203125, 0.369110107421875, 0.39019012451171875, 0.4112701416015625, 0.43235015869140625, 0.45343017578125, 0.47451019287109375, 0.4955902099609375, 0.5166702270507812, 0.537750244140625, 0.5588302612304688, 0.5799102783203125, 0.6009902954101562, 0.6220703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 5.0, 6.0, 11.0, 12.0, 18.0, 17.0, 21.0, 21.0, 30.0, 17.0, 30.0, 49.0, 25.0, 29.0, 40.0, 41.0, 31.0, 31.0, 43.0, 1058.0, 56.0, 43.0, 42.0, 41.0, 37.0, 24.0, 23.0, 24.0, 31.0, 20.0, 24.0, 13.0, 24.0, 16.0, 14.0, 13.0, 9.0, 5.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.01953125, -2.926910400390625, -2.83428955078125, -2.741668701171875, -2.6490478515625, -2.556427001953125, -2.46380615234375, -2.371185302734375, -2.278564453125, -2.185943603515625, -2.09332275390625, -2.000701904296875, -1.9080810546875, -1.815460205078125, -1.72283935546875, -1.630218505859375, -1.53759765625, -1.444976806640625, -1.35235595703125, -1.259735107421875, -1.1671142578125, -1.074493408203125, -0.98187255859375, -0.889251708984375, -0.796630859375, -0.704010009765625, -0.61138916015625, -0.518768310546875, -0.4261474609375, -0.333526611328125, -0.24090576171875, -0.148284912109375, -0.0556640625, 0.036956787109375, 0.12957763671875, 0.222198486328125, 0.3148193359375, 0.407440185546875, 0.50006103515625, 0.592681884765625, 0.685302734375, 0.777923583984375, 0.87054443359375, 0.963165283203125, 1.0557861328125, 1.148406982421875, 1.24102783203125, 1.333648681640625, 1.42626953125, 1.518890380859375, 1.61151123046875, 1.704132080078125, 1.7967529296875, 1.889373779296875, 1.98199462890625, 2.074615478515625, 2.167236328125, 2.259857177734375, 2.35247802734375, 2.445098876953125, 2.5377197265625, 2.630340576171875, 2.72296142578125, 2.815582275390625, 2.908203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 7.0, 19.0, 13.0, 27.0, 41.0, 44.0, 78.0, 82.0, 125.0, 167.0, 238.0, 359.0, 492.0, 736.0, 999.0, 1494.0, 2130.0, 3015.0, 4333.0, 6350.0, 9573.0, 14247.0, 21562.0, 33481.0, 52430.0, 84586.0, 140006.0, 1282521.0, 167476.0, 97625.0, 60333.0, 38187.0, 24251.0, 16188.0, 10677.0, 7152.0, 4977.0, 3332.0, 2316.0, 1629.0, 1108.0, 815.0, 568.0, 412.0, 285.0, 190.0, 126.0, 94.0, 68.0, 47.0, 37.0, 24.0, 17.0, 16.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.5595703125, -0.5413131713867188, -0.5230560302734375, -0.5047988891601562, -0.486541748046875, -0.46828460693359375, -0.4500274658203125, -0.43177032470703125, -0.41351318359375, -0.39525604248046875, -0.3769989013671875, -0.35874176025390625, -0.340484619140625, -0.32222747802734375, -0.3039703369140625, -0.28571319580078125, -0.2674560546875, -0.24919891357421875, -0.2309417724609375, -0.21268463134765625, -0.194427490234375, -0.17617034912109375, -0.1579132080078125, -0.13965606689453125, -0.12139892578125, -0.10314178466796875, -0.0848846435546875, -0.06662750244140625, -0.048370361328125, -0.03011322021484375, -0.0118560791015625, 0.00640106201171875, 0.024658203125, 0.04291534423828125, 0.0611724853515625, 0.07942962646484375, 0.097686767578125, 0.11594390869140625, 0.1342010498046875, 0.15245819091796875, 0.17071533203125, 0.18897247314453125, 0.2072296142578125, 0.22548675537109375, 0.243743896484375, 0.26200103759765625, 0.2802581787109375, 0.29851531982421875, 0.3167724609375, 0.33502960205078125, 0.3532867431640625, 0.37154388427734375, 0.389801025390625, 0.40805816650390625, 0.4263153076171875, 0.44457244873046875, 0.46282958984375, 0.48108673095703125, 0.4993438720703125, 0.5176010131835938, 0.535858154296875, 0.5541152954101562, 0.5723724365234375, 0.5906295776367188, 0.60888671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 11.0, 13.0, 18.0, 26.0, 33.0, 38.0, 53.0, 93.0, 99.0, 116.0, 113.0, 95.0, 67.0, 59.0, 37.0, 26.0, 18.0, 19.0, 13.0, 13.0, 6.0, 1.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0017309188842773438, -0.0016883164644241333, -0.0016457140445709229, -0.0016031116247177124, -0.001560509204864502, -0.0015179067850112915, -0.001475304365158081, -0.0014327019453048706, -0.0013900995254516602, -0.0013474971055984497, -0.0013048946857452393, -0.0012622922658920288, -0.0012196898460388184, -0.001177087426185608, -0.0011344850063323975, -0.001091882586479187, -0.0010492801666259766, -0.0010066777467727661, -0.0009640753269195557, -0.0009214729070663452, -0.0008788704872131348, -0.0008362680673599243, -0.0007936656475067139, -0.0007510632276535034, -0.000708460807800293, -0.0006658583879470825, -0.0006232559680938721, -0.0005806535482406616, -0.0005380511283874512, -0.0004954487085342407, -0.0004528462886810303, -0.0004102438688278198, -0.0003676414489746094, -0.0003250390291213989, -0.0002824366092681885, -0.00023983418941497803, -0.00019723176956176758, -0.00015462934970855713, -0.00011202692985534668, -6.942451000213623e-05, -2.682209014892578e-05, 1.5780329704284668e-05, 5.838274955749512e-05, 0.00010098516941070557, 0.00014358758926391602, 0.00018619000911712646, 0.00022879242897033691, 0.00027139484882354736, 0.0003139972686767578, 0.00035659968852996826, 0.0003992021083831787, 0.00044180452823638916, 0.0004844069480895996, 0.0005270093679428101, 0.0005696117877960205, 0.000612214207649231, 0.0006548166275024414, 0.0006974190473556519, 0.0007400214672088623, 0.0007826238870620728, 0.0008252263069152832, 0.0008678287267684937, 0.0009104311466217041, 0.0009530335664749146, 0.000995635986328125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 4.0, 5.0, 16.0, 20.0, 19.0, 46.0, 42.0, 60.0, 138.0, 272.0, 867.0, 1043577.0, 2623.0, 429.0, 159.0, 111.0, 42.0, 27.0, 30.0, 19.0, 12.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0263671875, -0.025253772735595703, -0.024140357971191406, -0.02302694320678711, -0.021913528442382812, -0.020800113677978516, -0.01968669891357422, -0.018573284149169922, -0.017459869384765625, -0.016346454620361328, -0.015233039855957031, -0.014119625091552734, -0.013006210327148438, -0.01189279556274414, -0.010779380798339844, -0.009665966033935547, -0.00855255126953125, -0.007439136505126953, -0.006325721740722656, -0.005212306976318359, -0.0040988922119140625, -0.0029854774475097656, -0.0018720626831054688, -0.0007586479187011719, 0.000354766845703125, 0.0014681816101074219, 0.0025815963745117188, 0.0036950111389160156, 0.0048084259033203125, 0.005921840667724609, 0.007035255432128906, 0.008148670196533203, 0.0092620849609375, 0.010375499725341797, 0.011488914489746094, 0.01260232925415039, 0.013715744018554688, 0.014829158782958984, 0.01594257354736328, 0.017055988311767578, 0.018169403076171875, 0.019282817840576172, 0.02039623260498047, 0.021509647369384766, 0.022623062133789062, 0.02373647689819336, 0.024849891662597656, 0.025963306427001953, 0.02707672119140625, 0.028190135955810547, 0.029303550720214844, 0.03041696548461914, 0.03153038024902344, 0.032643795013427734, 0.03375720977783203, 0.03487062454223633, 0.035984039306640625, 0.03709745407104492, 0.03821086883544922, 0.039324283599853516, 0.04043769836425781, 0.04155111312866211, 0.042664527893066406, 0.0437779426574707, 0.044891357421875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 14.0, 92.0, 340.0, 431.0, 123.0, 14.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040240728412754834, -0.0003530175890773535, -0.00030362786492332816, -0.0002542381698731333, -0.00020484847482293844, -0.00015545877977274358, -0.00010606905561871827, -5.667936056852341e-05, -7.2896655183285475e-06, 4.2100036807823926e-05, 9.14897391339764e-05, 0.0001408794487360865, 0.00019026914378628135, 0.0002396588388364762, 0.0002890485629905015, 0.0003384382580406964, 0.00038782795309089124, 0.0004372176481410861, 0.0004866073722951114, 0.0005359970964491367, 0.0005853867623955011, 0.0006347764283418655, 0.0006841662107035518, 0.0007335558766499162, 0.0007829455425962806, 0.0008323352667503059, 0.0008817249326966703, 0.0009311146568506956, 0.00098050432279706, 0.0010298939887434244, 0.0010792837711051106, 0.001128673437051475, 0.0011780632194131613, 0.0012274528853595257, 0.001276842667721212, 0.0013262323336675763, 0.0013756219996139407, 0.001425011781975627, 0.0014744014479219913, 0.0015237911138683558, 0.0015731807798147202, 0.0016225704457610846, 0.0016719602281227708, 0.0017213498940691352, 0.0017707395600154996, 0.0018201293423771858, 0.0018695190083235502, 0.0019189086742699146, 0.0019682985730469227, 0.002017688238993287, 0.0020670779049396515, 0.0021164678037166595, 0.002165857469663024, 0.0022152471356093884, 0.0022646368015557528, 0.002314026467502117, 0.0023634161334484816, 0.002412805799394846, 0.0024621954653412104, 0.0025115851312875748, 0.002560975030064583, 0.0026103646960109472, 0.0026597543619573116, 0.002709144027903676, 0.0027585336938500404]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 13.0, 11.0, 11.0, 11.0, 13.0, 16.0, 19.0, 25.0, 26.0, 35.0, 38.0, 27.0, 35.0, 33.0, 28.0, 45.0, 41.0, 47.0, 45.0, 29.0, 36.0, 38.0, 34.0, 25.0, 32.0, 39.0, 20.0, 30.0, 29.0, 26.0, 21.0, 13.0, 18.0, 11.0, 10.0, 11.0, 7.0, 7.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.0005034804344177246, -0.0004883827641606331, -0.00047328509390354156, -0.00045818742364645004, -0.0004430897533893585, -0.000427992083132267, -0.0004128944128751755, -0.00039779674261808395, -0.00038269907236099243, -0.0003676014021039009, -0.0003525037318468094, -0.00033740606158971786, -0.00032230839133262634, -0.0003072107210755348, -0.0002921130508184433, -0.0002770153805613518, -0.00026191771030426025, -0.00024682004004716873, -0.0002317223697900772, -0.0002166246995329857, -0.00020152702927589417, -0.00018642935901880264, -0.00017133168876171112, -0.0001562340185046196, -0.00014113634824752808, -0.00012603867799043655, -0.00011094100773334503, -9.584333747625351e-05, -8.074566721916199e-05, -6.564799696207047e-05, -5.055032670497894e-05, -3.545265644788742e-05, -2.03549861907959e-05, -5.257315933704376e-06, 9.840354323387146e-06, 2.4938024580478668e-05, 4.003569483757019e-05, 5.513336509466171e-05, 7.023103535175323e-05, 8.532870560884476e-05, 0.00010042637586593628, 0.0001155240461230278, 0.00013062171638011932, 0.00014571938663721085, 0.00016081705689430237, 0.0001759147271513939, 0.0001910123974084854, 0.00020611006766557693, 0.00022120773792266846, 0.00023630540817975998, 0.0002514030784368515, 0.000266500748693943, 0.00028159841895103455, 0.00029669608920812607, 0.0003117937594652176, 0.0003268914297223091, 0.00034198909997940063, 0.00035708677023649216, 0.0003721844404935837, 0.0003872821107506752, 0.0004023797810077667, 0.00041747745126485825, 0.00043257512152194977, 0.0004476727917790413, 0.0004627704620361328]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 10.0, 5.0, 13.0, 13.0, 13.0, 14.0, 13.0, 13.0, 16.0, 20.0, 20.0, 24.0, 25.0, 22.0, 35.0, 42.0, 35.0, 35.0, 41.0, 49.0, 42.0, 47.0, 30.0, 41.0, 31.0, 35.0, 33.0, 28.0, 29.0, 14.0, 23.0, 33.0, 31.0, 19.0, 17.0, 15.0, 17.0, 11.0, 3.0, 13.0, 12.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.859375, -4.71978759765625, -4.5802001953125, -4.44061279296875, -4.301025390625, -4.16143798828125, -4.0218505859375, -3.88226318359375, -3.74267578125, -3.60308837890625, -3.4635009765625, -3.32391357421875, -3.184326171875, -3.04473876953125, -2.9051513671875, -2.76556396484375, -2.6259765625, -2.48638916015625, -2.3468017578125, -2.20721435546875, -2.067626953125, -1.92803955078125, -1.7884521484375, -1.64886474609375, -1.50927734375, -1.36968994140625, -1.2301025390625, -1.09051513671875, -0.950927734375, -0.81134033203125, -0.6717529296875, -0.53216552734375, -0.392578125, -0.25299072265625, -0.1134033203125, 0.02618408203125, 0.165771484375, 0.30535888671875, 0.4449462890625, 0.58453369140625, 0.72412109375, 0.86370849609375, 1.0032958984375, 1.14288330078125, 1.282470703125, 1.42205810546875, 1.5616455078125, 1.70123291015625, 1.8408203125, 1.98040771484375, 2.1199951171875, 2.25958251953125, 2.399169921875, 2.53875732421875, 2.6783447265625, 2.81793212890625, 2.95751953125, 3.09710693359375, 3.2366943359375, 3.37628173828125, 3.515869140625, 3.65545654296875, 3.7950439453125, 3.93463134765625, 4.07421875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 15.0, 15.0, 19.0, 22.0, 23.0, 54.0, 83.0, 121.0, 169.0, 201.0, 303.0, 530.0, 794.0, 1285.0, 2304.0, 4240.0, 8877.0, 22108.0, 66343.0, 235451.0, 464861.0, 161390.0, 46914.0, 16410.0, 7165.0, 3479.0, 1951.0, 1221.0, 732.0, 477.0, 311.0, 206.0, 153.0, 85.0, 66.0, 52.0, 31.0, 17.0, 13.0, 14.0, 10.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0], "bins": [-3.802734375, -3.692047119140625, -3.58135986328125, -3.470672607421875, -3.3599853515625, -3.249298095703125, -3.13861083984375, -3.027923583984375, -2.917236328125, -2.806549072265625, -2.69586181640625, -2.585174560546875, -2.4744873046875, -2.363800048828125, -2.25311279296875, -2.142425537109375, -2.03173828125, -1.921051025390625, -1.81036376953125, -1.699676513671875, -1.5889892578125, -1.478302001953125, -1.36761474609375, -1.256927490234375, -1.146240234375, -1.035552978515625, -0.92486572265625, -0.814178466796875, -0.7034912109375, -0.592803955078125, -0.48211669921875, -0.371429443359375, -0.2607421875, -0.150054931640625, -0.03936767578125, 0.071319580078125, 0.1820068359375, 0.292694091796875, 0.40338134765625, 0.514068603515625, 0.624755859375, 0.735443115234375, 0.84613037109375, 0.956817626953125, 1.0675048828125, 1.178192138671875, 1.28887939453125, 1.399566650390625, 1.51025390625, 1.620941162109375, 1.73162841796875, 1.842315673828125, 1.9530029296875, 2.063690185546875, 2.17437744140625, 2.285064697265625, 2.395751953125, 2.506439208984375, 2.61712646484375, 2.727813720703125, 2.8385009765625, 2.949188232421875, 3.05987548828125, 3.170562744140625, 3.28125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 7.0, 16.0, 23.0, 18.0, 32.0, 35.0, 35.0, 33.0, 47.0, 39.0, 50.0, 58.0, 85.0, 1765.0, 322.0, 80.0, 54.0, 62.0, 36.0, 37.0, 30.0, 28.0, 41.0, 21.0, 17.0, 15.0, 8.0, 5.0, 8.0, 9.0, 0.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.265625, -17.60986328125, -16.9541015625, -16.29833984375, -15.642578125, -14.98681640625, -14.3310546875, -13.67529296875, -13.01953125, -12.36376953125, -11.7080078125, -11.05224609375, -10.396484375, -9.74072265625, -9.0849609375, -8.42919921875, -7.7734375, -7.11767578125, -6.4619140625, -5.80615234375, -5.150390625, -4.49462890625, -3.8388671875, -3.18310546875, -2.52734375, -1.87158203125, -1.2158203125, -0.56005859375, 0.095703125, 0.75146484375, 1.4072265625, 2.06298828125, 2.71875, 3.37451171875, 4.0302734375, 4.68603515625, 5.341796875, 5.99755859375, 6.6533203125, 7.30908203125, 7.96484375, 8.62060546875, 9.2763671875, 9.93212890625, 10.587890625, 11.24365234375, 11.8994140625, 12.55517578125, 13.2109375, 13.86669921875, 14.5224609375, 15.17822265625, 15.833984375, 16.48974609375, 17.1455078125, 17.80126953125, 18.45703125, 19.11279296875, 19.7685546875, 20.42431640625, 21.080078125, 21.73583984375, 22.3916015625, 23.04736328125, 23.703125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 0.0, 6.0, 8.0, 9.0, 6.0, 11.0, 18.0, 21.0, 35.0, 37.0, 52.0, 65.0, 90.0, 140.0, 337.0, 876.0, 5662.0, 2975871.0, 158586.0, 2463.0, 628.0, 268.0, 139.0, 97.0, 59.0, 41.0, 48.0, 37.0, 23.0, 16.0, 13.0, 9.0, 9.0, 7.0, 10.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.0625, -38.001953125, -36.94140625, -35.880859375, -34.8203125, -33.759765625, -32.69921875, -31.638671875, -30.578125, -29.517578125, -28.45703125, -27.396484375, -26.3359375, -25.275390625, -24.21484375, -23.154296875, -22.09375, -21.033203125, -19.97265625, -18.912109375, -17.8515625, -16.791015625, -15.73046875, -14.669921875, -13.609375, -12.548828125, -11.48828125, -10.427734375, -9.3671875, -8.306640625, -7.24609375, -6.185546875, -5.125, -4.064453125, -3.00390625, -1.943359375, -0.8828125, 0.177734375, 1.23828125, 2.298828125, 3.359375, 4.419921875, 5.48046875, 6.541015625, 7.6015625, 8.662109375, 9.72265625, 10.783203125, 11.84375, 12.904296875, 13.96484375, 15.025390625, 16.0859375, 17.146484375, 18.20703125, 19.267578125, 20.328125, 21.388671875, 22.44921875, 23.509765625, 24.5703125, 25.630859375, 26.69140625, 27.751953125, 28.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 821.0, 198.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.5876693725586, -69.7220230102539, -61.85638427734375, -53.99073791503906, -46.125099182128906, -38.25945281982422, -30.393810272216797, -22.528167724609375, -14.662525177001953, -6.796882152557373, 1.068760871887207, 8.934404373168945, 16.800046920776367, 24.665691375732422, 32.531333923339844, 40.396976470947266, 48.26261901855469, 56.12826156616211, 63.99390411376953, 71.85955047607422, 79.72518920898438, 87.59083557128906, 95.45648193359375, 103.3221206665039, 111.18775939941406, 119.05340576171875, 126.9190444946289, 134.78468322753906, 142.65032958984375, 150.51597595214844, 158.38162231445312, 166.24725341796875, 174.11289978027344, 181.97854614257812, 189.8441925048828, 197.70982360839844, 205.57546997070312, 213.4411163330078, 221.3067626953125, 229.17239379882812, 237.0380401611328, 244.9036865234375, 252.7693328857422, 260.6349792480469, 268.5006103515625, 276.36627197265625, 284.2319030761719, 292.0975341796875, 299.96319580078125, 307.8288269042969, 315.6944885253906, 323.56011962890625, 331.42578125, 339.2914123535156, 347.15704345703125, 355.022705078125, 362.8883361816406, 370.75396728515625, 378.61962890625, 386.4852600097656, 394.3509216308594, 402.216552734375, 410.0821838378906, 417.9478454589844, 425.8134765625]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 7.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 12.0, 19.0, 12.0, 16.0, 19.0, 19.0, 14.0, 25.0, 21.0, 31.0, 23.0, 26.0, 35.0, 32.0, 32.0, 37.0, 35.0, 47.0, 38.0, 31.0, 39.0, 29.0, 35.0, 38.0, 37.0, 33.0, 27.0, 23.0, 18.0, 25.0, 23.0, 22.0, 22.0, 17.0, 12.0, 13.0, 6.0, 11.0, 5.0, 2.0, 5.0, 8.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.917457580566406, -44.3903923034668, -42.86332702636719, -41.336265563964844, -39.809200286865234, -38.282135009765625, -36.755069732666016, -35.228004455566406, -33.70094299316406, -32.17387771606445, -30.646814346313477, -29.119749069213867, -27.59268569946289, -26.06562042236328, -24.538555145263672, -23.011489868164062, -21.484424591064453, -19.957359313964844, -18.430295944213867, -16.903230667114258, -15.376166343688965, -13.849102020263672, -12.322036743164062, -10.79497241973877, -9.267908096313477, -7.740843772888184, -6.213778972625732, -4.686714172363281, -3.1596498489379883, -1.6325855255126953, -0.10552024841308594, 1.421544075012207, 2.9486045837402344, 4.475668907165527, 6.0027337074279785, 7.52979850769043, 9.056862831115723, 10.583927154541016, 12.110992431640625, 13.638056755065918, 15.165121078491211, 16.69218635559082, 18.219249725341797, 19.746315002441406, 21.273380279541016, 22.800443649291992, 24.3275089263916, 25.854572296142578, 27.381637573242188, 28.908702850341797, 30.435766220092773, 31.962831497192383, 33.48989486694336, 35.01696014404297, 36.54402542114258, 38.07109069824219, 39.59815216064453, 41.12521743774414, 42.65228271484375, 44.179344177246094, 45.7064094543457, 47.23347473144531, 48.76054000854492, 50.28760528564453, 51.81467056274414]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 15.0, 11.0, 9.0, 15.0, 19.0, 11.0, 29.0, 24.0, 14.0, 25.0, 34.0, 31.0, 42.0, 39.0, 35.0, 41.0, 46.0, 35.0, 43.0, 36.0, 40.0, 27.0, 27.0, 33.0, 29.0, 21.0, 24.0, 29.0, 28.0, 28.0, 19.0, 16.0, 17.0, 8.0, 13.0, 9.0, 11.0, 9.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.91015625, -4.771148681640625, -4.63214111328125, -4.493133544921875, -4.3541259765625, -4.215118408203125, -4.07611083984375, -3.937103271484375, -3.798095703125, -3.659088134765625, -3.52008056640625, -3.381072998046875, -3.2420654296875, -3.103057861328125, -2.96405029296875, -2.825042724609375, -2.68603515625, -2.547027587890625, -2.40802001953125, -2.269012451171875, -2.1300048828125, -1.990997314453125, -1.85198974609375, -1.712982177734375, -1.573974609375, -1.434967041015625, -1.29595947265625, -1.156951904296875, -1.0179443359375, -0.878936767578125, -0.73992919921875, -0.600921630859375, -0.4619140625, -0.322906494140625, -0.18389892578125, -0.044891357421875, 0.0941162109375, 0.233123779296875, 0.37213134765625, 0.511138916015625, 0.650146484375, 0.789154052734375, 0.92816162109375, 1.067169189453125, 1.2061767578125, 1.345184326171875, 1.48419189453125, 1.623199462890625, 1.76220703125, 1.901214599609375, 2.04022216796875, 2.179229736328125, 2.3182373046875, 2.457244873046875, 2.59625244140625, 2.735260009765625, 2.874267578125, 3.013275146484375, 3.15228271484375, 3.291290283203125, 3.4302978515625, 3.569305419921875, 3.70831298828125, 3.847320556640625, 3.986328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 10.0, 4.0, 9.0, 15.0, 17.0, 13.0, 29.0, 41.0, 40.0, 75.0, 118.0, 171.0, 343.0, 698.0, 2309.0, 9469.0, 50353.0, 377279.0, 1925036.0, 1523358.0, 257851.0, 36670.0, 7123.0, 1850.0, 620.0, 282.0, 163.0, 90.0, 63.0, 37.0, 24.0, 26.0, 20.0, 16.0, 13.0, 10.0, 7.0, 2.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-11.453125, -11.15093994140625, -10.8487548828125, -10.54656982421875, -10.244384765625, -9.94219970703125, -9.6400146484375, -9.33782958984375, -9.03564453125, -8.73345947265625, -8.4312744140625, -8.12908935546875, -7.826904296875, -7.52471923828125, -7.2225341796875, -6.92034912109375, -6.6181640625, -6.31597900390625, -6.0137939453125, -5.71160888671875, -5.409423828125, -5.10723876953125, -4.8050537109375, -4.50286865234375, -4.20068359375, -3.89849853515625, -3.5963134765625, -3.29412841796875, -2.991943359375, -2.68975830078125, -2.3875732421875, -2.08538818359375, -1.783203125, -1.48101806640625, -1.1788330078125, -0.87664794921875, -0.574462890625, -0.27227783203125, 0.0299072265625, 0.33209228515625, 0.63427734375, 0.93646240234375, 1.2386474609375, 1.54083251953125, 1.843017578125, 2.14520263671875, 2.4473876953125, 2.74957275390625, 3.0517578125, 3.35394287109375, 3.6561279296875, 3.95831298828125, 4.260498046875, 4.56268310546875, 4.8648681640625, 5.16705322265625, 5.46923828125, 5.77142333984375, 6.0736083984375, 6.37579345703125, 6.677978515625, 6.98016357421875, 7.2823486328125, 7.58453369140625, 7.88671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 5.0, 4.0, 11.0, 7.0, 9.0, 18.0, 11.0, 27.0, 41.0, 54.0, 75.0, 103.0, 147.0, 231.0, 338.0, 447.0, 525.0, 540.0, 448.0, 319.0, 222.0, 149.0, 97.0, 67.0, 52.0, 45.0, 35.0, 17.0, 9.0, 10.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.8125, -19.260986328125, -18.70947265625, -18.157958984375, -17.6064453125, -17.054931640625, -16.50341796875, -15.951904296875, -15.400390625, -14.848876953125, -14.29736328125, -13.745849609375, -13.1943359375, -12.642822265625, -12.09130859375, -11.539794921875, -10.98828125, -10.436767578125, -9.88525390625, -9.333740234375, -8.7822265625, -8.230712890625, -7.67919921875, -7.127685546875, -6.576171875, -6.024658203125, -5.47314453125, -4.921630859375, -4.3701171875, -3.818603515625, -3.26708984375, -2.715576171875, -2.1640625, -1.612548828125, -1.06103515625, -0.509521484375, 0.0419921875, 0.593505859375, 1.14501953125, 1.696533203125, 2.248046875, 2.799560546875, 3.35107421875, 3.902587890625, 4.4541015625, 5.005615234375, 5.55712890625, 6.108642578125, 6.66015625, 7.211669921875, 7.76318359375, 8.314697265625, 8.8662109375, 9.417724609375, 9.96923828125, 10.520751953125, 11.072265625, 11.623779296875, 12.17529296875, 12.726806640625, 13.2783203125, 13.829833984375, 14.38134765625, 14.932861328125, 15.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 9.0, 9.0, 12.0, 13.0, 23.0, 40.0, 51.0, 71.0, 106.0, 178.0, 271.0, 746.0, 11947.0, 4138351.0, 40511.0, 1066.0, 309.0, 180.0, 111.0, 83.0, 51.0, 49.0, 23.0, 16.0, 10.0, 16.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.28515625, -63.6953125, -61.10546875, -58.515625, -55.92578125, -53.3359375, -50.74609375, -48.15625, -45.56640625, -42.9765625, -40.38671875, -37.796875, -35.20703125, -32.6171875, -30.02734375, -27.4375, -24.84765625, -22.2578125, -19.66796875, -17.078125, -14.48828125, -11.8984375, -9.30859375, -6.71875, -4.12890625, -1.5390625, 1.05078125, 3.640625, 6.23046875, 8.8203125, 11.41015625, 14.0, 16.58984375, 19.1796875, 21.76953125, 24.359375, 26.94921875, 29.5390625, 32.12890625, 34.71875, 37.30859375, 39.8984375, 42.48828125, 45.078125, 47.66796875, 50.2578125, 52.84765625, 55.4375, 58.02734375, 60.6171875, 63.20703125, 65.796875, 68.38671875, 70.9765625, 73.56640625, 76.15625, 78.74609375, 81.3359375, 83.92578125, 86.515625, 89.10546875, 91.6953125, 94.28515625, 96.875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 21.0, 81.0, 290.0, 405.0, 176.0, 35.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.4805145263672, -160.97824096679688, -155.47598266601562, -149.9737091064453, -144.47145080566406, -138.96917724609375, -133.4669189453125, -127.96464538574219, -122.4623794555664, -116.96011352539062, -111.45784759521484, -105.95558166503906, -100.45330810546875, -94.9510498046875, -89.44877624511719, -83.9465103149414, -78.44424438476562, -72.94197845458984, -67.43971252441406, -61.937442779541016, -56.435176849365234, -50.93291091918945, -45.430641174316406, -39.928375244140625, -34.426109313964844, -28.923843383789062, -23.42157554626465, -17.919307708740234, -12.417041778564453, -6.914775848388672, -1.412506103515625, 4.089759826660156, 9.592041015625, 15.094307899475098, 20.596574783325195, 26.09884262084961, 31.60110855102539, 37.10337448120117, 42.60564422607422, 48.10791015625, 53.61017608642578, 59.11244201660156, 64.61470794677734, 70.11697387695312, 75.61924743652344, 81.12150573730469, 86.623779296875, 92.12604522705078, 97.62831115722656, 103.13057708740234, 108.63284301757812, 114.13511657714844, 119.63737487792969, 125.1396484375, 130.64190673828125, 136.14418029785156, 141.64645385742188, 147.1487274169922, 152.65098571777344, 158.15325927734375, 163.655517578125, 169.1577911376953, 174.66006469726562, 180.16232299804688, 185.66458129882812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 5.0, 2.0, 10.0, 6.0, 6.0, 9.0, 11.0, 14.0, 17.0, 12.0, 19.0, 22.0, 21.0, 27.0, 27.0, 19.0, 28.0, 37.0, 23.0, 28.0, 36.0, 37.0, 36.0, 28.0, 28.0, 44.0, 27.0, 31.0, 25.0, 39.0, 35.0, 33.0, 28.0, 22.0, 28.0, 25.0, 27.0, 19.0, 14.0, 12.0, 6.0, 15.0, 13.0, 9.0, 13.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.52936553955078, -40.158119201660156, -38.7868766784668, -37.41563034057617, -36.04438781738281, -34.67314147949219, -33.30189514160156, -31.930652618408203, -30.55940818786621, -29.18816375732422, -27.816919326782227, -26.445674896240234, -25.07442855834961, -23.70318603515625, -22.331939697265625, -20.960695266723633, -19.58945083618164, -18.21820640563965, -16.846961975097656, -15.475716590881348, -14.104472160339355, -12.733227729797363, -11.361982345581055, -9.990737915039062, -8.61949348449707, -7.248249053955078, -5.877004146575928, -4.505759239196777, -3.134514808654785, -1.763270378112793, -0.3920249938964844, 0.9792194366455078, 2.3504638671875, 3.7217085361480713, 5.092953205108643, 6.464198112487793, 7.835442543029785, 9.206686973571777, 10.577932357788086, 11.949176788330078, 13.32042121887207, 14.691665649414062, 16.062910079956055, 17.434154510498047, 18.805400848388672, 20.17664337158203, 21.547889709472656, 22.91913414001465, 24.29037857055664, 25.661623001098633, 27.032867431640625, 28.40411376953125, 29.77535629272461, 31.146602630615234, 32.517845153808594, 33.88909149169922, 35.260337829589844, 36.63158416748047, 38.00282669067383, 39.37407302856445, 40.74531555175781, 42.11656188964844, 43.48780822753906, 44.85905075073242, 46.23029327392578]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 14.0, 11.0, 12.0, 22.0, 21.0, 20.0, 12.0, 26.0, 23.0, 34.0, 33.0, 32.0, 28.0, 39.0, 37.0, 41.0, 42.0, 42.0, 47.0, 34.0, 40.0, 46.0, 38.0, 37.0, 29.0, 22.0, 28.0, 26.0, 20.0, 15.0, 32.0, 21.0, 15.0, 15.0, 6.0, 5.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.51953125, -5.36383056640625, -5.2081298828125, -5.05242919921875, -4.896728515625, -4.74102783203125, -4.5853271484375, -4.42962646484375, -4.27392578125, -4.11822509765625, -3.9625244140625, -3.80682373046875, -3.651123046875, -3.49542236328125, -3.3397216796875, -3.18402099609375, -3.0283203125, -2.87261962890625, -2.7169189453125, -2.56121826171875, -2.405517578125, -2.24981689453125, -2.0941162109375, -1.93841552734375, -1.78271484375, -1.62701416015625, -1.4713134765625, -1.31561279296875, -1.159912109375, -1.00421142578125, -0.8485107421875, -0.69281005859375, -0.537109375, -0.38140869140625, -0.2257080078125, -0.07000732421875, 0.085693359375, 0.24139404296875, 0.3970947265625, 0.55279541015625, 0.70849609375, 0.86419677734375, 1.0198974609375, 1.17559814453125, 1.331298828125, 1.48699951171875, 1.6427001953125, 1.79840087890625, 1.9541015625, 2.10980224609375, 2.2655029296875, 2.42120361328125, 2.576904296875, 2.73260498046875, 2.8883056640625, 3.04400634765625, 3.19970703125, 3.35540771484375, 3.5111083984375, 3.66680908203125, 3.822509765625, 3.97821044921875, 4.1339111328125, 4.28961181640625, 4.4453125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 9.0, 14.0, 20.0, 26.0, 36.0, 50.0, 91.0, 109.0, 145.0, 234.0, 399.0, 592.0, 971.0, 1462.0, 2274.0, 3525.0, 5562.0, 8898.0, 13463.0, 21596.0, 34600.0, 57718.0, 102102.0, 192717.0, 263774.0, 140797.0, 77268.0, 44548.0, 27645.0, 17233.0, 11086.0, 7120.0, 4398.0, 2832.0, 1823.0, 1252.0, 755.0, 507.0, 319.0, 196.0, 131.0, 77.0, 61.0, 43.0, 34.0, 19.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.8291015625, -0.8055877685546875, -0.782073974609375, -0.7585601806640625, -0.73504638671875, -0.7115325927734375, -0.688018798828125, -0.6645050048828125, -0.6409912109375, -0.6174774169921875, -0.593963623046875, -0.5704498291015625, -0.54693603515625, -0.5234222412109375, -0.499908447265625, -0.4763946533203125, -0.452880859375, -0.4293670654296875, -0.405853271484375, -0.3823394775390625, -0.35882568359375, -0.3353118896484375, -0.311798095703125, -0.2882843017578125, -0.2647705078125, -0.2412567138671875, -0.217742919921875, -0.1942291259765625, -0.17071533203125, -0.1472015380859375, -0.123687744140625, -0.1001739501953125, -0.07666015625, -0.0531463623046875, -0.029632568359375, -0.0061187744140625, 0.01739501953125, 0.0409088134765625, 0.064422607421875, 0.0879364013671875, 0.1114501953125, 0.1349639892578125, 0.158477783203125, 0.1819915771484375, 0.20550537109375, 0.2290191650390625, 0.252532958984375, 0.2760467529296875, 0.299560546875, 0.3230743408203125, 0.346588134765625, 0.3701019287109375, 0.39361572265625, 0.4171295166015625, 0.440643310546875, 0.4641571044921875, 0.4876708984375, 0.5111846923828125, 0.534698486328125, 0.5582122802734375, 0.58172607421875, 0.6052398681640625, 0.628753662109375, 0.6522674560546875, 0.67578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 1.0, 7.0, 13.0, 14.0, 17.0, 24.0, 18.0, 25.0, 27.0, 22.0, 31.0, 32.0, 33.0, 34.0, 35.0, 29.0, 32.0, 46.0, 31.0, 1066.0, 36.0, 46.0, 37.0, 34.0, 18.0, 35.0, 24.0, 24.0, 31.0, 36.0, 28.0, 18.0, 14.0, 14.0, 15.0, 14.0, 11.0, 8.0, 8.0, 9.0, 5.0, 4.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.60400390625, -2.5087890625, -2.41357421875, -2.318359375, -2.22314453125, -2.1279296875, -2.03271484375, -1.9375, -1.84228515625, -1.7470703125, -1.65185546875, -1.556640625, -1.46142578125, -1.3662109375, -1.27099609375, -1.17578125, -1.08056640625, -0.9853515625, -0.89013671875, -0.794921875, -0.69970703125, -0.6044921875, -0.50927734375, -0.4140625, -0.31884765625, -0.2236328125, -0.12841796875, -0.033203125, 0.06201171875, 0.1572265625, 0.25244140625, 0.34765625, 0.44287109375, 0.5380859375, 0.63330078125, 0.728515625, 0.82373046875, 0.9189453125, 1.01416015625, 1.109375, 1.20458984375, 1.2998046875, 1.39501953125, 1.490234375, 1.58544921875, 1.6806640625, 1.77587890625, 1.87109375, 1.96630859375, 2.0615234375, 2.15673828125, 2.251953125, 2.34716796875, 2.4423828125, 2.53759765625, 2.6328125, 2.72802734375, 2.8232421875, 2.91845703125, 3.013671875, 3.10888671875, 3.2041015625, 3.29931640625, 3.39453125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 15.0, 20.0, 27.0, 36.0, 46.0, 82.0, 149.0, 191.0, 293.0, 384.0, 546.0, 847.0, 1220.0, 1848.0, 2870.0, 4233.0, 6209.0, 9464.0, 14391.0, 21997.0, 33912.0, 55072.0, 91227.0, 155423.0, 1287457.0, 159744.0, 92838.0, 55958.0, 34737.0, 22372.0, 14286.0, 9636.0, 6339.0, 4309.0, 2993.0, 1924.0, 1279.0, 904.0, 617.0, 376.0, 263.0, 184.0, 130.0, 85.0, 61.0, 47.0, 34.0, 22.0, 12.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.677734375, -0.6575164794921875, -0.637298583984375, -0.6170806884765625, -0.59686279296875, -0.5766448974609375, -0.556427001953125, -0.5362091064453125, -0.5159912109375, -0.4957733154296875, -0.475555419921875, -0.4553375244140625, -0.43511962890625, -0.4149017333984375, -0.394683837890625, -0.3744659423828125, -0.354248046875, -0.3340301513671875, -0.313812255859375, -0.2935943603515625, -0.27337646484375, -0.2531585693359375, -0.232940673828125, -0.2127227783203125, -0.1925048828125, -0.1722869873046875, -0.152069091796875, -0.1318511962890625, -0.11163330078125, -0.0914154052734375, -0.071197509765625, -0.0509796142578125, -0.03076171875, -0.0105438232421875, 0.009674072265625, 0.0298919677734375, 0.05010986328125, 0.0703277587890625, 0.090545654296875, 0.1107635498046875, 0.1309814453125, 0.1511993408203125, 0.171417236328125, 0.1916351318359375, 0.21185302734375, 0.2320709228515625, 0.252288818359375, 0.2725067138671875, 0.292724609375, 0.3129425048828125, 0.333160400390625, 0.3533782958984375, 0.37359619140625, 0.3938140869140625, 0.414031982421875, 0.4342498779296875, 0.4544677734375, 0.4746856689453125, 0.494903564453125, 0.5151214599609375, 0.53533935546875, 0.5555572509765625, 0.575775146484375, 0.5959930419921875, 0.6162109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 7.0, 16.0, 17.0, 20.0, 38.0, 32.0, 47.0, 78.0, 79.0, 109.0, 111.0, 84.0, 73.0, 68.0, 45.0, 48.0, 37.0, 21.0, 21.0, 8.0, 12.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015325546264648438, -0.001490578055381775, -0.001448601484298706, -0.0014066249132156372, -0.0013646483421325684, -0.0013226717710494995, -0.0012806951999664307, -0.0012387186288833618, -0.001196742057800293, -0.0011547654867172241, -0.0011127889156341553, -0.0010708123445510864, -0.0010288357734680176, -0.0009868592023849487, -0.0009448826313018799, -0.000902906060218811, -0.0008609294891357422, -0.0008189529180526733, -0.0007769763469696045, -0.0007349997758865356, -0.0006930232048034668, -0.000651046633720398, -0.0006090700626373291, -0.0005670934915542603, -0.0005251169204711914, -0.00048314034938812256, -0.0004411637783050537, -0.00039918720722198486, -0.000357210636138916, -0.00031523406505584717, -0.0002732574939727783, -0.00023128092288970947, -0.00018930435180664062, -0.00014732778072357178, -0.00010535120964050293, -6.337463855743408e-05, -2.1398067474365234e-05, 2.0578503608703613e-05, 6.255507469177246e-05, 0.00010453164577484131, 0.00014650821685791016, 0.000188484787940979, 0.00023046135902404785, 0.0002724379301071167, 0.00031441450119018555, 0.0003563910722732544, 0.00039836764335632324, 0.0004403442144393921, 0.00048232078552246094, 0.0005242973566055298, 0.0005662739276885986, 0.0006082504987716675, 0.0006502270698547363, 0.0006922036409378052, 0.000734180212020874, 0.0007761567831039429, 0.0008181333541870117, 0.0008601099252700806, 0.0009020864963531494, 0.0009440630674362183, 0.0009860396385192871, 0.001028016209602356, 0.0010699927806854248, 0.0011119693517684937, 0.0011539459228515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 4.0, 10.0, 15.0, 19.0, 32.0, 43.0, 46.0, 77.0, 178.0, 529.0, 677854.0, 368773.0, 543.0, 170.0, 72.0, 44.0, 33.0, 34.0, 16.0, 19.0, 12.0, 9.0, 6.0, 8.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.03384113311767578, -0.03258705139160156, -0.031332969665527344, -0.030078887939453125, -0.028824806213378906, -0.027570724487304688, -0.02631664276123047, -0.02506256103515625, -0.02380847930908203, -0.022554397583007812, -0.021300315856933594, -0.020046234130859375, -0.018792152404785156, -0.017538070678710938, -0.01628398895263672, -0.0150299072265625, -0.013775825500488281, -0.012521743774414062, -0.011267662048339844, -0.010013580322265625, -0.008759498596191406, -0.0075054168701171875, -0.006251335144042969, -0.00499725341796875, -0.0037431716918945312, -0.0024890899658203125, -0.0012350082397460938, 1.9073486328125e-05, 0.0012731552124023438, 0.0025272369384765625, 0.0037813186645507812, 0.005035400390625, 0.006289482116699219, 0.0075435638427734375, 0.008797645568847656, 0.010051727294921875, 0.011305809020996094, 0.012559890747070312, 0.013813972473144531, 0.01506805419921875, 0.01632213592529297, 0.017576217651367188, 0.018830299377441406, 0.020084381103515625, 0.021338462829589844, 0.022592544555664062, 0.02384662628173828, 0.0251007080078125, 0.02635478973388672, 0.027608871459960938, 0.028862953186035156, 0.030117034912109375, 0.031371116638183594, 0.03262519836425781, 0.03387928009033203, 0.03513336181640625, 0.03638744354248047, 0.03764152526855469, 0.038895606994628906, 0.040149688720703125, 0.041403770446777344, 0.04265785217285156, 0.04391193389892578, 0.045166015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 67.0, 638.0, 297.0, 14.0], "bins": [-0.005053472239524126, -0.004971627611666918, -0.0048897829838097095, -0.004807938821613789, -0.00472609419375658, -0.004644249565899372, -0.004562404938042164, -0.004480560310184956, -0.004398716147989035, -0.004316871520131826, -0.004235026892274618, -0.004153182730078697, -0.004071338102221489, -0.003989493474364281, -0.0039076488465070724, -0.003825804451480508, -0.0037439598236232996, -0.0036621151957660913, -0.0035802708007395267, -0.0034984261728823185, -0.003416581777855754, -0.0033347371499985456, -0.003252892754971981, -0.003171048127114773, -0.0030892034992575645, -0.0030073588714003563, -0.0029255144763737917, -0.0028436698485165834, -0.002761825453490019, -0.0026799808256328106, -0.0025981361977756023, -0.0025162918027490377, -0.0024344471748918295, -0.0023526025470346212, -0.0022707581520080566, -0.0021889135241508484, -0.002107069129124284, -0.0020252245012670755, -0.0019433799898251891, -0.0018615354783833027, -0.0017796909669414163, -0.0016978464554995298, -0.0016160019440576434, -0.001534157432615757, -0.0014523128047585487, -0.0013704684097319841, -0.0012886237818747759, -0.0012067792704328895, -0.001124934758991003, -0.0010430902475491166, -0.0009612457361072302, -0.0008794011664576828, -0.0007975566550157964, -0.00071571214357391, -0.0006338675739243627, -0.0005520230624824762, -0.00047017858014442027, -0.0003883340395987034, -0.00030648952815681696, -0.00022464498761110008, -0.00014280047616921365, -6.095596472732723e-05, 2.088860492222011e-05, 0.00010273311636410654, 0.00018457762780599296]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 7.0, 4.0, 9.0, 6.0, 10.0, 12.0, 21.0, 18.0, 12.0, 16.0, 22.0, 20.0, 25.0, 25.0, 33.0, 35.0, 30.0, 37.0, 48.0, 32.0, 47.0, 34.0, 46.0, 40.0, 56.0, 32.0, 30.0, 25.0, 33.0, 33.0, 33.0, 21.0, 27.0, 18.0, 16.0, 21.0, 12.0, 11.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0004500150680541992, -0.0004360312595963478, -0.0004220474511384964, -0.000408063642680645, -0.0003940798342227936, -0.00038009602576494217, -0.00036611221730709076, -0.00035212840884923935, -0.00033814460039138794, -0.00032416079193353653, -0.0003101769834756851, -0.0002961931750178337, -0.0002822093665599823, -0.0002682255581021309, -0.0002542417496442795, -0.00024025794118642807, -0.00022627413272857666, -0.00021229032427072525, -0.00019830651581287384, -0.00018432270735502243, -0.00017033889889717102, -0.0001563550904393196, -0.0001423712819814682, -0.0001283874735236168, -0.00011440366506576538, -0.00010041985660791397, -8.643604815006256e-05, -7.245223969221115e-05, -5.846843123435974e-05, -4.448462277650833e-05, -3.050081431865692e-05, -1.651700586080551e-05, -2.5331974029541016e-06, 1.1450611054897308e-05, 2.5434419512748718e-05, 3.941822797060013e-05, 5.340203642845154e-05, 6.738584488630295e-05, 8.136965334415436e-05, 9.535346180200577e-05, 0.00010933727025985718, 0.0001233210787177086, 0.00013730488717556, 0.0001512886956334114, 0.00016527250409126282, 0.00017925631254911423, 0.00019324012100696564, 0.00020722392946481705, 0.00022120773792266846, 0.00023519154638051987, 0.0002491753548383713, 0.0002631591632962227, 0.0002771429717540741, 0.0002911267802119255, 0.0003051105886697769, 0.0003190943971276283, 0.00033307820558547974, 0.00034706201404333115, 0.00036104582250118256, 0.00037502963095903397, 0.0003890134394168854, 0.0004029972478747368, 0.0004169810563325882, 0.0004309648647904396, 0.000444948673248291]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 14.0, 11.0, 12.0, 22.0, 21.0, 20.0, 12.0, 26.0, 23.0, 34.0, 33.0, 32.0, 28.0, 39.0, 37.0, 41.0, 42.0, 42.0, 47.0, 34.0, 40.0, 46.0, 38.0, 37.0, 29.0, 22.0, 28.0, 26.0, 20.0, 15.0, 32.0, 21.0, 15.0, 15.0, 6.0, 5.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.51953125, -5.36383056640625, -5.2081298828125, -5.05242919921875, -4.896728515625, -4.74102783203125, -4.5853271484375, -4.42962646484375, -4.27392578125, -4.11822509765625, -3.9625244140625, -3.80682373046875, -3.651123046875, -3.49542236328125, -3.3397216796875, -3.18402099609375, -3.0283203125, -2.87261962890625, -2.7169189453125, -2.56121826171875, -2.405517578125, -2.24981689453125, -2.0941162109375, -1.93841552734375, -1.78271484375, -1.62701416015625, -1.4713134765625, -1.31561279296875, -1.159912109375, -1.00421142578125, -0.8485107421875, -0.69281005859375, -0.537109375, -0.38140869140625, -0.2257080078125, -0.07000732421875, 0.085693359375, 0.24139404296875, 0.3970947265625, 0.55279541015625, 0.70849609375, 0.86419677734375, 1.0198974609375, 1.17559814453125, 1.331298828125, 1.48699951171875, 1.6427001953125, 1.79840087890625, 1.9541015625, 2.10980224609375, 2.2655029296875, 2.42120361328125, 2.576904296875, 2.73260498046875, 2.8883056640625, 3.04400634765625, 3.19970703125, 3.35540771484375, 3.5111083984375, 3.66680908203125, 3.822509765625, 3.97821044921875, 4.1339111328125, 4.28961181640625, 4.4453125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 5.0, 6.0, 10.0, 19.0, 22.0, 25.0, 52.0, 73.0, 105.0, 160.0, 302.0, 499.0, 992.0, 1872.0, 3944.0, 8441.0, 18416.0, 46810.0, 136253.0, 359541.0, 300094.0, 105010.0, 36887.0, 14977.0, 6985.0, 3303.0, 1668.0, 861.0, 493.0, 257.0, 137.0, 104.0, 67.0, 52.0, 29.0, 21.0, 21.0, 7.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.4765625, -3.37689208984375, -3.2772216796875, -3.17755126953125, -3.077880859375, -2.97821044921875, -2.8785400390625, -2.77886962890625, -2.67919921875, -2.57952880859375, -2.4798583984375, -2.38018798828125, -2.280517578125, -2.18084716796875, -2.0811767578125, -1.98150634765625, -1.8818359375, -1.78216552734375, -1.6824951171875, -1.58282470703125, -1.483154296875, -1.38348388671875, -1.2838134765625, -1.18414306640625, -1.08447265625, -0.98480224609375, -0.8851318359375, -0.78546142578125, -0.685791015625, -0.58612060546875, -0.4864501953125, -0.38677978515625, -0.287109375, -0.18743896484375, -0.0877685546875, 0.01190185546875, 0.111572265625, 0.21124267578125, 0.3109130859375, 0.41058349609375, 0.51025390625, 0.60992431640625, 0.7095947265625, 0.80926513671875, 0.908935546875, 1.00860595703125, 1.1082763671875, 1.20794677734375, 1.3076171875, 1.40728759765625, 1.5069580078125, 1.60662841796875, 1.706298828125, 1.80596923828125, 1.9056396484375, 2.00531005859375, 2.10498046875, 2.20465087890625, 2.3043212890625, 2.40399169921875, 2.503662109375, 2.60333251953125, 2.7030029296875, 2.80267333984375, 2.90234375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 4.0, 5.0, 0.0, 8.0, 10.0, 5.0, 11.0, 14.0, 18.0, 12.0, 23.0, 26.0, 29.0, 29.0, 33.0, 31.0, 31.0, 44.0, 48.0, 51.0, 103.0, 1712.0, 287.0, 70.0, 54.0, 50.0, 39.0, 47.0, 37.0, 37.0, 20.0, 21.0, 21.0, 22.0, 14.0, 14.0, 13.0, 13.0, 10.0, 7.0, 8.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-17.015625, -16.4794921875, -15.943359375, -15.4072265625, -14.87109375, -14.3349609375, -13.798828125, -13.2626953125, -12.7265625, -12.1904296875, -11.654296875, -11.1181640625, -10.58203125, -10.0458984375, -9.509765625, -8.9736328125, -8.4375, -7.9013671875, -7.365234375, -6.8291015625, -6.29296875, -5.7568359375, -5.220703125, -4.6845703125, -4.1484375, -3.6123046875, -3.076171875, -2.5400390625, -2.00390625, -1.4677734375, -0.931640625, -0.3955078125, 0.140625, 0.6767578125, 1.212890625, 1.7490234375, 2.28515625, 2.8212890625, 3.357421875, 3.8935546875, 4.4296875, 4.9658203125, 5.501953125, 6.0380859375, 6.57421875, 7.1103515625, 7.646484375, 8.1826171875, 8.71875, 9.2548828125, 9.791015625, 10.3271484375, 10.86328125, 11.3994140625, 11.935546875, 12.4716796875, 13.0078125, 13.5439453125, 14.080078125, 14.6162109375, 15.15234375, 15.6884765625, 16.224609375, 16.7607421875, 17.296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 18.0, 13.0, 18.0, 19.0, 24.0, 38.0, 48.0, 53.0, 85.0, 125.0, 183.0, 273.0, 595.0, 2070.0, 82225.0, 3047347.0, 10226.0, 1063.0, 420.0, 228.0, 142.0, 94.0, 75.0, 63.0, 46.0, 31.0, 27.0, 21.0, 17.0, 15.0, 11.0, 5.0, 9.0, 10.0, 2.0, 5.0, 5.0, 0.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-28.765625, -27.874755859375, -26.98388671875, -26.093017578125, -25.2021484375, -24.311279296875, -23.42041015625, -22.529541015625, -21.638671875, -20.747802734375, -19.85693359375, -18.966064453125, -18.0751953125, -17.184326171875, -16.29345703125, -15.402587890625, -14.51171875, -13.620849609375, -12.72998046875, -11.839111328125, -10.9482421875, -10.057373046875, -9.16650390625, -8.275634765625, -7.384765625, -6.493896484375, -5.60302734375, -4.712158203125, -3.8212890625, -2.930419921875, -2.03955078125, -1.148681640625, -0.2578125, 0.633056640625, 1.52392578125, 2.414794921875, 3.3056640625, 4.196533203125, 5.08740234375, 5.978271484375, 6.869140625, 7.760009765625, 8.65087890625, 9.541748046875, 10.4326171875, 11.323486328125, 12.21435546875, 13.105224609375, 13.99609375, 14.886962890625, 15.77783203125, 16.668701171875, 17.5595703125, 18.450439453125, 19.34130859375, 20.232177734375, 21.123046875, 22.013916015625, 22.90478515625, 23.795654296875, 24.6865234375, 25.577392578125, 26.46826171875, 27.359130859375, 28.25]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 808.0, 207.0, 1.0], "bins": [-428.8434753417969, -421.9022216796875, -414.9609680175781, -408.01971435546875, -401.0784606933594, -394.13720703125, -387.1959533691406, -380.25469970703125, -373.3134460449219, -366.3721923828125, -359.4309387207031, -352.48968505859375, -345.5484313964844, -338.607177734375, -331.6659240722656, -324.72467041015625, -317.783447265625, -310.8421936035156, -303.90093994140625, -296.9596862792969, -290.0184326171875, -283.0771789550781, -276.13592529296875, -269.1946716308594, -262.25341796875, -255.31216430664062, -248.37091064453125, -241.42965698242188, -234.4884033203125, -227.54714965820312, -220.60589599609375, -213.66465759277344, -206.72340393066406, -199.7821502685547, -192.8408966064453, -185.89964294433594, -178.95838928222656, -172.01715087890625, -165.07589721679688, -158.1346435546875, -151.19338989257812, -144.25213623046875, -137.31088256835938, -130.36962890625, -123.42838287353516, -116.48712921142578, -109.5458755493164, -102.60462951660156, -95.66336059570312, -88.72210693359375, -81.78085327148438, -74.839599609375, -67.89835357666016, -60.95709991455078, -54.015846252441406, -47.0745964050293, -40.13334655761719, -33.19209289550781, -26.250843048095703, -19.309589385986328, -12.368337631225586, -5.427085876464844, 1.5141677856445312, 8.45541763305664, 15.396671295166016]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 3.0, 4.0, 5.0, 5.0, 14.0, 18.0, 12.0, 22.0, 13.0, 13.0, 24.0, 28.0, 18.0, 24.0, 39.0, 32.0, 30.0, 31.0, 38.0, 35.0, 40.0, 38.0, 44.0, 48.0, 39.0, 48.0, 28.0, 31.0, 30.0, 26.0, 23.0, 24.0, 19.0, 22.0, 18.0, 17.0, 16.0, 11.0, 11.0, 11.0, 9.0, 9.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-51.66404342651367, -50.12351608276367, -48.58299255371094, -47.04246520996094, -45.50193786621094, -43.96141052246094, -42.42088317871094, -40.8803596496582, -39.3398323059082, -37.7993049621582, -36.25878143310547, -34.71825408935547, -33.17772674560547, -31.63719940185547, -30.0966739654541, -28.556148529052734, -27.015621185302734, -25.475093841552734, -23.934568405151367, -22.39404296875, -20.853515625, -19.31298828125, -17.772462844848633, -16.231937408447266, -14.691410064697266, -13.150883674621582, -11.610357284545898, -10.069830894470215, -8.529304504394531, -6.988778114318848, -5.448251724243164, -3.9077253341674805, -2.3671951293945312, -0.8266687393188477, 0.7138576507568359, 2.2543840408325195, 3.794910430908203, 5.335436820983887, 6.87596321105957, 8.416489601135254, 9.957015991210938, 11.497542381286621, 13.038068771362305, 14.578595161437988, 16.119121551513672, 17.659648895263672, 19.20017433166504, 20.740699768066406, 22.281227111816406, 23.821754455566406, 25.362279891967773, 26.90280532836914, 28.44333267211914, 29.98386001586914, 31.524385452270508, 33.064910888671875, 34.605438232421875, 36.145965576171875, 37.686492919921875, 39.22701644897461, 40.76754379272461, 42.30807113647461, 43.848594665527344, 45.389122009277344, 46.929649353027344]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 4.0, 13.0, 16.0, 11.0, 22.0, 14.0, 17.0, 21.0, 22.0, 38.0, 23.0, 31.0, 36.0, 27.0, 32.0, 44.0, 37.0, 52.0, 36.0, 40.0, 41.0, 39.0, 45.0, 39.0, 31.0, 28.0, 33.0, 19.0, 20.0, 24.0, 22.0, 22.0, 22.0, 18.0, 12.0, 12.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.55078125, -5.3936767578125, -5.236572265625, -5.0794677734375, -4.92236328125, -4.7652587890625, -4.608154296875, -4.4510498046875, -4.2939453125, -4.1368408203125, -3.979736328125, -3.8226318359375, -3.66552734375, -3.5084228515625, -3.351318359375, -3.1942138671875, -3.037109375, -2.8800048828125, -2.722900390625, -2.5657958984375, -2.40869140625, -2.2515869140625, -2.094482421875, -1.9373779296875, -1.7802734375, -1.6231689453125, -1.466064453125, -1.3089599609375, -1.15185546875, -0.9947509765625, -0.837646484375, -0.6805419921875, -0.5234375, -0.3663330078125, -0.209228515625, -0.0521240234375, 0.10498046875, 0.2620849609375, 0.419189453125, 0.5762939453125, 0.7333984375, 0.8905029296875, 1.047607421875, 1.2047119140625, 1.36181640625, 1.5189208984375, 1.676025390625, 1.8331298828125, 1.990234375, 2.1473388671875, 2.304443359375, 2.4615478515625, 2.61865234375, 2.7757568359375, 2.932861328125, 3.0899658203125, 3.2470703125, 3.4041748046875, 3.561279296875, 3.7183837890625, 3.87548828125, 4.0325927734375, 4.189697265625, 4.3468017578125, 4.50390625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 6.0, 6.0, 14.0, 15.0, 20.0, 16.0, 18.0, 20.0, 42.0, 38.0, 59.0, 72.0, 130.0, 268.0, 831.0, 5518.0, 74390.0, 1771526.0, 2222732.0, 109391.0, 7369.0, 1000.0, 292.0, 156.0, 87.0, 48.0, 34.0, 35.0, 20.0, 21.0, 30.0, 21.0, 17.0, 6.0, 10.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.427490234375, -17.90185546875, -17.376220703125, -16.8505859375, -16.324951171875, -15.79931640625, -15.273681640625, -14.748046875, -14.222412109375, -13.69677734375, -13.171142578125, -12.6455078125, -12.119873046875, -11.59423828125, -11.068603515625, -10.54296875, -10.017333984375, -9.49169921875, -8.966064453125, -8.4404296875, -7.914794921875, -7.38916015625, -6.863525390625, -6.337890625, -5.812255859375, -5.28662109375, -4.760986328125, -4.2353515625, -3.709716796875, -3.18408203125, -2.658447265625, -2.1328125, -1.607177734375, -1.08154296875, -0.555908203125, -0.0302734375, 0.495361328125, 1.02099609375, 1.546630859375, 2.072265625, 2.597900390625, 3.12353515625, 3.649169921875, 4.1748046875, 4.700439453125, 5.22607421875, 5.751708984375, 6.27734375, 6.802978515625, 7.32861328125, 7.854248046875, 8.3798828125, 8.905517578125, 9.43115234375, 9.956787109375, 10.482421875, 11.008056640625, 11.53369140625, 12.059326171875, 12.5849609375, 13.110595703125, 13.63623046875, 14.161865234375, 14.6875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 7.0, 11.0, 17.0, 14.0, 39.0, 41.0, 61.0, 86.0, 110.0, 142.0, 195.0, 269.0, 424.0, 467.0, 495.0, 440.0, 335.0, 270.0, 173.0, 128.0, 95.0, 64.0, 50.0, 41.0, 33.0, 18.0, 17.0, 8.0, 8.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.84375, -18.325439453125, -17.80712890625, -17.288818359375, -16.7705078125, -16.252197265625, -15.73388671875, -15.215576171875, -14.697265625, -14.178955078125, -13.66064453125, -13.142333984375, -12.6240234375, -12.105712890625, -11.58740234375, -11.069091796875, -10.55078125, -10.032470703125, -9.51416015625, -8.995849609375, -8.4775390625, -7.959228515625, -7.44091796875, -6.922607421875, -6.404296875, -5.885986328125, -5.36767578125, -4.849365234375, -4.3310546875, -3.812744140625, -3.29443359375, -2.776123046875, -2.2578125, -1.739501953125, -1.22119140625, -0.702880859375, -0.1845703125, 0.333740234375, 0.85205078125, 1.370361328125, 1.888671875, 2.406982421875, 2.92529296875, 3.443603515625, 3.9619140625, 4.480224609375, 4.99853515625, 5.516845703125, 6.03515625, 6.553466796875, 7.07177734375, 7.590087890625, 8.1083984375, 8.626708984375, 9.14501953125, 9.663330078125, 10.181640625, 10.699951171875, 11.21826171875, 11.736572265625, 12.2548828125, 12.773193359375, 13.29150390625, 13.809814453125, 14.328125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 9.0, 20.0, 25.0, 26.0, 31.0, 43.0, 53.0, 81.0, 104.0, 158.0, 211.0, 333.0, 891.0, 11232.0, 3849850.0, 327299.0, 2446.0, 561.0, 254.0, 163.0, 122.0, 90.0, 67.0, 59.0, 31.0, 21.0, 17.0, 23.0, 16.0, 6.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-66.125, -64.107421875, -62.08984375, -60.072265625, -58.0546875, -56.037109375, -54.01953125, -52.001953125, -49.984375, -47.966796875, -45.94921875, -43.931640625, -41.9140625, -39.896484375, -37.87890625, -35.861328125, -33.84375, -31.826171875, -29.80859375, -27.791015625, -25.7734375, -23.755859375, -21.73828125, -19.720703125, -17.703125, -15.685546875, -13.66796875, -11.650390625, -9.6328125, -7.615234375, -5.59765625, -3.580078125, -1.5625, 0.455078125, 2.47265625, 4.490234375, 6.5078125, 8.525390625, 10.54296875, 12.560546875, 14.578125, 16.595703125, 18.61328125, 20.630859375, 22.6484375, 24.666015625, 26.68359375, 28.701171875, 30.71875, 32.736328125, 34.75390625, 36.771484375, 38.7890625, 40.806640625, 42.82421875, 44.841796875, 46.859375, 48.876953125, 50.89453125, 52.912109375, 54.9296875, 56.947265625, 58.96484375, 60.982421875, 63.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 10.0, 114.0, 451.0, 369.0, 69.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.10033416748047, -50.55708312988281, -42.013832092285156, -33.470584869384766, -24.92733383178711, -16.384082794189453, -7.8408355712890625, 0.7024154663085938, 9.24566650390625, 17.788917541503906, 26.33216667175293, 34.87541580200195, 43.41866683959961, 51.961917877197266, 60.505165100097656, 69.04841613769531, 77.59166717529297, 86.13491821289062, 94.67816925048828, 103.22142028808594, 111.76466369628906, 120.30792236328125, 128.85116577148438, 137.3944091796875, 145.9376678466797, 154.4809112548828, 163.024169921875, 171.56741333007812, 180.1106719970703, 188.65391540527344, 197.19717407226562, 205.74041748046875, 214.28366088867188, 222.826904296875, 231.3701629638672, 239.9134063720703, 248.4566650390625, 256.9999084472656, 265.54315185546875, 274.08642578125, 282.6296691894531, 291.17291259765625, 299.7161560058594, 308.2594299316406, 316.80267333984375, 325.3459167480469, 333.88916015625, 342.43243408203125, 350.97564697265625, 359.5188903808594, 368.0621337890625, 376.60540771484375, 385.1486511230469, 393.69189453125, 402.2351379394531, 410.77838134765625, 419.3216552734375, 427.8648986816406, 436.40814208984375, 444.951416015625, 453.4946594238281, 462.03790283203125, 470.5811462402344, 479.1243896484375, 487.66766357421875]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 10.0, 10.0, 11.0, 10.0, 21.0, 12.0, 17.0, 15.0, 27.0, 31.0, 33.0, 36.0, 34.0, 28.0, 32.0, 35.0, 34.0, 43.0, 49.0, 35.0, 35.0, 40.0, 40.0, 30.0, 38.0, 27.0, 37.0, 31.0, 36.0, 20.0, 27.0, 21.0, 14.0, 10.0, 15.0, 12.0, 10.0, 4.0, 2.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.475341796875, -38.00426483154297, -36.5331916809082, -35.06211471557617, -33.591041564941406, -32.119964599609375, -30.648887634277344, -29.177812576293945, -27.706737518310547, -26.23566246032715, -24.76458740234375, -23.29351043701172, -21.82243537902832, -20.351360321044922, -18.88028335571289, -17.409208297729492, -15.938133239746094, -14.467058181762695, -12.99598217010498, -11.524906158447266, -10.053831100463867, -8.582756042480469, -7.111680030822754, -5.640604019165039, -4.169528961181641, -2.698453426361084, -1.2273778915405273, 0.2436976432800293, 1.714773178100586, 3.1858487129211426, 4.656924247741699, 6.128000259399414, 7.5990753173828125, 9.070150375366211, 10.541226387023926, 12.01230239868164, 13.483377456665039, 14.954452514648438, 16.42552947998047, 17.896604537963867, 19.367679595947266, 20.838754653930664, 22.309829711914062, 23.780906677246094, 25.251981735229492, 26.72305679321289, 28.194133758544922, 29.66520881652832, 31.13628387451172, 32.60736083984375, 34.078433990478516, 35.54951095581055, 37.02058410644531, 38.491661071777344, 39.962738037109375, 41.433815002441406, 42.90488815307617, 44.3759651184082, 45.84703826904297, 47.318115234375, 48.78919219970703, 50.2602653503418, 51.73134231567383, 53.202415466308594, 54.673492431640625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 6.0, 5.0, 13.0, 15.0, 9.0, 21.0, 18.0, 31.0, 29.0, 16.0, 22.0, 28.0, 28.0, 24.0, 38.0, 36.0, 31.0, 52.0, 41.0, 39.0, 35.0, 42.0, 46.0, 38.0, 38.0, 23.0, 34.0, 36.0, 26.0, 20.0, 24.0, 16.0, 20.0, 15.0, 23.0, 14.0, 6.0, 11.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.87109375, -5.7137451171875, -5.556396484375, -5.3990478515625, -5.24169921875, -5.0843505859375, -4.927001953125, -4.7696533203125, -4.6123046875, -4.4549560546875, -4.297607421875, -4.1402587890625, -3.98291015625, -3.8255615234375, -3.668212890625, -3.5108642578125, -3.353515625, -3.1961669921875, -3.038818359375, -2.8814697265625, -2.72412109375, -2.5667724609375, -2.409423828125, -2.2520751953125, -2.0947265625, -1.9373779296875, -1.780029296875, -1.6226806640625, -1.46533203125, -1.3079833984375, -1.150634765625, -0.9932861328125, -0.8359375, -0.6785888671875, -0.521240234375, -0.3638916015625, -0.20654296875, -0.0491943359375, 0.108154296875, 0.2655029296875, 0.4228515625, 0.5802001953125, 0.737548828125, 0.8948974609375, 1.05224609375, 1.2095947265625, 1.366943359375, 1.5242919921875, 1.681640625, 1.8389892578125, 1.996337890625, 2.1536865234375, 2.31103515625, 2.4683837890625, 2.625732421875, 2.7830810546875, 2.9404296875, 3.0977783203125, 3.255126953125, 3.4124755859375, 3.56982421875, 3.7271728515625, 3.884521484375, 4.0418701171875, 4.19921875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 17.0, 20.0, 26.0, 39.0, 62.0, 74.0, 131.0, 194.0, 281.0, 446.0, 694.0, 1103.0, 1704.0, 2684.0, 4386.0, 6738.0, 11228.0, 18789.0, 31215.0, 53568.0, 95300.0, 173186.0, 269972.0, 161514.0, 89166.0, 50572.0, 29684.0, 17465.0, 10614.0, 6518.0, 4022.0, 2650.0, 1613.0, 1050.0, 644.0, 386.0, 270.0, 174.0, 103.0, 79.0, 67.0, 36.0, 23.0, 11.0, 9.0, 9.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.740234375, -0.7142105102539062, -0.6881866455078125, -0.6621627807617188, -0.636138916015625, -0.6101150512695312, -0.5840911865234375, -0.5580673217773438, -0.53204345703125, -0.5060195922851562, -0.4799957275390625, -0.45397186279296875, -0.427947998046875, -0.40192413330078125, -0.3759002685546875, -0.34987640380859375, -0.3238525390625, -0.29782867431640625, -0.2718048095703125, -0.24578094482421875, -0.219757080078125, -0.19373321533203125, -0.1677093505859375, -0.14168548583984375, -0.11566162109375, -0.08963775634765625, -0.0636138916015625, -0.03759002685546875, -0.011566162109375, 0.01445770263671875, 0.0404815673828125, 0.06650543212890625, 0.092529296875, 0.11855316162109375, 0.1445770263671875, 0.17060089111328125, 0.196624755859375, 0.22264862060546875, 0.2486724853515625, 0.27469635009765625, 0.30072021484375, 0.32674407958984375, 0.3527679443359375, 0.37879180908203125, 0.404815673828125, 0.43083953857421875, 0.4568634033203125, 0.48288726806640625, 0.5089111328125, 0.5349349975585938, 0.5609588623046875, 0.5869827270507812, 0.613006591796875, 0.6390304565429688, 0.6650543212890625, 0.6910781860351562, 0.71710205078125, 0.7431259155273438, 0.7691497802734375, 0.7951736450195312, 0.821197509765625, 0.8472213745117188, 0.8732452392578125, 0.8992691040039062, 0.92529296875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 6.0, 4.0, 8.0, 10.0, 15.0, 13.0, 19.0, 27.0, 21.0, 24.0, 21.0, 38.0, 33.0, 39.0, 35.0, 40.0, 40.0, 43.0, 1074.0, 44.0, 36.0, 35.0, 48.0, 43.0, 38.0, 29.0, 29.0, 29.0, 23.0, 18.0, 26.0, 27.0, 15.0, 18.0, 9.0, 16.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.857421875, -3.752349853515625, -3.64727783203125, -3.542205810546875, -3.4371337890625, -3.332061767578125, -3.22698974609375, -3.121917724609375, -3.016845703125, -2.911773681640625, -2.80670166015625, -2.701629638671875, -2.5965576171875, -2.491485595703125, -2.38641357421875, -2.281341552734375, -2.17626953125, -2.071197509765625, -1.96612548828125, -1.861053466796875, -1.7559814453125, -1.650909423828125, -1.54583740234375, -1.440765380859375, -1.335693359375, -1.230621337890625, -1.12554931640625, -1.020477294921875, -0.9154052734375, -0.810333251953125, -0.70526123046875, -0.600189208984375, -0.4951171875, -0.390045166015625, -0.28497314453125, -0.179901123046875, -0.0748291015625, 0.030242919921875, 0.13531494140625, 0.240386962890625, 0.345458984375, 0.450531005859375, 0.55560302734375, 0.660675048828125, 0.7657470703125, 0.870819091796875, 0.97589111328125, 1.080963134765625, 1.18603515625, 1.291107177734375, 1.39617919921875, 1.501251220703125, 1.6063232421875, 1.711395263671875, 1.81646728515625, 1.921539306640625, 2.026611328125, 2.131683349609375, 2.23675537109375, 2.341827392578125, 2.4468994140625, 2.551971435546875, 2.65704345703125, 2.762115478515625, 2.8671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 7.0, 20.0, 27.0, 44.0, 46.0, 81.0, 114.0, 182.0, 260.0, 386.0, 578.0, 901.0, 1311.0, 2075.0, 3296.0, 5114.0, 7990.0, 12907.0, 21009.0, 35152.0, 61291.0, 110133.0, 209170.0, 1304686.0, 136433.0, 74903.0, 42129.0, 24894.0, 15411.0, 9683.0, 6177.0, 3880.0, 2356.0, 1555.0, 1032.0, 599.0, 422.0, 278.0, 189.0, 119.0, 84.0, 64.0, 39.0, 37.0, 22.0, 9.0, 11.0, 6.0, 3.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.71484375, -0.6911544799804688, -0.6674652099609375, -0.6437759399414062, -0.620086669921875, -0.5963973999023438, -0.5727081298828125, -0.5490188598632812, -0.52532958984375, -0.5016403198242188, -0.4779510498046875, -0.45426177978515625, -0.430572509765625, -0.40688323974609375, -0.3831939697265625, -0.35950469970703125, -0.3358154296875, -0.31212615966796875, -0.2884368896484375, -0.26474761962890625, -0.241058349609375, -0.21736907958984375, -0.1936798095703125, -0.16999053955078125, -0.14630126953125, -0.12261199951171875, -0.0989227294921875, -0.07523345947265625, -0.051544189453125, -0.02785491943359375, -0.0041656494140625, 0.01952362060546875, 0.043212890625, 0.06690216064453125, 0.0905914306640625, 0.11428070068359375, 0.137969970703125, 0.16165924072265625, 0.1853485107421875, 0.20903778076171875, 0.23272705078125, 0.25641632080078125, 0.2801055908203125, 0.30379486083984375, 0.327484130859375, 0.35117340087890625, 0.3748626708984375, 0.39855194091796875, 0.4222412109375, 0.44593048095703125, 0.4696197509765625, 0.49330902099609375, 0.516998291015625, 0.5406875610351562, 0.5643768310546875, 0.5880661010742188, 0.61175537109375, 0.6354446411132812, 0.6591339111328125, 0.6828231811523438, 0.706512451171875, 0.7302017211914062, 0.7538909912109375, 0.7775802612304688, 0.80126953125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 13.0, 18.0, 23.0, 20.0, 24.0, 34.0, 31.0, 32.0, 45.0, 54.0, 49.0, 69.0, 51.0, 64.0, 58.0, 59.0, 45.0, 32.0, 46.0, 39.0, 38.0, 21.0, 27.0, 17.0, 17.0, 13.0, 12.0, 9.0, 7.0, 4.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009455680847167969, -0.0009177848696708679, -0.000890001654624939, -0.00086221843957901, -0.0008344352245330811, -0.0008066520094871521, -0.0007788687944412231, -0.0007510855793952942, -0.0007233023643493652, -0.0006955191493034363, -0.0006677359342575073, -0.0006399527192115784, -0.0006121695041656494, -0.0005843862891197205, -0.0005566030740737915, -0.0005288198590278625, -0.0005010366439819336, -0.00047325342893600464, -0.0004454702138900757, -0.00041768699884414673, -0.0003899037837982178, -0.0003621205687522888, -0.00033433735370635986, -0.0003065541386604309, -0.00027877092361450195, -0.000250987708568573, -0.00022320449352264404, -0.0001954212784767151, -0.00016763806343078613, -0.00013985484838485718, -0.00011207163333892822, -8.428841829299927e-05, -5.650520324707031e-05, -2.8721988201141357e-05, -9.387731552124023e-07, 2.6844441890716553e-05, 5.462765693664551e-05, 8.241087198257446e-05, 0.00011019408702850342, 0.00013797730207443237, 0.00016576051712036133, 0.00019354373216629028, 0.00022132694721221924, 0.0002491101622581482, 0.00027689337730407715, 0.0003046765923500061, 0.00033245980739593506, 0.000360243022441864, 0.00038802623748779297, 0.0004158094525337219, 0.0004435926675796509, 0.00047137588262557983, 0.0004991590976715088, 0.0005269423127174377, 0.0005547255277633667, 0.0005825087428092957, 0.0006102919578552246, 0.0006380751729011536, 0.0006658583879470825, 0.0006936416029930115, 0.0007214248180389404, 0.0007492080330848694, 0.0007769912481307983, 0.0008047744631767273, 0.0008325576782226562]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 5.0, 9.0, 10.0, 5.0, 12.0, 24.0, 22.0, 23.0, 41.0, 49.0, 72.0, 167.0, 326.0, 1102.0, 1035368.0, 10153.0, 545.0, 211.0, 89.0, 70.0, 73.0, 36.0, 37.0, 18.0, 20.0, 16.0, 19.0, 5.0, 9.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0275726318359375, -0.026730060577392578, -0.025887489318847656, -0.025044918060302734, -0.024202346801757812, -0.02335977554321289, -0.02251720428466797, -0.021674633026123047, -0.020832061767578125, -0.019989490509033203, -0.01914691925048828, -0.01830434799194336, -0.017461776733398438, -0.016619205474853516, -0.015776634216308594, -0.014934062957763672, -0.01409149169921875, -0.013248920440673828, -0.012406349182128906, -0.011563777923583984, -0.010721206665039062, -0.00987863540649414, -0.009036064147949219, -0.008193492889404297, -0.007350921630859375, -0.006508350372314453, -0.005665779113769531, -0.004823207855224609, -0.0039806365966796875, -0.0031380653381347656, -0.0022954940795898438, -0.0014529228210449219, -0.0006103515625, 0.00023221969604492188, 0.0010747909545898438, 0.0019173622131347656, 0.0027599334716796875, 0.0036025047302246094, 0.004445075988769531, 0.005287647247314453, 0.006130218505859375, 0.006972789764404297, 0.007815361022949219, 0.00865793228149414, 0.009500503540039062, 0.010343074798583984, 0.011185646057128906, 0.012028217315673828, 0.01287078857421875, 0.013713359832763672, 0.014555931091308594, 0.015398502349853516, 0.016241073608398438, 0.01708364486694336, 0.01792621612548828, 0.018768787384033203, 0.019611358642578125, 0.020453929901123047, 0.02129650115966797, 0.02213907241821289, 0.022981643676757812, 0.023824214935302734, 0.024666786193847656, 0.025509357452392578, 0.0263519287109375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 20.0, 94.0, 162.0, 270.0, 217.0, 147.0, 67.0, 20.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005335273453965783, -0.0005037373048253357, -0.0004739472351502627, -0.00044415719457902014, -0.00041436715400777757, -0.00038457708433270454, -0.000354787043761462, -0.0003249970031902194, -0.00029520696261897683, -0.00026541692204773426, -0.00023562686692457646, -0.00020583681180141866, -0.0001760467712301761, -0.0001462567161070183, -0.00011646666098386049, -8.667662041261792e-05, -5.6886550737544894e-05, -2.7096501071355306e-05, 2.693548594834283e-06, 3.2483600080013275e-05, 6.227364792721346e-05, 9.206369577441365e-05, 0.00012185375089757144, 0.00015164379146881402, 0.00018143384659197181, 0.00021122390171512961, 0.00024101394228637218, 0.00027080398285761476, 0.0003005940525326878, 0.00033038409310393035, 0.0003601741627790034, 0.00038996420335024595, 0.0004197542439214885, 0.0004495442844927311, 0.0004793343541678041, 0.0005091243656352162, 0.0005389144644141197, 0.0005687045049853623, 0.0005984945455566049, 0.0006282845861278474, 0.00065807462669909, 0.0006878646672703326, 0.0007176547078415751, 0.0007474448066204786, 0.0007772348471917212, 0.0008070248877629638, 0.0008368149283342063, 0.0008666049689054489, 0.0008963950676843524, 0.000926185108255595, 0.0009559751488268375, 0.000985765247605741, 0.0010155552299693227, 0.0010453453287482262, 0.0010751353111118078, 0.0011049254098907113, 0.001134715392254293, 0.0011645054910331964, 0.001194295473396778, 0.0012240855721756816, 0.0012538755545392632, 0.0012836656533181667, 0.0013134556356817484, 0.0013432457344606519, 0.0013730358332395554]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 8.0, 10.0, 11.0, 12.0, 19.0, 16.0, 19.0, 29.0, 21.0, 28.0, 37.0, 30.0, 35.0, 44.0, 47.0, 44.0, 35.0, 35.0, 42.0, 54.0, 42.0, 36.0, 32.0, 29.0, 38.0, 36.0, 33.0, 23.0, 25.0, 25.0, 22.0, 18.0, 10.0, 5.0, 9.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00043082237243652344, -0.0004161745309829712, -0.00040152668952941895, -0.0003868788480758667, -0.00037223100662231445, -0.0003575831651687622, -0.00034293532371520996, -0.0003282874822616577, -0.00031363964080810547, -0.0002989917993545532, -0.000284343957901001, -0.00026969611644744873, -0.0002550482749938965, -0.00024040043354034424, -0.000225752592086792, -0.00021110475063323975, -0.0001964569091796875, -0.00018180906772613525, -0.000167161226272583, -0.00015251338481903076, -0.00013786554336547852, -0.00012321770191192627, -0.00010856986045837402, -9.392201900482178e-05, -7.927417755126953e-05, -6.462633609771729e-05, -4.997849464416504e-05, -3.533065319061279e-05, -2.0682811737060547e-05, -6.034970283508301e-06, 8.612871170043945e-06, 2.326071262359619e-05, 3.790855407714844e-05, 5.2556395530700684e-05, 6.720423698425293e-05, 8.185207843780518e-05, 9.649991989135742e-05, 0.00011114776134490967, 0.00012579560279846191, 0.00014044344425201416, 0.0001550912857055664, 0.00016973912715911865, 0.0001843869686126709, 0.00019903481006622314, 0.0002136826515197754, 0.00022833049297332764, 0.00024297833442687988, 0.00025762617588043213, 0.0002722740173339844, 0.0002869218587875366, 0.00030156970024108887, 0.0003162175416946411, 0.00033086538314819336, 0.0003455132246017456, 0.00036016106605529785, 0.0003748089075088501, 0.00038945674896240234, 0.0004041045904159546, 0.00041875243186950684, 0.0004334002733230591, 0.00044804811477661133, 0.0004626959562301636, 0.0004773437976837158, 0.0004919916391372681, 0.0005066394805908203]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 6.0, 5.0, 13.0, 15.0, 9.0, 21.0, 18.0, 31.0, 29.0, 16.0, 22.0, 28.0, 28.0, 24.0, 38.0, 36.0, 31.0, 52.0, 41.0, 39.0, 35.0, 42.0, 46.0, 38.0, 38.0, 23.0, 34.0, 36.0, 26.0, 20.0, 24.0, 16.0, 20.0, 15.0, 23.0, 14.0, 6.0, 11.0, 8.0, 5.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.87109375, -5.7137451171875, -5.556396484375, -5.3990478515625, -5.24169921875, -5.0843505859375, -4.927001953125, -4.7696533203125, -4.6123046875, -4.4549560546875, -4.297607421875, -4.1402587890625, -3.98291015625, -3.8255615234375, -3.668212890625, -3.5108642578125, -3.353515625, -3.1961669921875, -3.038818359375, -2.8814697265625, -2.72412109375, -2.5667724609375, -2.409423828125, -2.2520751953125, -2.0947265625, -1.9373779296875, -1.780029296875, -1.6226806640625, -1.46533203125, -1.3079833984375, -1.150634765625, -0.9932861328125, -0.8359375, -0.6785888671875, -0.521240234375, -0.3638916015625, -0.20654296875, -0.0491943359375, 0.108154296875, 0.2655029296875, 0.4228515625, 0.5802001953125, 0.737548828125, 0.8948974609375, 1.05224609375, 1.2095947265625, 1.366943359375, 1.5242919921875, 1.681640625, 1.8389892578125, 1.996337890625, 2.1536865234375, 2.31103515625, 2.4683837890625, 2.625732421875, 2.7830810546875, 2.9404296875, 3.0977783203125, 3.255126953125, 3.4124755859375, 3.56982421875, 3.7271728515625, 3.884521484375, 4.0418701171875, 4.19921875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 13.0, 13.0, 11.0, 15.0, 37.0, 64.0, 62.0, 108.0, 137.0, 238.0, 373.0, 489.0, 779.0, 1136.0, 1655.0, 2581.0, 3956.0, 6207.0, 10912.0, 21315.0, 49965.0, 146171.0, 455819.0, 217651.0, 67852.0, 27232.0, 13139.0, 7248.0, 4552.0, 2963.0, 1896.0, 1280.0, 874.0, 547.0, 414.0, 270.0, 181.0, 131.0, 77.0, 46.0, 36.0, 32.0, 21.0, 14.0, 15.0, 8.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.6328125, -3.51031494140625, -3.3878173828125, -3.26531982421875, -3.142822265625, -3.02032470703125, -2.8978271484375, -2.77532958984375, -2.65283203125, -2.53033447265625, -2.4078369140625, -2.28533935546875, -2.162841796875, -2.04034423828125, -1.9178466796875, -1.79534912109375, -1.6728515625, -1.55035400390625, -1.4278564453125, -1.30535888671875, -1.182861328125, -1.06036376953125, -0.9378662109375, -0.81536865234375, -0.69287109375, -0.57037353515625, -0.4478759765625, -0.32537841796875, -0.202880859375, -0.08038330078125, 0.0421142578125, 0.16461181640625, 0.287109375, 0.40960693359375, 0.5321044921875, 0.65460205078125, 0.777099609375, 0.89959716796875, 1.0220947265625, 1.14459228515625, 1.26708984375, 1.38958740234375, 1.5120849609375, 1.63458251953125, 1.757080078125, 1.87957763671875, 2.0020751953125, 2.12457275390625, 2.2470703125, 2.36956787109375, 2.4920654296875, 2.61456298828125, 2.737060546875, 2.85955810546875, 2.9820556640625, 3.10455322265625, 3.22705078125, 3.34954833984375, 3.4720458984375, 3.59454345703125, 3.717041015625, 3.83953857421875, 3.9620361328125, 4.08453369140625, 4.20703125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 2.0, 6.0, 8.0, 9.0, 8.0, 11.0, 21.0, 25.0, 20.0, 26.0, 23.0, 31.0, 42.0, 31.0, 40.0, 42.0, 57.0, 57.0, 189.0, 1801.0, 163.0, 65.0, 56.0, 35.0, 26.0, 40.0, 36.0, 32.0, 27.0, 16.0, 17.0, 14.0, 12.0, 11.0, 15.0, 6.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.290283203125, -17.68994140625, -17.089599609375, -16.4892578125, -15.888916015625, -15.28857421875, -14.688232421875, -14.087890625, -13.487548828125, -12.88720703125, -12.286865234375, -11.6865234375, -11.086181640625, -10.48583984375, -9.885498046875, -9.28515625, -8.684814453125, -8.08447265625, -7.484130859375, -6.8837890625, -6.283447265625, -5.68310546875, -5.082763671875, -4.482421875, -3.882080078125, -3.28173828125, -2.681396484375, -2.0810546875, -1.480712890625, -0.88037109375, -0.280029296875, 0.3203125, 0.920654296875, 1.52099609375, 2.121337890625, 2.7216796875, 3.322021484375, 3.92236328125, 4.522705078125, 5.123046875, 5.723388671875, 6.32373046875, 6.924072265625, 7.5244140625, 8.124755859375, 8.72509765625, 9.325439453125, 9.92578125, 10.526123046875, 11.12646484375, 11.726806640625, 12.3271484375, 12.927490234375, 13.52783203125, 14.128173828125, 14.728515625, 15.328857421875, 15.92919921875, 16.529541015625, 17.1298828125, 17.730224609375, 18.33056640625, 18.930908203125, 19.53125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 7.0, 11.0, 9.0, 17.0, 12.0, 18.0, 23.0, 22.0, 37.0, 47.0, 96.0, 157.0, 208.0, 290.0, 773.0, 6113.0, 2667316.0, 464864.0, 4034.0, 626.0, 281.0, 218.0, 127.0, 86.0, 78.0, 52.0, 42.0, 33.0, 26.0, 13.0, 14.0, 9.0, 8.0, 9.0, 6.0, 4.0, 3.0, 9.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.65625, -40.46337890625, -39.2705078125, -38.07763671875, -36.884765625, -35.69189453125, -34.4990234375, -33.30615234375, -32.11328125, -30.92041015625, -29.7275390625, -28.53466796875, -27.341796875, -26.14892578125, -24.9560546875, -23.76318359375, -22.5703125, -21.37744140625, -20.1845703125, -18.99169921875, -17.798828125, -16.60595703125, -15.4130859375, -14.22021484375, -13.02734375, -11.83447265625, -10.6416015625, -9.44873046875, -8.255859375, -7.06298828125, -5.8701171875, -4.67724609375, -3.484375, -2.29150390625, -1.0986328125, 0.09423828125, 1.287109375, 2.47998046875, 3.6728515625, 4.86572265625, 6.05859375, 7.25146484375, 8.4443359375, 9.63720703125, 10.830078125, 12.02294921875, 13.2158203125, 14.40869140625, 15.6015625, 16.79443359375, 17.9873046875, 19.18017578125, 20.373046875, 21.56591796875, 22.7587890625, 23.95166015625, 25.14453125, 26.33740234375, 27.5302734375, 28.72314453125, 29.916015625, 31.10888671875, 32.3017578125, 33.49462890625, 34.6875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 22.0, 55.0, 92.0, 146.0, 175.0, 161.0, 132.0, 91.0, 72.0, 29.0, 14.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.35685920715332, -7.607362747192383, -6.8578667640686035, -6.108370780944824, -5.358874320983887, -4.609377861022949, -3.85988187789917, -3.1103858947753906, -2.360889434814453, -1.6113932132720947, -0.8618969917297363, -0.11240077018737793, 0.6370954513549805, 1.3865916728973389, 2.1360878944396973, 2.8855838775634766, 3.635080337524414, 4.384576797485352, 5.134072780609131, 5.88356876373291, 6.633065223693848, 7.382561683654785, 8.132057189941406, 8.881553649902344, 9.631050109863281, 10.380546569824219, 11.130043029785156, 11.879538536071777, 12.629034996032715, 13.378531455993652, 14.128026962280273, 14.877523422241211, 15.627017974853516, 16.376514434814453, 17.12601089477539, 17.875507354736328, 18.625003814697266, 19.37449836730957, 20.123994827270508, 20.873491287231445, 21.622987747192383, 22.37248420715332, 23.121980667114258, 23.871477127075195, 24.6209716796875, 25.370468139648438, 26.119964599609375, 26.869461059570312, 27.61895751953125, 28.368453979492188, 29.117950439453125, 29.867446899414062, 30.616943359375, 31.366437911987305, 32.115936279296875, 32.86543273925781, 33.61492919921875, 34.36442565917969, 35.113922119140625, 35.86341857910156, 36.6129150390625, 37.36241149902344, 38.111907958984375, 38.86140441894531, 39.610897064208984]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 6.0, 4.0, 13.0, 5.0, 12.0, 21.0, 20.0, 32.0, 22.0, 25.0, 36.0, 26.0, 30.0, 38.0, 42.0, 34.0, 33.0, 45.0, 45.0, 45.0, 50.0, 49.0, 30.0, 40.0, 40.0, 31.0, 27.0, 29.0, 25.0, 32.0, 19.0, 14.0, 16.0, 15.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.16311264038086, -53.45707321166992, -51.751033782958984, -50.04499053955078, -48.338951110839844, -46.632911682128906, -44.92687225341797, -43.22083282470703, -41.514793395996094, -39.808753967285156, -38.10271453857422, -36.39667510986328, -34.69063186645508, -32.98459243774414, -31.278553009033203, -29.572513580322266, -27.866470336914062, -26.160430908203125, -24.454389572143555, -22.748350143432617, -21.042308807373047, -19.33626937866211, -17.630229949951172, -15.924189567565918, -14.218149185180664, -12.51210880279541, -10.806068420410156, -9.100028991699219, -7.393988609313965, -5.687948226928711, -3.9819087982177734, -2.2758684158325195, -0.5698318481445312, 1.1362082958221436, 2.8422484397888184, 4.548288345336914, 6.254328727722168, 7.960369110107422, 9.66640853881836, 11.372448921203613, 13.078489303588867, 14.784529685974121, 16.490570068359375, 18.196609497070312, 19.90264892578125, 21.60869026184082, 23.314729690551758, 25.020771026611328, 26.726810455322266, 28.432849884033203, 30.138891220092773, 31.84493064880371, 33.55097198486328, 35.25701141357422, 36.963050842285156, 38.669090270996094, 40.37512969970703, 42.08116912841797, 43.787208557128906, 45.493247985839844, 47.19929122924805, 48.905330657958984, 50.61137008666992, 52.31740951538086, 54.02345275878906]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 4.0, 8.0, 11.0, 14.0, 21.0, 16.0, 29.0, 28.0, 23.0, 18.0, 23.0, 34.0, 22.0, 40.0, 35.0, 43.0, 42.0, 41.0, 48.0, 45.0, 36.0, 50.0, 28.0, 32.0, 35.0, 37.0, 33.0, 26.0, 23.0, 22.0, 18.0, 20.0, 19.0, 11.0, 18.0, 7.0, 8.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-6.4140625, -6.24688720703125, -6.0797119140625, -5.91253662109375, -5.745361328125, -5.57818603515625, -5.4110107421875, -5.24383544921875, -5.07666015625, -4.90948486328125, -4.7423095703125, -4.57513427734375, -4.407958984375, -4.24078369140625, -4.0736083984375, -3.90643310546875, -3.7392578125, -3.57208251953125, -3.4049072265625, -3.23773193359375, -3.070556640625, -2.90338134765625, -2.7362060546875, -2.56903076171875, -2.40185546875, -2.23468017578125, -2.0675048828125, -1.90032958984375, -1.733154296875, -1.56597900390625, -1.3988037109375, -1.23162841796875, -1.064453125, -0.89727783203125, -0.7301025390625, -0.56292724609375, -0.395751953125, -0.22857666015625, -0.0614013671875, 0.10577392578125, 0.27294921875, 0.44012451171875, 0.6072998046875, 0.77447509765625, 0.941650390625, 1.10882568359375, 1.2760009765625, 1.44317626953125, 1.6103515625, 1.77752685546875, 1.9447021484375, 2.11187744140625, 2.279052734375, 2.44622802734375, 2.6134033203125, 2.78057861328125, 2.94775390625, 3.11492919921875, 3.2821044921875, 3.44927978515625, 3.616455078125, 3.78363037109375, 3.9508056640625, 4.11798095703125, 4.28515625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 12.0, 5.0, 14.0, 15.0, 30.0, 28.0, 57.0, 70.0, 119.0, 172.0, 314.0, 593.0, 1194.0, 2811.0, 6916.0, 18546.0, 56080.0, 204145.0, 730971.0, 1505888.0, 1122925.0, 387931.0, 105093.0, 31819.0, 10915.0, 4170.0, 1696.0, 765.0, 414.0, 211.0, 116.0, 83.0, 55.0, 41.0, 21.0, 19.0, 11.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0], "bins": [-8.1953125, -7.994140625, -7.79296875, -7.591796875, -7.390625, -7.189453125, -6.98828125, -6.787109375, -6.5859375, -6.384765625, -6.18359375, -5.982421875, -5.78125, -5.580078125, -5.37890625, -5.177734375, -4.9765625, -4.775390625, -4.57421875, -4.373046875, -4.171875, -3.970703125, -3.76953125, -3.568359375, -3.3671875, -3.166015625, -2.96484375, -2.763671875, -2.5625, -2.361328125, -2.16015625, -1.958984375, -1.7578125, -1.556640625, -1.35546875, -1.154296875, -0.953125, -0.751953125, -0.55078125, -0.349609375, -0.1484375, 0.052734375, 0.25390625, 0.455078125, 0.65625, 0.857421875, 1.05859375, 1.259765625, 1.4609375, 1.662109375, 1.86328125, 2.064453125, 2.265625, 2.466796875, 2.66796875, 2.869140625, 3.0703125, 3.271484375, 3.47265625, 3.673828125, 3.875, 4.076171875, 4.27734375, 4.478515625, 4.6796875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 8.0, 11.0, 19.0, 22.0, 25.0, 38.0, 40.0, 55.0, 69.0, 98.0, 132.0, 172.0, 225.0, 308.0, 319.0, 392.0, 412.0, 360.0, 300.0, 205.0, 188.0, 151.0, 136.0, 91.0, 71.0, 52.0, 43.0, 26.0, 23.0, 24.0, 13.0, 13.0, 4.0, 5.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.21533203125, -11.7978515625, -11.38037109375, -10.962890625, -10.54541015625, -10.1279296875, -9.71044921875, -9.29296875, -8.87548828125, -8.4580078125, -8.04052734375, -7.623046875, -7.20556640625, -6.7880859375, -6.37060546875, -5.953125, -5.53564453125, -5.1181640625, -4.70068359375, -4.283203125, -3.86572265625, -3.4482421875, -3.03076171875, -2.61328125, -2.19580078125, -1.7783203125, -1.36083984375, -0.943359375, -0.52587890625, -0.1083984375, 0.30908203125, 0.7265625, 1.14404296875, 1.5615234375, 1.97900390625, 2.396484375, 2.81396484375, 3.2314453125, 3.64892578125, 4.06640625, 4.48388671875, 4.9013671875, 5.31884765625, 5.736328125, 6.15380859375, 6.5712890625, 6.98876953125, 7.40625, 7.82373046875, 8.2412109375, 8.65869140625, 9.076171875, 9.49365234375, 9.9111328125, 10.32861328125, 10.74609375, 11.16357421875, 11.5810546875, 11.99853515625, 12.416015625, 12.83349609375, 13.2509765625, 13.66845703125, 14.0859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 9.0, 6.0, 13.0, 19.0, 27.0, 20.0, 39.0, 55.0, 71.0, 73.0, 107.0, 164.0, 262.0, 428.0, 1829.0, 222225.0, 3953382.0, 13788.0, 799.0, 309.0, 195.0, 126.0, 79.0, 63.0, 46.0, 27.0, 29.0, 25.0, 19.0, 17.0, 11.0, 5.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.9375, -67.89697265625, -65.8564453125, -63.81591796875, -61.775390625, -59.73486328125, -57.6943359375, -55.65380859375, -53.61328125, -51.57275390625, -49.5322265625, -47.49169921875, -45.451171875, -43.41064453125, -41.3701171875, -39.32958984375, -37.2890625, -35.24853515625, -33.2080078125, -31.16748046875, -29.126953125, -27.08642578125, -25.0458984375, -23.00537109375, -20.96484375, -18.92431640625, -16.8837890625, -14.84326171875, -12.802734375, -10.76220703125, -8.7216796875, -6.68115234375, -4.640625, -2.60009765625, -0.5595703125, 1.48095703125, 3.521484375, 5.56201171875, 7.6025390625, 9.64306640625, 11.68359375, 13.72412109375, 15.7646484375, 17.80517578125, 19.845703125, 21.88623046875, 23.9267578125, 25.96728515625, 28.0078125, 30.04833984375, 32.0888671875, 34.12939453125, 36.169921875, 38.21044921875, 40.2509765625, 42.29150390625, 44.33203125, 46.37255859375, 48.4130859375, 50.45361328125, 52.494140625, 54.53466796875, 56.5751953125, 58.61572265625, 60.65625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 17.0, 40.0, 84.0, 135.0, 211.0, 247.0, 156.0, 69.0, 37.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.37998962402344, -145.89996337890625, -142.419921875, -138.9398956298828, -135.45985412597656, -131.97982788085938, -128.49978637695312, -125.01976013183594, -121.53972625732422, -118.0596923828125, -114.57965850830078, -111.09962463378906, -107.61959838867188, -104.13955688476562, -100.65953063964844, -97.17949676513672, -93.699462890625, -90.21942901611328, -86.73939514160156, -83.25936126708984, -79.77932739257812, -76.29930114746094, -72.81926727294922, -69.3392333984375, -65.85919952392578, -62.37916564941406, -58.899131774902344, -55.41910171508789, -51.93906784057617, -48.45903396606445, -44.97900390625, -41.49897003173828, -38.018943786621094, -34.538909912109375, -31.05887794494629, -27.578845977783203, -24.098812103271484, -20.618778228759766, -17.13874626159668, -13.658714294433594, -10.178680419921875, -6.698647499084473, -3.2186145782470703, 0.26141834259033203, 3.7414512634277344, 7.221485137939453, 10.701517105102539, 14.181549072265625, 17.661582946777344, 21.141616821289062, 24.62164878845215, 28.101680755615234, 31.581714630126953, 35.06174850463867, 38.541778564453125, 42.021812438964844, 45.50184631347656, 48.98188018798828, 52.4619140625, 55.94194412231445, 59.42197799682617, 62.90201187133789, 66.38204193115234, 69.86207580566406, 73.34210968017578]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 7.0, 5.0, 5.0, 7.0, 21.0, 17.0, 12.0, 29.0, 28.0, 22.0, 30.0, 31.0, 40.0, 45.0, 32.0, 34.0, 45.0, 46.0, 41.0, 43.0, 44.0, 44.0, 41.0, 33.0, 48.0, 39.0, 25.0, 18.0, 34.0, 20.0, 21.0, 17.0, 11.0, 22.0, 8.0, 7.0, 8.0, 9.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.09339141845703, -49.44645309448242, -47.79951858520508, -46.15258026123047, -44.50564193725586, -42.85870361328125, -41.211769104003906, -39.5648307800293, -37.91789245605469, -36.27095413208008, -34.624019622802734, -32.977081298828125, -31.330142974853516, -29.68320655822754, -28.036270141601562, -26.389331817626953, -24.742395401000977, -23.095458984375, -21.44852066040039, -19.801584243774414, -18.154645919799805, -16.507709503173828, -14.860772132873535, -13.213834762573242, -11.56689739227295, -9.919960021972656, -8.273022651672363, -6.6260857582092285, -4.9791483879089355, -3.332211494445801, -1.6852741241455078, -0.038336753845214844, 1.6086006164550781, 3.255537986755371, 4.902475357055664, 6.549412250518799, 8.19635009765625, 9.843286514282227, 11.49022388458252, 13.137161254882812, 14.784098625183105, 16.4310359954834, 18.077972412109375, 19.724910736083984, 21.37184715270996, 23.018783569335938, 24.665721893310547, 26.312660217285156, 27.959596633911133, 29.60653305053711, 31.25347137451172, 32.90040969848633, 34.54734420776367, 36.19428253173828, 37.84122085571289, 39.4881591796875, 41.135093688964844, 42.78203201293945, 44.4289665222168, 46.075904846191406, 47.722843170166016, 49.369781494140625, 51.01671600341797, 52.66365432739258, 54.31059265136719]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 4.0, 6.0, 17.0, 21.0, 17.0, 17.0, 22.0, 21.0, 22.0, 32.0, 30.0, 38.0, 34.0, 39.0, 39.0, 43.0, 46.0, 31.0, 43.0, 44.0, 31.0, 45.0, 41.0, 32.0, 29.0, 33.0, 34.0, 22.0, 21.0, 18.0, 15.0, 13.0, 16.0, 13.0, 12.0, 9.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0], "bins": [-6.796875, -6.62548828125, -6.4541015625, -6.28271484375, -6.111328125, -5.93994140625, -5.7685546875, -5.59716796875, -5.42578125, -5.25439453125, -5.0830078125, -4.91162109375, -4.740234375, -4.56884765625, -4.3974609375, -4.22607421875, -4.0546875, -3.88330078125, -3.7119140625, -3.54052734375, -3.369140625, -3.19775390625, -3.0263671875, -2.85498046875, -2.68359375, -2.51220703125, -2.3408203125, -2.16943359375, -1.998046875, -1.82666015625, -1.6552734375, -1.48388671875, -1.3125, -1.14111328125, -0.9697265625, -0.79833984375, -0.626953125, -0.45556640625, -0.2841796875, -0.11279296875, 0.05859375, 0.22998046875, 0.4013671875, 0.57275390625, 0.744140625, 0.91552734375, 1.0869140625, 1.25830078125, 1.4296875, 1.60107421875, 1.7724609375, 1.94384765625, 2.115234375, 2.28662109375, 2.4580078125, 2.62939453125, 2.80078125, 2.97216796875, 3.1435546875, 3.31494140625, 3.486328125, 3.65771484375, 3.8291015625, 4.00048828125, 4.171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 3.0, 14.0, 17.0, 28.0, 34.0, 35.0, 68.0, 115.0, 161.0, 246.0, 327.0, 483.0, 839.0, 1349.0, 2106.0, 3270.0, 5272.0, 7855.0, 12758.0, 20587.0, 32680.0, 54383.0, 92926.0, 160812.0, 247523.0, 164398.0, 95037.0, 55151.0, 33876.0, 20512.0, 12890.0, 8208.0, 5297.0, 3301.0, 2171.0, 1335.0, 883.0, 519.0, 367.0, 240.0, 156.0, 111.0, 71.0, 41.0, 27.0, 23.0, 14.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 4.0], "bins": [-0.7958984375, -0.77142333984375, -0.7469482421875, -0.72247314453125, -0.697998046875, -0.67352294921875, -0.6490478515625, -0.62457275390625, -0.60009765625, -0.57562255859375, -0.5511474609375, -0.52667236328125, -0.502197265625, -0.47772216796875, -0.4532470703125, -0.42877197265625, -0.404296875, -0.37982177734375, -0.3553466796875, -0.33087158203125, -0.306396484375, -0.28192138671875, -0.2574462890625, -0.23297119140625, -0.20849609375, -0.18402099609375, -0.1595458984375, -0.13507080078125, -0.110595703125, -0.08612060546875, -0.0616455078125, -0.03717041015625, -0.0126953125, 0.01177978515625, 0.0362548828125, 0.06072998046875, 0.085205078125, 0.10968017578125, 0.1341552734375, 0.15863037109375, 0.18310546875, 0.20758056640625, 0.2320556640625, 0.25653076171875, 0.281005859375, 0.30548095703125, 0.3299560546875, 0.35443115234375, 0.37890625, 0.40338134765625, 0.4278564453125, 0.45233154296875, 0.476806640625, 0.50128173828125, 0.5257568359375, 0.55023193359375, 0.57470703125, 0.59918212890625, 0.6236572265625, 0.64813232421875, 0.672607421875, 0.69708251953125, 0.7215576171875, 0.74603271484375, 0.7705078125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 2.0, 3.0, 8.0, 7.0, 11.0, 10.0, 22.0, 24.0, 18.0, 19.0, 29.0, 21.0, 39.0, 36.0, 43.0, 37.0, 44.0, 43.0, 49.0, 1068.0, 55.0, 52.0, 32.0, 45.0, 39.0, 31.0, 23.0, 37.0, 34.0, 27.0, 18.0, 20.0, 24.0, 15.0, 7.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.659820556640625, -3.53643798828125, -3.413055419921875, -3.2896728515625, -3.166290283203125, -3.04290771484375, -2.919525146484375, -2.796142578125, -2.672760009765625, -2.54937744140625, -2.425994873046875, -2.3026123046875, -2.179229736328125, -2.05584716796875, -1.932464599609375, -1.80908203125, -1.685699462890625, -1.56231689453125, -1.438934326171875, -1.3155517578125, -1.192169189453125, -1.06878662109375, -0.945404052734375, -0.822021484375, -0.698638916015625, -0.57525634765625, -0.451873779296875, -0.3284912109375, -0.205108642578125, -0.08172607421875, 0.041656494140625, 0.1650390625, 0.288421630859375, 0.41180419921875, 0.535186767578125, 0.6585693359375, 0.781951904296875, 0.90533447265625, 1.028717041015625, 1.152099609375, 1.275482177734375, 1.39886474609375, 1.522247314453125, 1.6456298828125, 1.769012451171875, 1.89239501953125, 2.015777587890625, 2.13916015625, 2.262542724609375, 2.38592529296875, 2.509307861328125, 2.6326904296875, 2.756072998046875, 2.87945556640625, 3.002838134765625, 3.126220703125, 3.249603271484375, 3.37298583984375, 3.496368408203125, 3.6197509765625, 3.743133544921875, 3.86651611328125, 3.989898681640625, 4.11328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 10.0, 11.0, 24.0, 36.0, 52.0, 92.0, 117.0, 202.0, 305.0, 451.0, 670.0, 1041.0, 1567.0, 2360.0, 3741.0, 5807.0, 8770.0, 13625.0, 21635.0, 34822.0, 58092.0, 100959.0, 181413.0, 1300886.0, 146623.0, 83805.0, 48241.0, 29448.0, 18518.0, 11795.0, 7622.0, 5057.0, 3221.0, 2015.0, 1454.0, 902.0, 560.0, 390.0, 266.0, 164.0, 110.0, 85.0, 54.0, 35.0, 17.0, 15.0, 7.0, 7.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-0.75341796875, -0.7293701171875, -0.705322265625, -0.6812744140625, -0.6572265625, -0.6331787109375, -0.609130859375, -0.5850830078125, -0.56103515625, -0.5369873046875, -0.512939453125, -0.4888916015625, -0.46484375, -0.4407958984375, -0.416748046875, -0.3927001953125, -0.36865234375, -0.3446044921875, -0.320556640625, -0.2965087890625, -0.2724609375, -0.2484130859375, -0.224365234375, -0.2003173828125, -0.17626953125, -0.1522216796875, -0.128173828125, -0.1041259765625, -0.080078125, -0.0560302734375, -0.031982421875, -0.0079345703125, 0.01611328125, 0.0401611328125, 0.064208984375, 0.0882568359375, 0.1123046875, 0.1363525390625, 0.160400390625, 0.1844482421875, 0.20849609375, 0.2325439453125, 0.256591796875, 0.2806396484375, 0.3046875, 0.3287353515625, 0.352783203125, 0.3768310546875, 0.40087890625, 0.4249267578125, 0.448974609375, 0.4730224609375, 0.4970703125, 0.5211181640625, 0.545166015625, 0.5692138671875, 0.59326171875, 0.6173095703125, 0.641357421875, 0.6654052734375, 0.689453125, 0.7135009765625, 0.737548828125, 0.7615966796875, 0.78564453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 5.0, 4.0, 2.0, 5.0, 8.0, 7.0, 15.0, 17.0, 19.0, 28.0, 37.0, 36.0, 44.0, 55.0, 81.0, 89.0, 93.0, 89.0, 71.0, 48.0, 51.0, 34.0, 30.0, 26.0, 15.0, 12.0, 11.0, 14.0, 8.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008287429809570312, -0.000802166759967804, -0.0007755905389785767, -0.0007490143179893494, -0.0007224380970001221, -0.0006958618760108948, -0.0006692856550216675, -0.0006427094340324402, -0.0006161332130432129, -0.0005895569920539856, -0.0005629807710647583, -0.000536404550075531, -0.0005098283290863037, -0.0004832521080970764, -0.0004566758871078491, -0.0004300996661186218, -0.00040352344512939453, -0.00037694722414016724, -0.00035037100315093994, -0.00032379478216171265, -0.00029721856117248535, -0.00027064234018325806, -0.00024406611919403076, -0.00021748989820480347, -0.00019091367721557617, -0.00016433745622634888, -0.00013776123523712158, -0.00011118501424789429, -8.460879325866699e-05, -5.80325722694397e-05, -3.14563512802124e-05, -4.880130290985107e-06, 2.1696090698242188e-05, 4.827231168746948e-05, 7.484853267669678e-05, 0.00010142475366592407, 0.00012800097465515137, 0.00015457719564437866, 0.00018115341663360596, 0.00020772963762283325, 0.00023430585861206055, 0.00026088207960128784, 0.00028745830059051514, 0.00031403452157974243, 0.0003406107425689697, 0.000367186963558197, 0.0003937631845474243, 0.0004203394055366516, 0.0004469156265258789, 0.0004734918475151062, 0.0005000680685043335, 0.0005266442894935608, 0.0005532205104827881, 0.0005797967314720154, 0.0006063729524612427, 0.00063294917345047, 0.0006595253944396973, 0.0006861016154289246, 0.0007126778364181519, 0.0007392540574073792, 0.0007658302783966064, 0.0007924064993858337, 0.000818982720375061, 0.0008455589413642883, 0.0008721351623535156]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 9.0, 10.0, 8.0, 9.0, 18.0, 18.0, 22.0, 31.0, 53.0, 84.0, 144.0, 306.0, 947.0, 975808.0, 69823.0, 659.0, 235.0, 118.0, 67.0, 38.0, 30.0, 19.0, 19.0, 13.0, 12.0, 6.0, 3.0, 5.0, 5.0, 6.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02484130859375, -0.024085283279418945, -0.02332925796508789, -0.022573232650756836, -0.02181720733642578, -0.021061182022094727, -0.020305156707763672, -0.019549131393432617, -0.018793106079101562, -0.018037080764770508, -0.017281055450439453, -0.0165250301361084, -0.015769004821777344, -0.015012979507446289, -0.014256954193115234, -0.01350092887878418, -0.012744903564453125, -0.01198887825012207, -0.011232852935791016, -0.010476827621459961, -0.009720802307128906, -0.008964776992797852, -0.008208751678466797, -0.007452726364135742, -0.0066967010498046875, -0.005940675735473633, -0.005184650421142578, -0.0044286251068115234, -0.0036725997924804688, -0.002916574478149414, -0.0021605491638183594, -0.0014045238494873047, -0.00064849853515625, 0.00010752677917480469, 0.0008635520935058594, 0.001619577407836914, 0.0023756027221679688, 0.0031316280364990234, 0.003887653350830078, 0.004643678665161133, 0.0053997039794921875, 0.006155729293823242, 0.006911754608154297, 0.0076677799224853516, 0.008423805236816406, 0.009179830551147461, 0.009935855865478516, 0.01069188117980957, 0.011447906494140625, 0.01220393180847168, 0.012959957122802734, 0.013715982437133789, 0.014472007751464844, 0.015228033065795898, 0.015984058380126953, 0.016740083694458008, 0.017496109008789062, 0.018252134323120117, 0.019008159637451172, 0.019764184951782227, 0.02052021026611328, 0.021276235580444336, 0.02203226089477539, 0.022788286209106445, 0.0235443115234375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 518.0, 498.0, 3.0], "bins": [-0.00933971256017685, -0.009189039468765259, -0.009038367308676243, -0.008887694217264652, -0.008737021125853062, -0.008586348965764046, -0.008435675874352455, -0.008285002782940865, -0.008134330622851849, -0.007983657531440258, -0.007832985371351242, -0.0076823122799396515, -0.007531639654189348, -0.007380967028439045, -0.007230293937027454, -0.007079621311277151, -0.006928948685526848, -0.006778276059776545, -0.006627602968364954, -0.006476930342614651, -0.0063262577168643475, -0.006175585091114044, -0.006024911999702454, -0.00587423937395215, -0.00572356628254056, -0.0055728936567902565, -0.005422220565378666, -0.005271547939628363, -0.005120875313878059, -0.004970202688127756, -0.0048195295967161655, -0.004668856970965862, -0.004518184810876846, -0.004367512185126543, -0.0042168390937149525, -0.004066166467964649, -0.003915493842214346, -0.003764820983633399, -0.003614148125052452, -0.003463475499302149, -0.003312802640721202, -0.003162129782140255, -0.0030114571563899517, -0.002860784297809005, -0.0027101116720587015, -0.0025594388134777546, -0.0024087661877274513, -0.0022580933291465044, -0.0021074204705655575, -0.0019567476119846106, -0.0018060749862343073, -0.0016554021276533604, -0.001504729501903057, -0.0013540566433221102, -0.001203383901156485, -0.00105271115899086, -0.0009020384750328958, -0.0007513657328672707, -0.0006006929324939847, -0.0004500201903283596, -0.0002993474481627345, -0.0001486747059971094, 1.9980943761765957e-06, 0.0001526708365418017, 0.0003033435787074268]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 16.0, 8.0, 20.0, 11.0, 19.0, 28.0, 23.0, 28.0, 32.0, 37.0, 43.0, 32.0, 43.0, 36.0, 54.0, 36.0, 43.0, 46.0, 39.0, 46.0, 44.0, 35.0, 39.0, 34.0, 22.0, 30.0, 21.0, 19.0, 14.0, 9.0, 13.0, 13.0, 10.0, 9.0, 4.0, 7.0, 4.0, 3.0, 1.0, 4.0], "bins": [-0.0005096197128295898, -0.0004967181012034416, -0.0004838164895772934, -0.00047091487795114517, -0.00045801326632499695, -0.0004451116546988487, -0.0004322100430727005, -0.0004193084314465523, -0.00040640681982040405, -0.00039350520819425583, -0.0003806035965681076, -0.0003677019849419594, -0.00035480037331581116, -0.00034189876168966293, -0.0003289971500635147, -0.0003160955384373665, -0.00030319392681121826, -0.00029029231518507004, -0.0002773907035589218, -0.0002644890919327736, -0.00025158748030662537, -0.00023868586868047714, -0.00022578425705432892, -0.0002128826454281807, -0.00019998103380203247, -0.00018707942217588425, -0.00017417781054973602, -0.0001612761989235878, -0.00014837458729743958, -0.00013547297567129135, -0.00012257136404514313, -0.0001096697524189949, -9.676814079284668e-05, -8.386652916669846e-05, -7.096491754055023e-05, -5.806330591440201e-05, -4.5161694288253784e-05, -3.226008266210556e-05, -1.9358471035957336e-05, -6.4568594098091125e-06, 6.444752216339111e-06, 1.9346363842487335e-05, 3.224797546863556e-05, 4.514958709478378e-05, 5.805119872093201e-05, 7.095281034708023e-05, 8.385442197322845e-05, 9.675603359937668e-05, 0.0001096576452255249, 0.00012255925685167313, 0.00013546086847782135, 0.00014836248010396957, 0.0001612640917301178, 0.00017416570335626602, 0.00018706731498241425, 0.00019996892660856247, 0.0002128705382347107, 0.00022577214986085892, 0.00023867376148700714, 0.00025157537311315536, 0.0002644769847393036, 0.0002773785963654518, 0.00029028020799160004, 0.00030318181961774826, 0.0003160834312438965]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 4.0, 6.0, 17.0, 21.0, 17.0, 17.0, 22.0, 21.0, 22.0, 32.0, 30.0, 38.0, 34.0, 39.0, 39.0, 43.0, 46.0, 31.0, 43.0, 44.0, 31.0, 45.0, 41.0, 32.0, 29.0, 33.0, 34.0, 22.0, 21.0, 18.0, 15.0, 13.0, 16.0, 13.0, 12.0, 9.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0], "bins": [-6.796875, -6.62548828125, -6.4541015625, -6.28271484375, -6.111328125, -5.93994140625, -5.7685546875, -5.59716796875, -5.42578125, -5.25439453125, -5.0830078125, -4.91162109375, -4.740234375, -4.56884765625, -4.3974609375, -4.22607421875, -4.0546875, -3.88330078125, -3.7119140625, -3.54052734375, -3.369140625, -3.19775390625, -3.0263671875, -2.85498046875, -2.68359375, -2.51220703125, -2.3408203125, -2.16943359375, -1.998046875, -1.82666015625, -1.6552734375, -1.48388671875, -1.3125, -1.14111328125, -0.9697265625, -0.79833984375, -0.626953125, -0.45556640625, -0.2841796875, -0.11279296875, 0.05859375, 0.22998046875, 0.4013671875, 0.57275390625, 0.744140625, 0.91552734375, 1.0869140625, 1.25830078125, 1.4296875, 1.60107421875, 1.7724609375, 1.94384765625, 2.115234375, 2.28662109375, 2.4580078125, 2.62939453125, 2.80078125, 2.97216796875, 3.1435546875, 3.31494140625, 3.486328125, 3.65771484375, 3.8291015625, 4.00048828125, 4.171875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 10.0, 11.0, 12.0, 18.0, 17.0, 27.0, 37.0, 69.0, 89.0, 151.0, 217.0, 365.0, 619.0, 1256.0, 2581.0, 5374.0, 13537.0, 36860.0, 107303.0, 323482.0, 362906.0, 124039.0, 42293.0, 15277.0, 6130.0, 2720.0, 1371.0, 673.0, 403.0, 241.0, 131.0, 108.0, 68.0, 49.0, 32.0, 19.0, 15.0, 10.0, 9.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.203125, -5.062744140625, -4.92236328125, -4.781982421875, -4.6416015625, -4.501220703125, -4.36083984375, -4.220458984375, -4.080078125, -3.939697265625, -3.79931640625, -3.658935546875, -3.5185546875, -3.378173828125, -3.23779296875, -3.097412109375, -2.95703125, -2.816650390625, -2.67626953125, -2.535888671875, -2.3955078125, -2.255126953125, -2.11474609375, -1.974365234375, -1.833984375, -1.693603515625, -1.55322265625, -1.412841796875, -1.2724609375, -1.132080078125, -0.99169921875, -0.851318359375, -0.7109375, -0.570556640625, -0.43017578125, -0.289794921875, -0.1494140625, -0.009033203125, 0.13134765625, 0.271728515625, 0.412109375, 0.552490234375, 0.69287109375, 0.833251953125, 0.9736328125, 1.114013671875, 1.25439453125, 1.394775390625, 1.53515625, 1.675537109375, 1.81591796875, 1.956298828125, 2.0966796875, 2.237060546875, 2.37744140625, 2.517822265625, 2.658203125, 2.798583984375, 2.93896484375, 3.079345703125, 3.2197265625, 3.360107421875, 3.50048828125, 3.640869140625, 3.78125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 10.0, 11.0, 20.0, 30.0, 22.0, 28.0, 26.0, 29.0, 47.0, 56.0, 53.0, 75.0, 91.0, 429.0, 1596.0, 108.0, 82.0, 57.0, 41.0, 33.0, 32.0, 28.0, 27.0, 20.0, 21.0, 15.0, 13.0, 12.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.828125, -29.99609375, -29.1640625, -28.33203125, -27.5, -26.66796875, -25.8359375, -25.00390625, -24.171875, -23.33984375, -22.5078125, -21.67578125, -20.84375, -20.01171875, -19.1796875, -18.34765625, -17.515625, -16.68359375, -15.8515625, -15.01953125, -14.1875, -13.35546875, -12.5234375, -11.69140625, -10.859375, -10.02734375, -9.1953125, -8.36328125, -7.53125, -6.69921875, -5.8671875, -5.03515625, -4.203125, -3.37109375, -2.5390625, -1.70703125, -0.875, -0.04296875, 0.7890625, 1.62109375, 2.453125, 3.28515625, 4.1171875, 4.94921875, 5.78125, 6.61328125, 7.4453125, 8.27734375, 9.109375, 9.94140625, 10.7734375, 11.60546875, 12.4375, 13.26953125, 14.1015625, 14.93359375, 15.765625, 16.59765625, 17.4296875, 18.26171875, 19.09375, 19.92578125, 20.7578125, 21.58984375, 22.421875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 9.0, 5.0, 15.0, 24.0, 23.0, 44.0, 40.0, 68.0, 106.0, 186.0, 325.0, 730.0, 10046.0, 3127482.0, 5156.0, 610.0, 303.0, 194.0, 101.0, 66.0, 45.0, 47.0, 32.0, 15.0, 12.0, 10.0, 8.0, 5.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-72.8125, -70.69775390625, -68.5830078125, -66.46826171875, -64.353515625, -62.23876953125, -60.1240234375, -58.00927734375, -55.89453125, -53.77978515625, -51.6650390625, -49.55029296875, -47.435546875, -45.32080078125, -43.2060546875, -41.09130859375, -38.9765625, -36.86181640625, -34.7470703125, -32.63232421875, -30.517578125, -28.40283203125, -26.2880859375, -24.17333984375, -22.05859375, -19.94384765625, -17.8291015625, -15.71435546875, -13.599609375, -11.48486328125, -9.3701171875, -7.25537109375, -5.140625, -3.02587890625, -0.9111328125, 1.20361328125, 3.318359375, 5.43310546875, 7.5478515625, 9.66259765625, 11.77734375, 13.89208984375, 16.0068359375, 18.12158203125, 20.236328125, 22.35107421875, 24.4658203125, 26.58056640625, 28.6953125, 30.81005859375, 32.9248046875, 35.03955078125, 37.154296875, 39.26904296875, 41.3837890625, 43.49853515625, 45.61328125, 47.72802734375, 49.8427734375, 51.95751953125, 54.072265625, 56.18701171875, 58.3017578125, 60.41650390625, 62.53125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 163.0, 838.0, 13.0, 2.0, 0.0, 0.0, 1.0], "bins": [-364.9888610839844, -358.7249450683594, -352.4610290527344, -346.1971130371094, -339.9331970214844, -333.6692810058594, -327.4053649902344, -321.1414489746094, -314.8775329589844, -308.6136169433594, -302.3497009277344, -296.0857849121094, -289.8218688964844, -283.5579528808594, -277.2940368652344, -271.0301208496094, -264.76617431640625, -258.50225830078125, -252.23834228515625, -245.97442626953125, -239.71051025390625, -233.44659423828125, -227.18267822265625, -220.91876220703125, -214.65484619140625, -208.39093017578125, -202.12701416015625, -195.86309814453125, -189.59918212890625, -183.33526611328125, -177.07135009765625, -170.80743408203125, -164.54351806640625, -158.27960205078125, -152.01568603515625, -145.75177001953125, -139.48785400390625, -133.22393798828125, -126.96001434326172, -120.69609832763672, -114.43217468261719, -108.16825866699219, -101.90434265136719, -95.64042663574219, -89.37651062011719, -83.11259460449219, -76.84867095947266, -70.58475494384766, -64.32083892822266, -58.056922912597656, -51.793006896972656, -45.52908706665039, -39.26517105102539, -33.00125503540039, -26.737335205078125, -20.473419189453125, -14.209503173828125, -7.945586204528809, -1.6816692352294922, 4.582248687744141, 10.84616470336914, 17.11008071899414, 23.374000549316406, 29.637916564941406, 35.901832580566406]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 6.0, 4.0, 6.0, 11.0, 7.0, 16.0, 16.0, 20.0, 25.0, 16.0, 28.0, 23.0, 28.0, 42.0, 34.0, 39.0, 27.0, 42.0, 44.0, 38.0, 50.0, 44.0, 37.0, 27.0, 34.0, 40.0, 41.0, 31.0, 20.0, 24.0, 19.0, 21.0, 17.0, 18.0, 18.0, 17.0, 9.0, 10.0, 7.0, 14.0, 9.0, 9.0, 2.0, 6.0, 2.0, 0.0, 2.0, 4.0, 4.0], "bins": [-58.86090087890625, -57.23533248901367, -55.60976028442383, -53.98419189453125, -52.358619689941406, -50.73305130004883, -49.10748291015625, -47.481910705566406, -45.85633850097656, -44.230770111083984, -42.60519790649414, -40.97962951660156, -39.35405731201172, -37.72848892211914, -36.10292053222656, -34.47734832763672, -32.85177993774414, -31.22620964050293, -29.60063934326172, -27.97507095336914, -26.349498748779297, -24.72393035888672, -23.098360061645508, -21.472789764404297, -19.847219467163086, -18.221649169921875, -16.596078872680664, -14.97050952911377, -13.344939231872559, -11.719368934631348, -10.093799591064453, -8.468229293823242, -6.842658996582031, -5.21708869934082, -3.5915188789367676, -1.9659490585327148, -0.3403787612915039, 1.285191535949707, 2.9107608795166016, 4.5363311767578125, 6.161901473999023, 7.787471771240234, 9.413042068481445, 11.03861141204834, 12.66418170928955, 14.289752006530762, 15.915321350097656, 17.540891647338867, 19.166461944580078, 20.79203224182129, 22.4176025390625, 24.043170928955078, 25.668743133544922, 27.2943115234375, 28.91988182067871, 30.545452117919922, 32.1710205078125, 33.79658889770508, 35.42216110229492, 37.0477294921875, 38.673301696777344, 40.29887008666992, 41.9244384765625, 43.550010681152344, 45.17558288574219]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 11.0, 10.0, 10.0, 9.0, 16.0, 15.0, 16.0, 21.0, 15.0, 32.0, 23.0, 27.0, 32.0, 42.0, 35.0, 48.0, 33.0, 43.0, 38.0, 40.0, 44.0, 36.0, 40.0, 39.0, 36.0, 32.0, 24.0, 39.0, 25.0, 21.0, 17.0, 18.0, 21.0, 19.0, 9.0, 7.0, 15.0, 9.0, 12.0, 9.0, 4.0, 3.0, 2.0, 3.0], "bins": [-6.8359375, -6.66192626953125, -6.4879150390625, -6.31390380859375, -6.139892578125, -5.96588134765625, -5.7918701171875, -5.61785888671875, -5.44384765625, -5.26983642578125, -5.0958251953125, -4.92181396484375, -4.747802734375, -4.57379150390625, -4.3997802734375, -4.22576904296875, -4.0517578125, -3.87774658203125, -3.7037353515625, -3.52972412109375, -3.355712890625, -3.18170166015625, -3.0076904296875, -2.83367919921875, -2.65966796875, -2.48565673828125, -2.3116455078125, -2.13763427734375, -1.963623046875, -1.78961181640625, -1.6156005859375, -1.44158935546875, -1.267578125, -1.09356689453125, -0.9195556640625, -0.74554443359375, -0.571533203125, -0.39752197265625, -0.2235107421875, -0.04949951171875, 0.12451171875, 0.29852294921875, 0.4725341796875, 0.64654541015625, 0.820556640625, 0.99456787109375, 1.1685791015625, 1.34259033203125, 1.5166015625, 1.69061279296875, 1.8646240234375, 2.03863525390625, 2.212646484375, 2.38665771484375, 2.5606689453125, 2.73468017578125, 2.90869140625, 3.08270263671875, 3.2567138671875, 3.43072509765625, 3.604736328125, 3.77874755859375, 3.9527587890625, 4.12677001953125, 4.30078125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 9.0, 10.0, 12.0, 14.0, 18.0, 14.0, 17.0, 20.0, 18.0, 36.0, 32.0, 54.0, 71.0, 120.0, 153.0, 365.0, 1873.0, 59539.0, 3724020.0, 401970.0, 4709.0, 479.0, 221.0, 101.0, 94.0, 51.0, 39.0, 33.0, 21.0, 19.0, 15.0, 24.0, 12.0, 17.0, 22.0, 9.0, 9.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 4.0], "bins": [-36.6875, -35.73876953125, -34.7900390625, -33.84130859375, -32.892578125, -31.94384765625, -30.9951171875, -30.04638671875, -29.09765625, -28.14892578125, -27.2001953125, -26.25146484375, -25.302734375, -24.35400390625, -23.4052734375, -22.45654296875, -21.5078125, -20.55908203125, -19.6103515625, -18.66162109375, -17.712890625, -16.76416015625, -15.8154296875, -14.86669921875, -13.91796875, -12.96923828125, -12.0205078125, -11.07177734375, -10.123046875, -9.17431640625, -8.2255859375, -7.27685546875, -6.328125, -5.37939453125, -4.4306640625, -3.48193359375, -2.533203125, -1.58447265625, -0.6357421875, 0.31298828125, 1.26171875, 2.21044921875, 3.1591796875, 4.10791015625, 5.056640625, 6.00537109375, 6.9541015625, 7.90283203125, 8.8515625, 9.80029296875, 10.7490234375, 11.69775390625, 12.646484375, 13.59521484375, 14.5439453125, 15.49267578125, 16.44140625, 17.39013671875, 18.3388671875, 19.28759765625, 20.236328125, 21.18505859375, 22.1337890625, 23.08251953125, 24.03125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 11.0, 18.0, 21.0, 24.0, 32.0, 70.0, 77.0, 118.0, 168.0, 269.0, 318.0, 431.0, 506.0, 461.0, 455.0, 278.0, 265.0, 172.0, 110.0, 80.0, 53.0, 31.0, 32.0, 14.0, 21.0, 7.0, 8.0, 6.0, 4.0, 4.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.328125, -16.846923828125, -16.36572265625, -15.884521484375, -15.4033203125, -14.922119140625, -14.44091796875, -13.959716796875, -13.478515625, -12.997314453125, -12.51611328125, -12.034912109375, -11.5537109375, -11.072509765625, -10.59130859375, -10.110107421875, -9.62890625, -9.147705078125, -8.66650390625, -8.185302734375, -7.7041015625, -7.222900390625, -6.74169921875, -6.260498046875, -5.779296875, -5.298095703125, -4.81689453125, -4.335693359375, -3.8544921875, -3.373291015625, -2.89208984375, -2.410888671875, -1.9296875, -1.448486328125, -0.96728515625, -0.486083984375, -0.0048828125, 0.476318359375, 0.95751953125, 1.438720703125, 1.919921875, 2.401123046875, 2.88232421875, 3.363525390625, 3.8447265625, 4.325927734375, 4.80712890625, 5.288330078125, 5.76953125, 6.250732421875, 6.73193359375, 7.213134765625, 7.6943359375, 8.175537109375, 8.65673828125, 9.137939453125, 9.619140625, 10.100341796875, 10.58154296875, 11.062744140625, 11.5439453125, 12.025146484375, 12.50634765625, 12.987548828125, 13.46875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 9.0, 19.0, 17.0, 13.0, 41.0, 37.0, 64.0, 70.0, 84.0, 128.0, 170.0, 264.0, 427.0, 1099.0, 26402.0, 4062155.0, 100013.0, 1631.0, 567.0, 327.0, 201.0, 138.0, 115.0, 84.0, 57.0, 31.0, 24.0, 18.0, 16.0, 16.0, 4.0, 4.0, 3.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.46875, -53.52978515625, -51.5908203125, -49.65185546875, -47.712890625, -45.77392578125, -43.8349609375, -41.89599609375, -39.95703125, -38.01806640625, -36.0791015625, -34.14013671875, -32.201171875, -30.26220703125, -28.3232421875, -26.38427734375, -24.4453125, -22.50634765625, -20.5673828125, -18.62841796875, -16.689453125, -14.75048828125, -12.8115234375, -10.87255859375, -8.93359375, -6.99462890625, -5.0556640625, -3.11669921875, -1.177734375, 0.76123046875, 2.7001953125, 4.63916015625, 6.578125, 8.51708984375, 10.4560546875, 12.39501953125, 14.333984375, 16.27294921875, 18.2119140625, 20.15087890625, 22.08984375, 24.02880859375, 25.9677734375, 27.90673828125, 29.845703125, 31.78466796875, 33.7236328125, 35.66259765625, 37.6015625, 39.54052734375, 41.4794921875, 43.41845703125, 45.357421875, 47.29638671875, 49.2353515625, 51.17431640625, 53.11328125, 55.05224609375, 56.9912109375, 58.93017578125, 60.869140625, 62.80810546875, 64.7470703125, 66.68603515625, 68.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 116.0, 272.0, 336.0, 205.0, 64.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.97164154052734, -69.35172271728516, -63.73180389404297, -58.111881256103516, -52.49196243286133, -46.87204360961914, -41.25212097167969, -35.6322021484375, -30.012283325195312, -24.392364501953125, -18.772443771362305, -13.152523040771484, -7.532604217529297, -1.9126853942871094, 3.7072372436523438, 9.327156066894531, 14.947074890136719, 20.566993713378906, 26.186914443969727, 31.806835174560547, 37.426753997802734, 43.04667282104492, 48.666595458984375, 54.28651428222656, 59.90643310546875, 65.52635192871094, 71.14627075195312, 76.76618957519531, 82.3861083984375, 88.00602722167969, 93.6259536743164, 99.2458724975586, 104.86578369140625, 110.48570251464844, 116.10562133789062, 121.72554016113281, 127.345458984375, 132.9653778076172, 138.58529663085938, 144.20523071289062, 149.82513427734375, 155.44505310058594, 161.06497192382812, 166.6848907470703, 172.3048095703125, 177.9247283935547, 183.54464721679688, 189.16458129882812, 194.7845001220703, 200.4044189453125, 206.0243377685547, 211.64425659179688, 217.26417541503906, 222.88409423828125, 228.5040283203125, 234.12393188476562, 239.74386596679688, 245.36378479003906, 250.98370361328125, 256.6036376953125, 262.2235412597656, 267.8434753417969, 273.46337890625, 279.08331298828125, 284.7032165527344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 2.0, 11.0, 7.0, 12.0, 12.0, 20.0, 8.0, 12.0, 24.0, 28.0, 21.0, 31.0, 31.0, 27.0, 32.0, 41.0, 38.0, 44.0, 42.0, 35.0, 49.0, 33.0, 47.0, 44.0, 38.0, 22.0, 37.0, 33.0, 28.0, 35.0, 22.0, 28.0, 17.0, 18.0, 13.0, 15.0, 9.0, 6.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-42.17071533203125, -40.77130126953125, -39.371883392333984, -37.972469329833984, -36.573055267333984, -35.17363739013672, -33.77422332763672, -32.37480926513672, -30.975393295288086, -29.575977325439453, -28.176563262939453, -26.77714729309082, -25.377731323242188, -23.978317260742188, -22.578901290893555, -21.179485321044922, -19.780071258544922, -18.38065528869629, -16.98124122619629, -15.581825256347656, -14.18241024017334, -12.782995223999023, -11.38357925415039, -9.984164237976074, -8.584749221801758, -7.185334205627441, -5.785918712615967, -4.386503219604492, -2.987088203430176, -1.5876731872558594, -0.18825721740722656, 1.2111577987670898, 2.6105728149414062, 4.009987831115723, 5.409403324127197, 6.808818817138672, 8.208233833312988, 9.607648849487305, 11.007064819335938, 12.406479835510254, 13.80589485168457, 15.205309867858887, 16.604724884033203, 18.004140853881836, 19.40355682373047, 20.80297088623047, 22.2023868560791, 23.601802825927734, 25.001216888427734, 26.400632858276367, 27.800046920776367, 29.199462890625, 30.598876953125, 31.998292922973633, 33.397708892822266, 34.797122955322266, 36.19654083251953, 37.59595489501953, 38.9953727722168, 40.3947868347168, 41.7942008972168, 43.19361877441406, 44.59303283691406, 45.99244689941406, 47.39186096191406]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 10.0, 4.0, 12.0, 7.0, 6.0, 7.0, 16.0, 17.0, 16.0, 29.0, 18.0, 27.0, 26.0, 25.0, 31.0, 45.0, 41.0, 40.0, 45.0, 58.0, 49.0, 45.0, 42.0, 36.0, 34.0, 36.0, 24.0, 24.0, 31.0, 36.0, 24.0, 24.0, 10.0, 24.0, 12.0, 19.0, 12.0, 10.0, 11.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 4.0], "bins": [-7.0390625, -6.856689453125, -6.67431640625, -6.491943359375, -6.3095703125, -6.127197265625, -5.94482421875, -5.762451171875, -5.580078125, -5.397705078125, -5.21533203125, -5.032958984375, -4.8505859375, -4.668212890625, -4.48583984375, -4.303466796875, -4.12109375, -3.938720703125, -3.75634765625, -3.573974609375, -3.3916015625, -3.209228515625, -3.02685546875, -2.844482421875, -2.662109375, -2.479736328125, -2.29736328125, -2.114990234375, -1.9326171875, -1.750244140625, -1.56787109375, -1.385498046875, -1.203125, -1.020751953125, -0.83837890625, -0.656005859375, -0.4736328125, -0.291259765625, -0.10888671875, 0.073486328125, 0.255859375, 0.438232421875, 0.62060546875, 0.802978515625, 0.9853515625, 1.167724609375, 1.35009765625, 1.532470703125, 1.71484375, 1.897216796875, 2.07958984375, 2.261962890625, 2.4443359375, 2.626708984375, 2.80908203125, 2.991455078125, 3.173828125, 3.356201171875, 3.53857421875, 3.720947265625, 3.9033203125, 4.085693359375, 4.26806640625, 4.450439453125, 4.6328125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 5.0, 9.0, 4.0, 18.0, 16.0, 38.0, 52.0, 74.0, 107.0, 178.0, 292.0, 386.0, 640.0, 905.0, 1409.0, 2073.0, 3100.0, 4835.0, 7433.0, 11621.0, 18250.0, 29929.0, 50014.0, 85708.0, 152340.0, 261764.0, 174137.0, 96690.0, 56298.0, 33379.0, 20272.0, 13074.0, 8116.0, 5351.0, 3381.0, 2300.0, 1474.0, 982.0, 632.0, 423.0, 275.0, 195.0, 127.0, 80.0, 54.0, 40.0, 30.0, 20.0, 6.0, 11.0, 5.0, 0.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.8486328125, -0.8217849731445312, -0.7949371337890625, -0.7680892944335938, -0.741241455078125, -0.7143936157226562, -0.6875457763671875, -0.6606979370117188, -0.63385009765625, -0.6070022583007812, -0.5801544189453125, -0.5533065795898438, -0.526458740234375, -0.49961090087890625, -0.4727630615234375, -0.44591522216796875, -0.4190673828125, -0.39221954345703125, -0.3653717041015625, -0.33852386474609375, -0.311676025390625, -0.28482818603515625, -0.2579803466796875, -0.23113250732421875, -0.20428466796875, -0.17743682861328125, -0.1505889892578125, -0.12374114990234375, -0.096893310546875, -0.07004547119140625, -0.0431976318359375, -0.01634979248046875, 0.010498046875, 0.03734588623046875, 0.0641937255859375, 0.09104156494140625, 0.117889404296875, 0.14473724365234375, 0.1715850830078125, 0.19843292236328125, 0.22528076171875, 0.25212860107421875, 0.2789764404296875, 0.30582427978515625, 0.332672119140625, 0.35951995849609375, 0.3863677978515625, 0.41321563720703125, 0.4400634765625, 0.46691131591796875, 0.4937591552734375, 0.5206069946289062, 0.547454833984375, 0.5743026733398438, 0.6011505126953125, 0.6279983520507812, 0.65484619140625, 0.6816940307617188, 0.7085418701171875, 0.7353897094726562, 0.762237548828125, 0.7890853881835938, 0.8159332275390625, 0.8427810668945312, 0.86962890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 9.0, 4.0, 4.0, 10.0, 11.0, 19.0, 21.0, 23.0, 25.0, 19.0, 24.0, 25.0, 31.0, 41.0, 29.0, 37.0, 41.0, 53.0, 48.0, 1065.0, 47.0, 57.0, 43.0, 42.0, 32.0, 32.0, 31.0, 21.0, 27.0, 18.0, 17.0, 18.0, 14.0, 21.0, 19.0, 7.0, 12.0, 7.0, 2.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.466949462890625, -3.35382080078125, -3.240692138671875, -3.1275634765625, -3.014434814453125, -2.90130615234375, -2.788177490234375, -2.675048828125, -2.561920166015625, -2.44879150390625, -2.335662841796875, -2.2225341796875, -2.109405517578125, -1.99627685546875, -1.883148193359375, -1.77001953125, -1.656890869140625, -1.54376220703125, -1.430633544921875, -1.3175048828125, -1.204376220703125, -1.09124755859375, -0.978118896484375, -0.864990234375, -0.751861572265625, -0.63873291015625, -0.525604248046875, -0.4124755859375, -0.299346923828125, -0.18621826171875, -0.073089599609375, 0.0400390625, 0.153167724609375, 0.26629638671875, 0.379425048828125, 0.4925537109375, 0.605682373046875, 0.71881103515625, 0.831939697265625, 0.945068359375, 1.058197021484375, 1.17132568359375, 1.284454345703125, 1.3975830078125, 1.510711669921875, 1.62384033203125, 1.736968994140625, 1.85009765625, 1.963226318359375, 2.07635498046875, 2.189483642578125, 2.3026123046875, 2.415740966796875, 2.52886962890625, 2.641998291015625, 2.755126953125, 2.868255615234375, 2.98138427734375, 3.094512939453125, 3.2076416015625, 3.320770263671875, 3.43389892578125, 3.547027587890625, 3.66015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 13.0, 20.0, 23.0, 40.0, 37.0, 89.0, 94.0, 138.0, 217.0, 262.0, 430.0, 633.0, 918.0, 1274.0, 1943.0, 2818.0, 4227.0, 6324.0, 9746.0, 15060.0, 23082.0, 37067.0, 62539.0, 106881.0, 193049.0, 1288317.0, 136780.0, 78368.0, 46241.0, 27801.0, 18011.0, 11478.0, 7592.0, 5019.0, 3412.0, 2229.0, 1549.0, 1088.0, 739.0, 489.0, 318.0, 238.0, 154.0, 109.0, 74.0, 66.0, 46.0, 25.0, 23.0, 14.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7158203125, -0.6928863525390625, -0.669952392578125, -0.6470184326171875, -0.62408447265625, -0.6011505126953125, -0.578216552734375, -0.5552825927734375, -0.5323486328125, -0.5094146728515625, -0.486480712890625, -0.4635467529296875, -0.44061279296875, -0.4176788330078125, -0.394744873046875, -0.3718109130859375, -0.348876953125, -0.3259429931640625, -0.303009033203125, -0.2800750732421875, -0.25714111328125, -0.2342071533203125, -0.211273193359375, -0.1883392333984375, -0.1654052734375, -0.1424713134765625, -0.119537353515625, -0.0966033935546875, -0.07366943359375, -0.0507354736328125, -0.027801513671875, -0.0048675537109375, 0.01806640625, 0.0410003662109375, 0.063934326171875, 0.0868682861328125, 0.10980224609375, 0.1327362060546875, 0.155670166015625, 0.1786041259765625, 0.2015380859375, 0.2244720458984375, 0.247406005859375, 0.2703399658203125, 0.29327392578125, 0.3162078857421875, 0.339141845703125, 0.3620758056640625, 0.385009765625, 0.4079437255859375, 0.430877685546875, 0.4538116455078125, 0.47674560546875, 0.4996795654296875, 0.522613525390625, 0.5455474853515625, 0.5684814453125, 0.5914154052734375, 0.614349365234375, 0.6372833251953125, 0.66021728515625, 0.6831512451171875, 0.706085205078125, 0.7290191650390625, 0.751953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 4.0, 16.0, 7.0, 13.0, 16.0, 24.0, 29.0, 31.0, 52.0, 52.0, 68.0, 105.0, 112.0, 118.0, 67.0, 64.0, 42.0, 38.0, 25.0, 25.0, 18.0, 12.0, 6.0, 7.0, 4.0, 8.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.0013427734375, -0.0013061463832855225, -0.001269519329071045, -0.0012328922748565674, -0.0011962652206420898, -0.0011596381664276123, -0.0011230111122131348, -0.0010863840579986572, -0.0010497570037841797, -0.0010131299495697021, -0.0009765028953552246, -0.0009398758411407471, -0.0009032487869262695, -0.000866621732711792, -0.0008299946784973145, -0.0007933676242828369, -0.0007567405700683594, -0.0007201135158538818, -0.0006834864616394043, -0.0006468594074249268, -0.0006102323532104492, -0.0005736052989959717, -0.0005369782447814941, -0.0005003511905670166, -0.00046372413635253906, -0.0004270970821380615, -0.000390470027923584, -0.00035384297370910645, -0.0003172159194946289, -0.00028058886528015137, -0.00024396181106567383, -0.0002073347568511963, -0.00017070770263671875, -0.0001340806484222412, -9.745359420776367e-05, -6.082653999328613e-05, -2.4199485778808594e-05, 1.2427568435668945e-05, 4.9054622650146484e-05, 8.568167686462402e-05, 0.00012230873107910156, 0.0001589357852935791, 0.00019556283950805664, 0.00023218989372253418, 0.0002688169479370117, 0.00030544400215148926, 0.0003420710563659668, 0.00037869811058044434, 0.0004153251647949219, 0.0004519522190093994, 0.000488579273223877, 0.0005252063274383545, 0.000561833381652832, 0.0005984604358673096, 0.0006350874900817871, 0.0006717145442962646, 0.0007083415985107422, 0.0007449686527252197, 0.0007815957069396973, 0.0008182227611541748, 0.0008548498153686523, 0.0008914768695831299, 0.0009281039237976074, 0.000964730978012085, 0.0010013580322265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 7.0, 3.0, 10.0, 14.0, 13.0, 14.0, 37.0, 52.0, 95.0, 176.0, 500.0, 23088.0, 1023077.0, 883.0, 255.0, 100.0, 69.0, 42.0, 22.0, 22.0, 14.0, 10.0, 10.0, 7.0, 3.0, 5.0, 4.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0291900634765625, -0.02811598777770996, -0.027041912078857422, -0.025967836380004883, -0.024893760681152344, -0.023819684982299805, -0.022745609283447266, -0.021671533584594727, -0.020597457885742188, -0.01952338218688965, -0.01844930648803711, -0.01737523078918457, -0.01630115509033203, -0.015227079391479492, -0.014153003692626953, -0.013078927993774414, -0.012004852294921875, -0.010930776596069336, -0.009856700897216797, -0.008782625198364258, -0.007708549499511719, -0.00663447380065918, -0.005560398101806641, -0.0044863224029541016, -0.0034122467041015625, -0.0023381710052490234, -0.0012640953063964844, -0.0001900196075439453, 0.0008840560913085938, 0.001958131790161133, 0.003032207489013672, 0.004106283187866211, 0.00518035888671875, 0.006254434585571289, 0.007328510284423828, 0.008402585983276367, 0.009476661682128906, 0.010550737380981445, 0.011624813079833984, 0.012698888778686523, 0.013772964477539062, 0.014847040176391602, 0.01592111587524414, 0.01699519157409668, 0.01806926727294922, 0.019143342971801758, 0.020217418670654297, 0.021291494369506836, 0.022365570068359375, 0.023439645767211914, 0.024513721466064453, 0.025587797164916992, 0.02666187286376953, 0.02773594856262207, 0.02881002426147461, 0.02988409996032715, 0.030958175659179688, 0.03203225135803223, 0.033106327056884766, 0.034180402755737305, 0.035254478454589844, 0.03632855415344238, 0.03740262985229492, 0.03847670555114746, 0.03955078125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 20.0, 55.0, 95.0, 162.0, 176.0, 176.0, 127.0, 86.0, 51.0, 22.0, 21.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008678828598931432, -0.0008456880459561944, -0.0008234931738115847, -0.0008012983598746359, -0.0007791034877300262, -0.0007569086737930775, -0.0007347138598561287, -0.000712518987711519, -0.0006903241155669093, -0.0006681293016299605, -0.0006459344294853508, -0.0006237396155484021, -0.0006015447434037924, -0.0005793499294668436, -0.0005571551155298948, -0.0005349602433852851, -0.0005127654294483364, -0.0004905706155113876, -0.0004683757433667779, -0.0004461809294298291, -0.00042398605728521943, -0.00040179124334827065, -0.0003795964003074914, -0.0003574015572667122, -0.00033520671422593296, -0.0003130118711851537, -0.0002908170281443745, -0.00026862218510359526, -0.0002464273711666465, -0.00022423251357395202, -0.00020203768508508801, -0.00017984284204430878, -0.00015764799900352955, -0.00013545315596275032, -0.0001132583201979287, -9.106348443310708e-05, -6.886864139232785e-05, -4.667379835154861e-05, -2.4478969862684608e-05, -2.2841268219053745e-06, 1.991071621887386e-05, 4.2105555621674284e-05, 6.430039502447471e-05, 8.649523078929633e-05, 0.00010869007383007556, 0.0001308849168708548, 0.0001530797453597188, 0.00017527458840049803, 0.00019746943144127727, 0.0002196642744820565, 0.00024185911752283573, 0.0002640539314597845, 0.0002862488036043942, 0.000308443617541343, 0.0003306384605821222, 0.00035283330362290144, 0.00037502814666368067, 0.0003972229897044599, 0.00041941783274523914, 0.00044161267578601837, 0.00046380748972296715, 0.00048600236186757684, 0.0005081971758045256, 0.0005303920479491353, 0.0005525868618860841]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 14.0, 13.0, 10.0, 17.0, 16.0, 19.0, 18.0, 25.0, 34.0, 39.0, 34.0, 42.0, 44.0, 44.0, 40.0, 33.0, 42.0, 65.0, 49.0, 41.0, 37.0, 30.0, 42.0, 37.0, 35.0, 32.0, 20.0, 18.0, 20.0, 17.0, 12.0, 12.0, 8.0, 8.0, 8.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005816221237182617, -0.00056490208953619, -0.0005481820553541183, -0.0005314620211720467, -0.000514741986989975, -0.0004980219528079033, -0.0004813019186258316, -0.0004645818844437599, -0.00044786185026168823, -0.00043114181607961655, -0.00041442178189754486, -0.0003977017477154732, -0.0003809817135334015, -0.0003642616793513298, -0.0003475416451692581, -0.00033082161098718643, -0.00031410157680511475, -0.00029738154262304306, -0.0002806615084409714, -0.0002639414742588997, -0.000247221440076828, -0.00023050140589475632, -0.00021378137171268463, -0.00019706133753061295, -0.00018034130334854126, -0.00016362126916646957, -0.0001469012349843979, -0.0001301812008023262, -0.00011346116662025452, -9.674113243818283e-05, -8.002109825611115e-05, -6.330106407403946e-05, -4.6581029891967773e-05, -2.9860995709896088e-05, -1.3140961527824402e-05, 3.579072654247284e-06, 2.029910683631897e-05, 3.7019141018390656e-05, 5.373917520046234e-05, 7.045920938253403e-05, 8.717924356460571e-05, 0.0001038992777466774, 0.00012061931192874908, 0.00013733934611082077, 0.00015405938029289246, 0.00017077941447496414, 0.00018749944865703583, 0.0002042194828391075, 0.0002209395170211792, 0.00023765955120325089, 0.00025437958538532257, 0.00027109961956739426, 0.00028781965374946594, 0.00030453968793153763, 0.0003212597221136093, 0.000337979756295681, 0.0003546997904777527, 0.00037141982465982437, 0.00038813985884189606, 0.00040485989302396774, 0.00042157992720603943, 0.0004382999613881111, 0.0004550199955701828, 0.0004717400297522545, 0.0004884600639343262]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 10.0, 4.0, 12.0, 7.0, 6.0, 7.0, 16.0, 17.0, 16.0, 29.0, 18.0, 27.0, 26.0, 25.0, 31.0, 45.0, 41.0, 40.0, 45.0, 58.0, 49.0, 45.0, 42.0, 36.0, 34.0, 36.0, 24.0, 24.0, 31.0, 36.0, 24.0, 24.0, 10.0, 24.0, 12.0, 19.0, 12.0, 10.0, 11.0, 4.0, 5.0, 4.0, 4.0, 1.0, 3.0, 4.0], "bins": [-7.0390625, -6.856689453125, -6.67431640625, -6.491943359375, -6.3095703125, -6.127197265625, -5.94482421875, -5.762451171875, -5.580078125, -5.397705078125, -5.21533203125, -5.032958984375, -4.8505859375, -4.668212890625, -4.48583984375, -4.303466796875, -4.12109375, -3.938720703125, -3.75634765625, -3.573974609375, -3.3916015625, -3.209228515625, -3.02685546875, -2.844482421875, -2.662109375, -2.479736328125, -2.29736328125, -2.114990234375, -1.9326171875, -1.750244140625, -1.56787109375, -1.385498046875, -1.203125, -1.020751953125, -0.83837890625, -0.656005859375, -0.4736328125, -0.291259765625, -0.10888671875, 0.073486328125, 0.255859375, 0.438232421875, 0.62060546875, 0.802978515625, 0.9853515625, 1.167724609375, 1.35009765625, 1.532470703125, 1.71484375, 1.897216796875, 2.07958984375, 2.261962890625, 2.4443359375, 2.626708984375, 2.80908203125, 2.991455078125, 3.173828125, 3.356201171875, 3.53857421875, 3.720947265625, 3.9033203125, 4.085693359375, 4.26806640625, 4.450439453125, 4.6328125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 7.0, 11.0, 10.0, 15.0, 24.0, 41.0, 68.0, 124.0, 228.0, 366.0, 699.0, 1182.0, 2219.0, 3790.0, 7311.0, 14249.0, 31202.0, 77731.0, 220138.0, 416658.0, 162728.0, 59422.0, 24814.0, 11956.0, 6111.0, 3249.0, 1880.0, 1011.0, 535.0, 311.0, 193.0, 116.0, 60.0, 38.0, 25.0, 11.0, 11.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.53863525390625, -3.4093017578125, -3.27996826171875, -3.150634765625, -3.02130126953125, -2.8919677734375, -2.76263427734375, -2.63330078125, -2.50396728515625, -2.3746337890625, -2.24530029296875, -2.115966796875, -1.98663330078125, -1.8572998046875, -1.72796630859375, -1.5986328125, -1.46929931640625, -1.3399658203125, -1.21063232421875, -1.081298828125, -0.95196533203125, -0.8226318359375, -0.69329833984375, -0.56396484375, -0.43463134765625, -0.3052978515625, -0.17596435546875, -0.046630859375, 0.08270263671875, 0.2120361328125, 0.34136962890625, 0.470703125, 0.60003662109375, 0.7293701171875, 0.85870361328125, 0.988037109375, 1.11737060546875, 1.2467041015625, 1.37603759765625, 1.50537109375, 1.63470458984375, 1.7640380859375, 1.89337158203125, 2.022705078125, 2.15203857421875, 2.2813720703125, 2.41070556640625, 2.5400390625, 2.66937255859375, 2.7987060546875, 2.92803955078125, 3.057373046875, 3.18670654296875, 3.3160400390625, 3.44537353515625, 3.57470703125, 3.70404052734375, 3.8333740234375, 3.96270751953125, 4.092041015625, 4.22137451171875, 4.3507080078125, 4.48004150390625, 4.609375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 8.0, 13.0, 14.0, 14.0, 22.0, 17.0, 24.0, 29.0, 23.0, 33.0, 42.0, 43.0, 39.0, 66.0, 73.0, 193.0, 1641.0, 227.0, 87.0, 61.0, 39.0, 37.0, 35.0, 30.0, 37.0, 25.0, 20.0, 25.0, 19.0, 14.0, 9.0, 10.0, 15.0, 14.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-22.5625, -21.889892578125, -21.21728515625, -20.544677734375, -19.8720703125, -19.199462890625, -18.52685546875, -17.854248046875, -17.181640625, -16.509033203125, -15.83642578125, -15.163818359375, -14.4912109375, -13.818603515625, -13.14599609375, -12.473388671875, -11.80078125, -11.128173828125, -10.45556640625, -9.782958984375, -9.1103515625, -8.437744140625, -7.76513671875, -7.092529296875, -6.419921875, -5.747314453125, -5.07470703125, -4.402099609375, -3.7294921875, -3.056884765625, -2.38427734375, -1.711669921875, -1.0390625, -0.366455078125, 0.30615234375, 0.978759765625, 1.6513671875, 2.323974609375, 2.99658203125, 3.669189453125, 4.341796875, 5.014404296875, 5.68701171875, 6.359619140625, 7.0322265625, 7.704833984375, 8.37744140625, 9.050048828125, 9.72265625, 10.395263671875, 11.06787109375, 11.740478515625, 12.4130859375, 13.085693359375, 13.75830078125, 14.430908203125, 15.103515625, 15.776123046875, 16.44873046875, 17.121337890625, 17.7939453125, 18.466552734375, 19.13916015625, 19.811767578125, 20.484375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 7.0, 6.0, 8.0, 3.0, 9.0, 15.0, 17.0, 29.0, 20.0, 52.0, 48.0, 68.0, 98.0, 137.0, 178.0, 293.0, 498.0, 1485.0, 45745.0, 3082918.0, 11799.0, 949.0, 427.0, 274.0, 152.0, 109.0, 83.0, 57.0, 60.0, 37.0, 23.0, 21.0, 13.0, 15.0, 10.0, 8.0, 7.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.3125, -46.77197265625, -45.2314453125, -43.69091796875, -42.150390625, -40.60986328125, -39.0693359375, -37.52880859375, -35.98828125, -34.44775390625, -32.9072265625, -31.36669921875, -29.826171875, -28.28564453125, -26.7451171875, -25.20458984375, -23.6640625, -22.12353515625, -20.5830078125, -19.04248046875, -17.501953125, -15.96142578125, -14.4208984375, -12.88037109375, -11.33984375, -9.79931640625, -8.2587890625, -6.71826171875, -5.177734375, -3.63720703125, -2.0966796875, -0.55615234375, 0.984375, 2.52490234375, 4.0654296875, 5.60595703125, 7.146484375, 8.68701171875, 10.2275390625, 11.76806640625, 13.30859375, 14.84912109375, 16.3896484375, 17.93017578125, 19.470703125, 21.01123046875, 22.5517578125, 24.09228515625, 25.6328125, 27.17333984375, 28.7138671875, 30.25439453125, 31.794921875, 33.33544921875, 34.8759765625, 36.41650390625, 37.95703125, 39.49755859375, 41.0380859375, 42.57861328125, 44.119140625, 45.65966796875, 47.2001953125, 48.74072265625, 50.28125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 22.0, 50.0, 122.0, 231.0, 252.0, 195.0, 99.0, 27.0, 11.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-58.641719818115234, -57.11623764038086, -55.59075927734375, -54.065277099609375, -52.539798736572266, -51.01431655883789, -49.48883819580078, -47.963356018066406, -46.43787384033203, -44.912391662597656, -43.38691329956055, -41.86143112182617, -40.33595275878906, -38.81047058105469, -37.28498840332031, -35.7595100402832, -34.234031677246094, -32.70854949951172, -31.18307113647461, -29.657588958740234, -28.132110595703125, -26.60662841796875, -25.081148147583008, -23.555667877197266, -22.030187606811523, -20.50470733642578, -18.97922706604004, -17.453746795654297, -15.928265571594238, -14.402785301208496, -12.877304077148438, -11.351823806762695, -9.826339721679688, -8.300859451293945, -6.775378704071045, -5.2498979568481445, -3.7244176864624023, -2.19893741607666, -0.6734561920166016, 0.8520240783691406, 2.377504348754883, 3.902984857559204, 5.428465366363525, 6.953946113586426, 8.479426383972168, 10.00490665435791, 11.530387878417969, 13.055868148803711, 14.581348419189453, 16.106828689575195, 17.632308959960938, 19.157791137695312, 20.683269500732422, 22.208751678466797, 23.73423194885254, 25.25971221923828, 26.785192489624023, 28.310672760009766, 29.836153030395508, 31.36163330078125, 32.887115478515625, 34.412593841552734, 35.93807601928711, 37.46355438232422, 38.989036560058594]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 13.0, 7.0, 20.0, 20.0, 25.0, 35.0, 25.0, 25.0, 32.0, 32.0, 46.0, 39.0, 39.0, 47.0, 39.0, 50.0, 45.0, 42.0, 52.0, 56.0, 37.0, 43.0, 30.0, 27.0, 33.0, 22.0, 16.0, 21.0, 16.0, 22.0, 15.0, 3.0, 8.0, 6.0, 5.0, 1.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-79.73925018310547, -77.4762954711914, -75.21334075927734, -72.95039367675781, -70.68743896484375, -68.42448425292969, -66.16152954101562, -63.89857864379883, -61.63562774658203, -59.37267303466797, -57.10972213745117, -54.84676742553711, -52.58381652832031, -50.32086181640625, -48.05790710449219, -45.79495620727539, -43.53200149536133, -41.269046783447266, -39.00609588623047, -36.743141174316406, -34.48019027709961, -32.21723556518555, -29.954282760620117, -27.691329956054688, -25.428377151489258, -23.165424346923828, -20.9024715423584, -18.63951873779297, -16.376564025878906, -14.113612174987793, -11.850658416748047, -9.587705612182617, -7.3247528076171875, -5.061800003051758, -2.79884672164917, -0.535893440246582, 1.7270593643188477, 3.9900121688842773, 6.252965927124023, 8.515918731689453, 10.778871536254883, 13.041824340820312, 15.304777145385742, 17.567729949951172, 19.830684661865234, 22.09363555908203, 24.356590270996094, 26.619543075561523, 28.882495880126953, 31.145448684692383, 33.40840148925781, 35.671356201171875, 37.93430709838867, 40.197261810302734, 42.46021270751953, 44.723167419433594, 46.986122131347656, 49.24907684326172, 51.512027740478516, 53.77498245239258, 56.037933349609375, 58.30088806152344, 60.5638427734375, 62.8267936706543, 65.0897445678711]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 7.0, 3.0, 5.0, 14.0, 12.0, 5.0, 14.0, 24.0, 31.0, 21.0, 19.0, 20.0, 30.0, 37.0, 32.0, 46.0, 40.0, 60.0, 43.0, 43.0, 49.0, 42.0, 43.0, 36.0, 24.0, 25.0, 35.0, 28.0, 37.0, 27.0, 21.0, 19.0, 18.0, 20.0, 14.0, 9.0, 7.0, 12.0, 8.0, 4.0, 3.0, 4.0, 5.0, 4.0], "bins": [-7.7578125, -7.56280517578125, -7.3677978515625, -7.17279052734375, -6.977783203125, -6.78277587890625, -6.5877685546875, -6.39276123046875, -6.19775390625, -6.00274658203125, -5.8077392578125, -5.61273193359375, -5.417724609375, -5.22271728515625, -5.0277099609375, -4.83270263671875, -4.6376953125, -4.44268798828125, -4.2476806640625, -4.05267333984375, -3.857666015625, -3.66265869140625, -3.4676513671875, -3.27264404296875, -3.07763671875, -2.88262939453125, -2.6876220703125, -2.49261474609375, -2.297607421875, -2.10260009765625, -1.9075927734375, -1.71258544921875, -1.517578125, -1.32257080078125, -1.1275634765625, -0.93255615234375, -0.737548828125, -0.54254150390625, -0.3475341796875, -0.15252685546875, 0.04248046875, 0.23748779296875, 0.4324951171875, 0.62750244140625, 0.822509765625, 1.01751708984375, 1.2125244140625, 1.40753173828125, 1.6025390625, 1.79754638671875, 1.9925537109375, 2.18756103515625, 2.382568359375, 2.57757568359375, 2.7725830078125, 2.96759033203125, 3.16259765625, 3.35760498046875, 3.5526123046875, 3.74761962890625, 3.942626953125, 4.13763427734375, 4.3326416015625, 4.52764892578125, 4.72265625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 5.0, 9.0, 8.0, 20.0, 26.0, 33.0, 49.0, 74.0, 105.0, 153.0, 278.0, 526.0, 953.0, 2483.0, 8552.0, 39585.0, 275739.0, 1456254.0, 1869121.0, 456846.0, 65372.0, 12275.0, 3235.0, 1220.0, 533.0, 272.0, 194.0, 106.0, 78.0, 55.0, 38.0, 35.0, 10.0, 15.0, 7.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.265625, -10.9449462890625, -10.624267578125, -10.3035888671875, -9.98291015625, -9.6622314453125, -9.341552734375, -9.0208740234375, -8.7001953125, -8.3795166015625, -8.058837890625, -7.7381591796875, -7.41748046875, -7.0968017578125, -6.776123046875, -6.4554443359375, -6.134765625, -5.8140869140625, -5.493408203125, -5.1727294921875, -4.85205078125, -4.5313720703125, -4.210693359375, -3.8900146484375, -3.5693359375, -3.2486572265625, -2.927978515625, -2.6072998046875, -2.28662109375, -1.9659423828125, -1.645263671875, -1.3245849609375, -1.00390625, -0.6832275390625, -0.362548828125, -0.0418701171875, 0.27880859375, 0.5994873046875, 0.920166015625, 1.2408447265625, 1.5615234375, 1.8822021484375, 2.202880859375, 2.5235595703125, 2.84423828125, 3.1649169921875, 3.485595703125, 3.8062744140625, 4.126953125, 4.4476318359375, 4.768310546875, 5.0889892578125, 5.40966796875, 5.7303466796875, 6.051025390625, 6.3717041015625, 6.6923828125, 7.0130615234375, 7.333740234375, 7.6544189453125, 7.97509765625, 8.2957763671875, 8.616455078125, 8.9371337890625, 9.2578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 9.0, 15.0, 12.0, 24.0, 23.0, 33.0, 39.0, 46.0, 68.0, 77.0, 105.0, 142.0, 181.0, 232.0, 289.0, 347.0, 393.0, 384.0, 299.0, 277.0, 238.0, 182.0, 143.0, 102.0, 84.0, 80.0, 46.0, 49.0, 26.0, 25.0, 30.0, 16.0, 10.0, 9.0, 5.0, 4.0, 5.0, 7.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7265625, -9.35302734375, -8.9794921875, -8.60595703125, -8.232421875, -7.85888671875, -7.4853515625, -7.11181640625, -6.73828125, -6.36474609375, -5.9912109375, -5.61767578125, -5.244140625, -4.87060546875, -4.4970703125, -4.12353515625, -3.75, -3.37646484375, -3.0029296875, -2.62939453125, -2.255859375, -1.88232421875, -1.5087890625, -1.13525390625, -0.76171875, -0.38818359375, -0.0146484375, 0.35888671875, 0.732421875, 1.10595703125, 1.4794921875, 1.85302734375, 2.2265625, 2.60009765625, 2.9736328125, 3.34716796875, 3.720703125, 4.09423828125, 4.4677734375, 4.84130859375, 5.21484375, 5.58837890625, 5.9619140625, 6.33544921875, 6.708984375, 7.08251953125, 7.4560546875, 7.82958984375, 8.203125, 8.57666015625, 8.9501953125, 9.32373046875, 9.697265625, 10.07080078125, 10.4443359375, 10.81787109375, 11.19140625, 11.56494140625, 11.9384765625, 12.31201171875, 12.685546875, 13.05908203125, 13.4326171875, 13.80615234375, 14.1796875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 10.0, 13.0, 15.0, 19.0, 25.0, 24.0, 29.0, 35.0, 38.0, 58.0, 77.0, 94.0, 146.0, 207.0, 302.0, 579.0, 2413.0, 405571.0, 3769302.0, 13182.0, 891.0, 362.0, 230.0, 192.0, 92.0, 87.0, 67.0, 42.0, 31.0, 37.0, 15.0, 17.0, 16.0, 9.0, 6.0, 11.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.84375, -56.04833984375, -54.2529296875, -52.45751953125, -50.662109375, -48.86669921875, -47.0712890625, -45.27587890625, -43.48046875, -41.68505859375, -39.8896484375, -38.09423828125, -36.298828125, -34.50341796875, -32.7080078125, -30.91259765625, -29.1171875, -27.32177734375, -25.5263671875, -23.73095703125, -21.935546875, -20.14013671875, -18.3447265625, -16.54931640625, -14.75390625, -12.95849609375, -11.1630859375, -9.36767578125, -7.572265625, -5.77685546875, -3.9814453125, -2.18603515625, -0.390625, 1.40478515625, 3.2001953125, 4.99560546875, 6.791015625, 8.58642578125, 10.3818359375, 12.17724609375, 13.97265625, 15.76806640625, 17.5634765625, 19.35888671875, 21.154296875, 22.94970703125, 24.7451171875, 26.54052734375, 28.3359375, 30.13134765625, 31.9267578125, 33.72216796875, 35.517578125, 37.31298828125, 39.1083984375, 40.90380859375, 42.69921875, 44.49462890625, 46.2900390625, 48.08544921875, 49.880859375, 51.67626953125, 53.4716796875, 55.26708984375, 57.0625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 22.0, 66.0, 125.0, 210.0, 271.0, 185.0, 99.0, 25.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.55597686767578, -96.572998046875, -92.59001159667969, -88.6070327758789, -84.62405395507812, -80.64106750488281, -76.65808868408203, -72.67510986328125, -68.69212341308594, -64.70914459228516, -60.726158142089844, -56.74317932128906, -52.760196685791016, -48.77721405029297, -44.79423522949219, -40.81125259399414, -36.828269958496094, -32.84528732299805, -28.862306594848633, -24.87932586669922, -20.896343231201172, -16.913360595703125, -12.930379867553711, -8.947399139404297, -4.96441650390625, -0.9814348220825195, 3.001546859741211, 6.984528541564941, 10.967510223388672, 14.950492858886719, 18.933473587036133, 22.916454315185547, 26.899444580078125, 30.882427215576172, 34.86540985107422, 38.848388671875, 42.83137130737305, 46.814353942871094, 50.797332763671875, 54.78031539916992, 58.76329803466797, 62.746280670166016, 66.72926330566406, 70.71224212646484, 74.69522094726562, 78.67820739746094, 82.66118621826172, 86.6441650390625, 90.62715148925781, 94.6101303100586, 98.5931167602539, 102.57609558105469, 106.55908203125, 110.54206085205078, 114.52503967285156, 118.50802612304688, 122.49100494384766, 126.47398376464844, 130.45697021484375, 134.43995666503906, 138.4229278564453, 142.40591430664062, 146.38890075683594, 150.3718719482422, 154.3548583984375]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 13.0, 7.0, 9.0, 5.0, 11.0, 16.0, 17.0, 16.0, 25.0, 17.0, 25.0, 30.0, 28.0, 28.0, 42.0, 46.0, 45.0, 43.0, 46.0, 40.0, 33.0, 42.0, 28.0, 31.0, 37.0, 36.0, 35.0, 31.0, 27.0, 28.0, 24.0, 18.0, 20.0, 18.0, 13.0, 12.0, 17.0, 16.0, 3.0, 4.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.52293395996094, -40.13435745239258, -38.74578094482422, -37.35720443725586, -35.9686279296875, -34.580047607421875, -33.191471099853516, -31.802894592285156, -30.414318084716797, -29.025741577148438, -27.637165069580078, -26.248586654663086, -24.860010147094727, -23.471433639526367, -22.082855224609375, -20.694278717041016, -19.305702209472656, -17.917125701904297, -16.528549194335938, -15.139970779418945, -13.751394271850586, -12.362817764282227, -10.97424030303955, -9.585662841796875, -8.197086334228516, -6.808509349822998, -5.4199323654174805, -4.031355381011963, -2.6427783966064453, -1.2542014122009277, 0.13437557220458984, 1.5229530334472656, 2.911529541015625, 4.300106525421143, 5.68868350982666, 7.077260494232178, 8.465837478637695, 9.854413986206055, 11.24299144744873, 12.631568908691406, 14.020145416259766, 15.408721923828125, 16.797298431396484, 18.185876846313477, 19.574453353881836, 20.963029861450195, 22.351608276367188, 23.740184783935547, 25.128761291503906, 26.517337799072266, 27.905914306640625, 29.294492721557617, 30.683069229125977, 32.07164764404297, 33.46022415161133, 34.84880065917969, 36.23737716674805, 37.625953674316406, 39.014530181884766, 40.403106689453125, 41.79168701171875, 43.18026351928711, 44.56884002685547, 45.95741653442383, 47.34599304199219]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 12.0, 13.0, 14.0, 18.0, 18.0, 29.0, 18.0, 29.0, 26.0, 33.0, 30.0, 35.0, 41.0, 44.0, 40.0, 35.0, 36.0, 40.0, 36.0, 39.0, 36.0, 44.0, 29.0, 35.0, 20.0, 37.0, 22.0, 24.0, 16.0, 14.0, 19.0, 14.0, 13.0, 12.0, 12.0, 7.0, 9.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.17578125, -5.99407958984375, -5.8123779296875, -5.63067626953125, -5.448974609375, -5.26727294921875, -5.0855712890625, -4.90386962890625, -4.72216796875, -4.54046630859375, -4.3587646484375, -4.17706298828125, -3.995361328125, -3.81365966796875, -3.6319580078125, -3.45025634765625, -3.2685546875, -3.08685302734375, -2.9051513671875, -2.72344970703125, -2.541748046875, -2.36004638671875, -2.1783447265625, -1.99664306640625, -1.81494140625, -1.63323974609375, -1.4515380859375, -1.26983642578125, -1.088134765625, -0.90643310546875, -0.7247314453125, -0.54302978515625, -0.361328125, -0.17962646484375, 0.0020751953125, 0.18377685546875, 0.365478515625, 0.54718017578125, 0.7288818359375, 0.91058349609375, 1.09228515625, 1.27398681640625, 1.4556884765625, 1.63739013671875, 1.819091796875, 2.00079345703125, 2.1824951171875, 2.36419677734375, 2.5458984375, 2.72760009765625, 2.9093017578125, 3.09100341796875, 3.272705078125, 3.45440673828125, 3.6361083984375, 3.81781005859375, 3.99951171875, 4.18121337890625, 4.3629150390625, 4.54461669921875, 4.726318359375, 4.90802001953125, 5.0897216796875, 5.27142333984375, 5.453125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 11.0, 24.0, 32.0, 48.0, 63.0, 105.0, 164.0, 217.0, 356.0, 501.0, 783.0, 1178.0, 1784.0, 2688.0, 4000.0, 6227.0, 9732.0, 15030.0, 24186.0, 39518.0, 66715.0, 115504.0, 205817.0, 231272.0, 129682.0, 74950.0, 44134.0, 26703.0, 16466.0, 10595.0, 6885.0, 4466.0, 2915.0, 2003.0, 1303.0, 851.0, 532.0, 366.0, 240.0, 186.0, 102.0, 71.0, 47.0, 28.0, 19.0, 14.0, 12.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.83447265625, -0.8067550659179688, -0.7790374755859375, -0.7513198852539062, -0.723602294921875, -0.6958847045898438, -0.6681671142578125, -0.6404495239257812, -0.61273193359375, -0.5850143432617188, -0.5572967529296875, -0.5295791625976562, -0.501861572265625, -0.47414398193359375, -0.4464263916015625, -0.41870880126953125, -0.3909912109375, -0.36327362060546875, -0.3355560302734375, -0.30783843994140625, -0.280120849609375, -0.25240325927734375, -0.2246856689453125, -0.19696807861328125, -0.16925048828125, -0.14153289794921875, -0.1138153076171875, -0.08609771728515625, -0.058380126953125, -0.03066253662109375, -0.0029449462890625, 0.02477264404296875, 0.052490234375, 0.08020782470703125, 0.1079254150390625, 0.13564300537109375, 0.163360595703125, 0.19107818603515625, 0.2187957763671875, 0.24651336669921875, 0.27423095703125, 0.30194854736328125, 0.3296661376953125, 0.35738372802734375, 0.385101318359375, 0.41281890869140625, 0.4405364990234375, 0.46825408935546875, 0.4959716796875, 0.5236892700195312, 0.5514068603515625, 0.5791244506835938, 0.606842041015625, 0.6345596313476562, 0.6622772216796875, 0.6899948120117188, 0.71771240234375, 0.7454299926757812, 0.7731475830078125, 0.8008651733398438, 0.828582763671875, 0.8563003540039062, 0.8840179443359375, 0.9117355346679688, 0.939453125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 7.0, 14.0, 16.0, 11.0, 16.0, 14.0, 15.0, 18.0, 31.0, 29.0, 34.0, 21.0, 46.0, 39.0, 38.0, 39.0, 57.0, 38.0, 1064.0, 40.0, 50.0, 33.0, 53.0, 40.0, 39.0, 40.0, 27.0, 26.0, 24.0, 19.0, 17.0, 9.0, 14.0, 7.0, 8.0, 5.0, 4.0, 0.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.806640625, -3.676483154296875, -3.54632568359375, -3.416168212890625, -3.2860107421875, -3.155853271484375, -3.02569580078125, -2.895538330078125, -2.765380859375, -2.635223388671875, -2.50506591796875, -2.374908447265625, -2.2447509765625, -2.114593505859375, -1.98443603515625, -1.854278564453125, -1.72412109375, -1.593963623046875, -1.46380615234375, -1.333648681640625, -1.2034912109375, -1.073333740234375, -0.94317626953125, -0.813018798828125, -0.682861328125, -0.552703857421875, -0.42254638671875, -0.292388916015625, -0.1622314453125, -0.032073974609375, 0.09808349609375, 0.228240966796875, 0.3583984375, 0.488555908203125, 0.61871337890625, 0.748870849609375, 0.8790283203125, 1.009185791015625, 1.13934326171875, 1.269500732421875, 1.399658203125, 1.529815673828125, 1.65997314453125, 1.790130615234375, 1.9202880859375, 2.050445556640625, 2.18060302734375, 2.310760498046875, 2.44091796875, 2.571075439453125, 2.70123291015625, 2.831390380859375, 2.9615478515625, 3.091705322265625, 3.22186279296875, 3.352020263671875, 3.482177734375, 3.612335205078125, 3.74249267578125, 3.872650146484375, 4.0028076171875, 4.132965087890625, 4.26312255859375, 4.393280029296875, 4.5234375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 6.0, 6.0, 7.0, 19.0, 26.0, 26.0, 37.0, 48.0, 95.0, 126.0, 163.0, 243.0, 335.0, 483.0, 754.0, 1000.0, 1547.0, 2269.0, 3523.0, 5461.0, 8243.0, 12678.0, 20385.0, 33920.0, 58787.0, 104773.0, 197529.0, 1309301.0, 141433.0, 78018.0, 44250.0, 26017.0, 16004.0, 10241.0, 6484.0, 4248.0, 2774.0, 1857.0, 1209.0, 820.0, 634.0, 426.0, 265.0, 180.0, 159.0, 95.0, 63.0, 47.0, 35.0, 24.0, 21.0, 19.0, 9.0, 7.0, 5.0, 1.0, 4.0, 3.0], "bins": [-0.9052734375, -0.8780441284179688, -0.8508148193359375, -0.8235855102539062, -0.796356201171875, -0.7691268920898438, -0.7418975830078125, -0.7146682739257812, -0.68743896484375, -0.6602096557617188, -0.6329803466796875, -0.6057510375976562, -0.578521728515625, -0.5512924194335938, -0.5240631103515625, -0.49683380126953125, -0.4696044921875, -0.44237518310546875, -0.4151458740234375, -0.38791656494140625, -0.360687255859375, -0.33345794677734375, -0.3062286376953125, -0.27899932861328125, -0.25177001953125, -0.22454071044921875, -0.1973114013671875, -0.17008209228515625, -0.142852783203125, -0.11562347412109375, -0.0883941650390625, -0.06116485595703125, -0.033935546875, -0.00670623779296875, 0.0205230712890625, 0.04775238037109375, 0.074981689453125, 0.10221099853515625, 0.1294403076171875, 0.15666961669921875, 0.18389892578125, 0.21112823486328125, 0.2383575439453125, 0.26558685302734375, 0.292816162109375, 0.32004547119140625, 0.3472747802734375, 0.37450408935546875, 0.4017333984375, 0.42896270751953125, 0.4561920166015625, 0.48342132568359375, 0.510650634765625, 0.5378799438476562, 0.5651092529296875, 0.5923385620117188, 0.61956787109375, 0.6467971801757812, 0.6740264892578125, 0.7012557983398438, 0.728485107421875, 0.7557144165039062, 0.7829437255859375, 0.8101730346679688, 0.83740234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 9.0, 12.0, 16.0, 14.0, 24.0, 26.0, 36.0, 41.0, 56.0, 68.0, 103.0, 109.0, 108.0, 79.0, 47.0, 55.0, 55.0, 33.0, 23.0, 18.0, 17.0, 8.0, 6.0, 2.0, 10.0, 2.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0013427734375, -0.001298859715461731, -0.001254945993423462, -0.0012110322713851929, -0.0011671185493469238, -0.0011232048273086548, -0.0010792911052703857, -0.0010353773832321167, -0.0009914636611938477, -0.0009475499391555786, -0.0009036362171173096, -0.0008597224950790405, -0.0008158087730407715, -0.0007718950510025024, -0.0007279813289642334, -0.0006840676069259644, -0.0006401538848876953, -0.0005962401628494263, -0.0005523264408111572, -0.0005084127187728882, -0.00046449899673461914, -0.0004205852746963501, -0.00037667155265808105, -0.000332757830619812, -0.00028884410858154297, -0.0002449303865432739, -0.00020101666450500488, -0.00015710294246673584, -0.0001131892204284668, -6.927549839019775e-05, -2.536177635192871e-05, 1.8551945686340332e-05, 6.246566772460938e-05, 0.00010637938976287842, 0.00015029311180114746, 0.0001942068338394165, 0.00023812055587768555, 0.0002820342779159546, 0.00032594799995422363, 0.0003698617219924927, 0.0004137754440307617, 0.00045768916606903076, 0.0005016028881072998, 0.0005455166101455688, 0.0005894303321838379, 0.0006333440542221069, 0.000677257776260376, 0.000721171498298645, 0.0007650852203369141, 0.0008089989423751831, 0.0008529126644134521, 0.0008968263864517212, 0.0009407401084899902, 0.0009846538305282593, 0.0010285675525665283, 0.0010724812746047974, 0.0011163949966430664, 0.0011603087186813354, 0.0012042224407196045, 0.0012481361627578735, 0.0012920498847961426, 0.0013359636068344116, 0.0013798773288726807, 0.0014237910509109497, 0.0014677047729492188]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 19.0, 22.0, 31.0, 45.0, 88.0, 163.0, 425.0, 3265.0, 1042465.0, 1338.0, 333.0, 125.0, 67.0, 43.0, 31.0, 13.0, 17.0, 7.0, 6.0, 7.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0401611328125, -0.038958072662353516, -0.03775501251220703, -0.03655195236206055, -0.03534889221191406, -0.03414583206176758, -0.032942771911621094, -0.03173971176147461, -0.030536651611328125, -0.02933359146118164, -0.028130531311035156, -0.026927471160888672, -0.025724411010742188, -0.024521350860595703, -0.02331829071044922, -0.022115230560302734, -0.02091217041015625, -0.019709110260009766, -0.01850605010986328, -0.017302989959716797, -0.016099929809570312, -0.014896869659423828, -0.013693809509277344, -0.01249074935913086, -0.011287689208984375, -0.01008462905883789, -0.008881568908691406, -0.007678508758544922, -0.0064754486083984375, -0.005272388458251953, -0.004069328308105469, -0.0028662681579589844, -0.0016632080078125, -0.0004601478576660156, 0.0007429122924804688, 0.0019459724426269531, 0.0031490325927734375, 0.004352092742919922, 0.005555152893066406, 0.006758213043212891, 0.007961273193359375, 0.00916433334350586, 0.010367393493652344, 0.011570453643798828, 0.012773513793945312, 0.013976573944091797, 0.015179634094238281, 0.016382694244384766, 0.01758575439453125, 0.018788814544677734, 0.01999187469482422, 0.021194934844970703, 0.022397994995117188, 0.023601055145263672, 0.024804115295410156, 0.02600717544555664, 0.027210235595703125, 0.02841329574584961, 0.029616355895996094, 0.030819416046142578, 0.03202247619628906, 0.03322553634643555, 0.03442859649658203, 0.035631656646728516, 0.036834716796875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 53.0, 301.0, 459.0, 169.0, 26.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0037578889168798923, -0.003685995936393738, -0.0036141027230769396, -0.003542209742590785, -0.003470316529273987, -0.0033984235487878323, -0.0033265305683016777, -0.003254637587815523, -0.003182744374498725, -0.0031108513940125704, -0.003038958180695772, -0.0029670652002096176, -0.002895172219723463, -0.002823279006406665, -0.0027513860259205103, -0.002679492812603712, -0.0026075998321175575, -0.002535706851631403, -0.0024638136383146048, -0.00239192065782845, -0.002320027444511652, -0.0022481344640254974, -0.002176241483539343, -0.0021043485030531883, -0.00203245528973639, -0.0019605623092502356, -0.0018886690959334373, -0.0018167761154472828, -0.0017448830185458064, -0.00167298992164433, -0.0016010969411581755, -0.001529203844256699, -0.001457310514524579, -0.0013854174176231027, -0.0013135243207216263, -0.0012416313402354717, -0.0011697382433339953, -0.001097845146432519, -0.0010259521659463644, -0.000954059069044888, -0.0008821659721434116, -0.0008102728752419353, -0.0007383798365481198, -0.0006664867978543043, -0.0005945937009528279, -0.0005227006040513515, -0.0004508075653575361, -0.0003789145266637206, -0.0003070214297622442, -0.0002351283619645983, -0.00016323529416695237, -9.134222636930645e-05, -1.944915857166052e-05, 5.244390922598541e-05, 0.00012433697702363133, 0.0001962300157174468, 0.0002681231126189232, 0.0003400161804165691, 0.00041190924821421504, 0.00048380231601186097, 0.0005556953838095069, 0.0006275884807109833, 0.0006994815194047987, 0.0007713745580986142, 0.0008432676550000906]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 6.0, 5.0, 9.0, 7.0, 5.0, 9.0, 15.0, 13.0, 17.0, 26.0, 28.0, 32.0, 26.0, 35.0, 38.0, 35.0, 47.0, 44.0, 49.0, 38.0, 34.0, 48.0, 42.0, 46.0, 40.0, 35.0, 32.0, 35.0, 23.0, 24.0, 23.0, 21.0, 11.0, 18.0, 11.0, 10.0, 15.0, 10.0, 9.0, 5.0, 8.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005971789360046387, -0.0005796132609248161, -0.0005620475858449936, -0.000544481910765171, -0.0005269162356853485, -0.000509350560605526, -0.0004917848855257034, -0.0004742192104458809, -0.00045665353536605835, -0.0004390878602862358, -0.00042152218520641327, -0.00040395651012659073, -0.0003863908350467682, -0.00036882515996694565, -0.0003512594848871231, -0.00033369380980730057, -0.00031612813472747803, -0.0002985624596476555, -0.00028099678456783295, -0.0002634311094880104, -0.00024586543440818787, -0.00022829975932836533, -0.00021073408424854279, -0.00019316840916872025, -0.0001756027340888977, -0.00015803705900907516, -0.00014047138392925262, -0.00012290570884943008, -0.00010534003376960754, -8.7774358689785e-05, -7.020868360996246e-05, -5.264300853013992e-05, -3.507733345031738e-05, -1.7511658370494843e-05, 5.4016709327697754e-08, 1.7619691789150238e-05, 3.518536686897278e-05, 5.275104194879532e-05, 7.031671702861786e-05, 8.78823921084404e-05, 0.00010544806718826294, 0.00012301374226808548, 0.00014057941734790802, 0.00015814509242773056, 0.0001757107675075531, 0.00019327644258737564, 0.00021084211766719818, 0.00022840779274702072, 0.00024597346782684326, 0.0002635391429066658, 0.00028110481798648834, 0.0002986704930663109, 0.0003162361681461334, 0.00033380184322595596, 0.0003513675183057785, 0.00036893319338560104, 0.0003864988684654236, 0.0004040645435452461, 0.00042163021862506866, 0.0004391958937048912, 0.00045676156878471375, 0.0004743272438645363, 0.0004918929189443588, 0.0005094585940241814, 0.0005270242691040039]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 12.0, 13.0, 14.0, 18.0, 18.0, 29.0, 18.0, 29.0, 26.0, 33.0, 30.0, 35.0, 41.0, 44.0, 40.0, 35.0, 36.0, 40.0, 36.0, 39.0, 36.0, 44.0, 29.0, 35.0, 20.0, 37.0, 22.0, 24.0, 16.0, 14.0, 19.0, 14.0, 13.0, 12.0, 12.0, 7.0, 9.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.17578125, -5.99407958984375, -5.8123779296875, -5.63067626953125, -5.448974609375, -5.26727294921875, -5.0855712890625, -4.90386962890625, -4.72216796875, -4.54046630859375, -4.3587646484375, -4.17706298828125, -3.995361328125, -3.81365966796875, -3.6319580078125, -3.45025634765625, -3.2685546875, -3.08685302734375, -2.9051513671875, -2.72344970703125, -2.541748046875, -2.36004638671875, -2.1783447265625, -1.99664306640625, -1.81494140625, -1.63323974609375, -1.4515380859375, -1.26983642578125, -1.088134765625, -0.90643310546875, -0.7247314453125, -0.54302978515625, -0.361328125, -0.17962646484375, 0.0020751953125, 0.18377685546875, 0.365478515625, 0.54718017578125, 0.7288818359375, 0.91058349609375, 1.09228515625, 1.27398681640625, 1.4556884765625, 1.63739013671875, 1.819091796875, 2.00079345703125, 2.1824951171875, 2.36419677734375, 2.5458984375, 2.72760009765625, 2.9093017578125, 3.09100341796875, 3.272705078125, 3.45440673828125, 3.6361083984375, 3.81781005859375, 3.99951171875, 4.18121337890625, 4.3629150390625, 4.54461669921875, 4.726318359375, 4.90802001953125, 5.0897216796875, 5.27142333984375, 5.453125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 8.0, 13.0, 17.0, 28.0, 40.0, 55.0, 83.0, 160.0, 309.0, 523.0, 953.0, 1900.0, 4264.0, 10268.0, 25579.0, 68194.0, 204002.0, 430289.0, 194295.0, 65049.0, 24560.0, 9811.0, 4150.0, 1934.0, 901.0, 486.0, 264.0, 151.0, 91.0, 69.0, 41.0, 26.0, 18.0, 7.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -6.001708984375, -5.82763671875, -5.653564453125, -5.4794921875, -5.305419921875, -5.13134765625, -4.957275390625, -4.783203125, -4.609130859375, -4.43505859375, -4.260986328125, -4.0869140625, -3.912841796875, -3.73876953125, -3.564697265625, -3.390625, -3.216552734375, -3.04248046875, -2.868408203125, -2.6943359375, -2.520263671875, -2.34619140625, -2.172119140625, -1.998046875, -1.823974609375, -1.64990234375, -1.475830078125, -1.3017578125, -1.127685546875, -0.95361328125, -0.779541015625, -0.60546875, -0.431396484375, -0.25732421875, -0.083251953125, 0.0908203125, 0.264892578125, 0.43896484375, 0.613037109375, 0.787109375, 0.961181640625, 1.13525390625, 1.309326171875, 1.4833984375, 1.657470703125, 1.83154296875, 2.005615234375, 2.1796875, 2.353759765625, 2.52783203125, 2.701904296875, 2.8759765625, 3.050048828125, 3.22412109375, 3.398193359375, 3.572265625, 3.746337890625, 3.92041015625, 4.094482421875, 4.2685546875, 4.442626953125, 4.61669921875, 4.790771484375, 4.96484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 10.0, 9.0, 10.0, 10.0, 11.0, 15.0, 26.0, 26.0, 29.0, 39.0, 37.0, 44.0, 46.0, 77.0, 74.0, 205.0, 1772.0, 167.0, 64.0, 55.0, 53.0, 42.0, 40.0, 46.0, 40.0, 15.0, 15.0, 15.0, 8.0, 11.0, 16.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.3125, -27.381591796875, -26.45068359375, -25.519775390625, -24.5888671875, -23.657958984375, -22.72705078125, -21.796142578125, -20.865234375, -19.934326171875, -19.00341796875, -18.072509765625, -17.1416015625, -16.210693359375, -15.27978515625, -14.348876953125, -13.41796875, -12.487060546875, -11.55615234375, -10.625244140625, -9.6943359375, -8.763427734375, -7.83251953125, -6.901611328125, -5.970703125, -5.039794921875, -4.10888671875, -3.177978515625, -2.2470703125, -1.316162109375, -0.38525390625, 0.545654296875, 1.4765625, 2.407470703125, 3.33837890625, 4.269287109375, 5.2001953125, 6.131103515625, 7.06201171875, 7.992919921875, 8.923828125, 9.854736328125, 10.78564453125, 11.716552734375, 12.6474609375, 13.578369140625, 14.50927734375, 15.440185546875, 16.37109375, 17.302001953125, 18.23291015625, 19.163818359375, 20.0947265625, 21.025634765625, 21.95654296875, 22.887451171875, 23.818359375, 24.749267578125, 25.68017578125, 26.611083984375, 27.5419921875, 28.472900390625, 29.40380859375, 30.334716796875, 31.265625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 12.0, 11.0, 16.0, 17.0, 21.0, 19.0, 22.0, 42.0, 79.0, 108.0, 129.0, 179.0, 253.0, 489.0, 1700.0, 155754.0, 2981465.0, 3668.0, 623.0, 311.0, 220.0, 146.0, 100.0, 85.0, 50.0, 45.0, 27.0, 20.0, 17.0, 17.0, 11.0, 13.0, 8.0, 4.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.8125, -66.7373046875, -64.662109375, -62.5869140625, -60.51171875, -58.4365234375, -56.361328125, -54.2861328125, -52.2109375, -50.1357421875, -48.060546875, -45.9853515625, -43.91015625, -41.8349609375, -39.759765625, -37.6845703125, -35.609375, -33.5341796875, -31.458984375, -29.3837890625, -27.30859375, -25.2333984375, -23.158203125, -21.0830078125, -19.0078125, -16.9326171875, -14.857421875, -12.7822265625, -10.70703125, -8.6318359375, -6.556640625, -4.4814453125, -2.40625, -0.3310546875, 1.744140625, 3.8193359375, 5.89453125, 7.9697265625, 10.044921875, 12.1201171875, 14.1953125, 16.2705078125, 18.345703125, 20.4208984375, 22.49609375, 24.5712890625, 26.646484375, 28.7216796875, 30.796875, 32.8720703125, 34.947265625, 37.0224609375, 39.09765625, 41.1728515625, 43.248046875, 45.3232421875, 47.3984375, 49.4736328125, 51.548828125, 53.6240234375, 55.69921875, 57.7744140625, 59.849609375, 61.9248046875, 64.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 18.0, 104.0, 328.0, 355.0, 160.0, 35.0, 9.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.740604400634766, -36.489803314208984, -34.23899841308594, -31.988197326660156, -29.737394332885742, -27.486591339111328, -25.235790252685547, -22.984987258911133, -20.73418426513672, -18.483381271362305, -16.23257827758789, -13.98177719116211, -11.730974197387695, -9.480171203613281, -7.229369163513184, -4.978567123413086, -2.727764129638672, -0.476961612701416, 1.7738409042358398, 4.024643421173096, 6.275445938110352, 8.526248931884766, 10.777050971984863, 13.027853012084961, 15.278656005859375, 17.52945899963379, 19.780261993408203, 22.031063079833984, 24.2818660736084, 26.532669067382812, 28.783470153808594, 31.034273147583008, 33.28507995605469, 35.53588104248047, 37.786685943603516, 40.0374870300293, 42.288291931152344, 44.539093017578125, 46.789894104003906, 49.04069519042969, 51.291500091552734, 53.542301177978516, 55.79310607910156, 58.043907165527344, 60.294708251953125, 62.54551315307617, 64.79631805419922, 67.047119140625, 69.29792022705078, 71.54872131347656, 73.79952239990234, 76.05033111572266, 78.30113220214844, 80.55193328857422, 82.802734375, 85.05353546142578, 87.30433654785156, 89.55513763427734, 91.80593872070312, 94.05674743652344, 96.30754852294922, 98.558349609375, 100.80915069580078, 103.05995178222656, 105.31076049804688]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 6.0, 11.0, 8.0, 18.0, 16.0, 13.0, 27.0, 25.0, 29.0, 19.0, 30.0, 33.0, 17.0, 33.0, 42.0, 35.0, 43.0, 29.0, 41.0, 27.0, 32.0, 29.0, 45.0, 34.0, 43.0, 31.0, 42.0, 25.0, 24.0, 30.0, 12.0, 22.0, 17.0, 21.0, 12.0, 11.0, 7.0, 6.0, 7.0, 5.0, 6.0, 1.0, 3.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-53.75586700439453, -52.113704681396484, -50.4715461730957, -48.829383850097656, -47.187225341796875, -45.54506301879883, -43.90290069580078, -42.2607421875, -40.61857986450195, -38.976417541503906, -37.334259033203125, -35.69209671020508, -34.04993438720703, -32.40777587890625, -30.765613555908203, -29.12345314025879, -27.481292724609375, -25.83913230895996, -24.196971893310547, -22.5548095703125, -20.912649154663086, -19.270488739013672, -17.628326416015625, -15.986166000366211, -14.344005584716797, -12.701845169067383, -11.059683799743652, -9.417522430419922, -7.775362014770508, -6.133201599121094, -4.491040229797363, -2.848878860473633, -1.2067146301269531, 0.43544626235961914, 2.0776071548461914, 3.7197680473327637, 5.361928939819336, 7.00408935546875, 8.64625072479248, 10.288412094116211, 11.930572509765625, 13.572732925415039, 15.21489429473877, 16.8570556640625, 18.499216079711914, 20.141376495361328, 21.783538818359375, 23.42569923400879, 25.067859649658203, 26.710020065307617, 28.35218048095703, 29.994342803955078, 31.636503219604492, 33.278663635253906, 34.92082595825195, 36.56298828125, 38.20514678955078, 39.84730911254883, 41.48946762084961, 43.131629943847656, 44.77378845214844, 46.415950775146484, 48.05811309814453, 49.70027160644531, 51.34243392944336]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 5.0, 12.0, 14.0, 19.0, 20.0, 13.0, 22.0, 28.0, 36.0, 25.0, 27.0, 34.0, 29.0, 35.0, 37.0, 38.0, 39.0, 46.0, 45.0, 23.0, 44.0, 32.0, 35.0, 31.0, 32.0, 31.0, 23.0, 22.0, 20.0, 17.0, 21.0, 23.0, 16.0, 13.0, 13.0, 8.0, 7.0, 9.0, 4.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.98828125, -5.80670166015625, -5.6251220703125, -5.44354248046875, -5.261962890625, -5.08038330078125, -4.8988037109375, -4.71722412109375, -4.53564453125, -4.35406494140625, -4.1724853515625, -3.99090576171875, -3.809326171875, -3.62774658203125, -3.4461669921875, -3.26458740234375, -3.0830078125, -2.90142822265625, -2.7198486328125, -2.53826904296875, -2.356689453125, -2.17510986328125, -1.9935302734375, -1.81195068359375, -1.63037109375, -1.44879150390625, -1.2672119140625, -1.08563232421875, -0.904052734375, -0.72247314453125, -0.5408935546875, -0.35931396484375, -0.177734375, 0.00384521484375, 0.1854248046875, 0.36700439453125, 0.548583984375, 0.73016357421875, 0.9117431640625, 1.09332275390625, 1.27490234375, 1.45648193359375, 1.6380615234375, 1.81964111328125, 2.001220703125, 2.18280029296875, 2.3643798828125, 2.54595947265625, 2.7275390625, 2.90911865234375, 3.0906982421875, 3.27227783203125, 3.453857421875, 3.63543701171875, 3.8170166015625, 3.99859619140625, 4.18017578125, 4.36175537109375, 4.5433349609375, 4.72491455078125, 4.906494140625, 5.08807373046875, 5.2696533203125, 5.45123291015625, 5.6328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 3.0, 6.0, 4.0, 6.0, 11.0, 15.0, 18.0, 11.0, 27.0, 25.0, 28.0, 32.0, 47.0, 49.0, 86.0, 161.0, 315.0, 1127.0, 8547.0, 401716.0, 3526349.0, 247589.0, 6338.0, 952.0, 320.0, 138.0, 66.0, 42.0, 31.0, 27.0, 25.0, 24.0, 26.0, 11.0, 19.0, 21.0, 10.0, 7.0, 11.0, 4.0, 9.0, 4.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.71875, -24.97216796875, -24.2255859375, -23.47900390625, -22.732421875, -21.98583984375, -21.2392578125, -20.49267578125, -19.74609375, -18.99951171875, -18.2529296875, -17.50634765625, -16.759765625, -16.01318359375, -15.2666015625, -14.52001953125, -13.7734375, -13.02685546875, -12.2802734375, -11.53369140625, -10.787109375, -10.04052734375, -9.2939453125, -8.54736328125, -7.80078125, -7.05419921875, -6.3076171875, -5.56103515625, -4.814453125, -4.06787109375, -3.3212890625, -2.57470703125, -1.828125, -1.08154296875, -0.3349609375, 0.41162109375, 1.158203125, 1.90478515625, 2.6513671875, 3.39794921875, 4.14453125, 4.89111328125, 5.6376953125, 6.38427734375, 7.130859375, 7.87744140625, 8.6240234375, 9.37060546875, 10.1171875, 10.86376953125, 11.6103515625, 12.35693359375, 13.103515625, 13.85009765625, 14.5966796875, 15.34326171875, 16.08984375, 16.83642578125, 17.5830078125, 18.32958984375, 19.076171875, 19.82275390625, 20.5693359375, 21.31591796875, 22.0625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 11.0, 7.0, 8.0, 12.0, 17.0, 39.0, 42.0, 40.0, 59.0, 84.0, 102.0, 172.0, 198.0, 327.0, 379.0, 417.0, 474.0, 381.0, 313.0, 281.0, 181.0, 139.0, 90.0, 79.0, 53.0, 52.0, 21.0, 27.0, 21.0, 13.0, 7.0, 6.0, 3.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.0625, -16.637939453125, -16.21337890625, -15.788818359375, -15.3642578125, -14.939697265625, -14.51513671875, -14.090576171875, -13.666015625, -13.241455078125, -12.81689453125, -12.392333984375, -11.9677734375, -11.543212890625, -11.11865234375, -10.694091796875, -10.26953125, -9.844970703125, -9.42041015625, -8.995849609375, -8.5712890625, -8.146728515625, -7.72216796875, -7.297607421875, -6.873046875, -6.448486328125, -6.02392578125, -5.599365234375, -5.1748046875, -4.750244140625, -4.32568359375, -3.901123046875, -3.4765625, -3.052001953125, -2.62744140625, -2.202880859375, -1.7783203125, -1.353759765625, -0.92919921875, -0.504638671875, -0.080078125, 0.344482421875, 0.76904296875, 1.193603515625, 1.6181640625, 2.042724609375, 2.46728515625, 2.891845703125, 3.31640625, 3.740966796875, 4.16552734375, 4.590087890625, 5.0146484375, 5.439208984375, 5.86376953125, 6.288330078125, 6.712890625, 7.137451171875, 7.56201171875, 7.986572265625, 8.4111328125, 8.835693359375, 9.26025390625, 9.684814453125, 10.109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 2.0, 2.0, 8.0, 9.0, 9.0, 13.0, 11.0, 24.0, 26.0, 32.0, 51.0, 80.0, 77.0, 143.0, 256.0, 442.0, 1267.0, 179866.0, 4006200.0, 4242.0, 642.0, 290.0, 168.0, 110.0, 85.0, 71.0, 47.0, 28.0, 23.0, 20.0, 13.0, 8.0, 6.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.375, -72.8818359375, -70.388671875, -67.8955078125, -65.40234375, -62.9091796875, -60.416015625, -57.9228515625, -55.4296875, -52.9365234375, -50.443359375, -47.9501953125, -45.45703125, -42.9638671875, -40.470703125, -37.9775390625, -35.484375, -32.9912109375, -30.498046875, -28.0048828125, -25.51171875, -23.0185546875, -20.525390625, -18.0322265625, -15.5390625, -13.0458984375, -10.552734375, -8.0595703125, -5.56640625, -3.0732421875, -0.580078125, 1.9130859375, 4.40625, 6.8994140625, 9.392578125, 11.8857421875, 14.37890625, 16.8720703125, 19.365234375, 21.8583984375, 24.3515625, 26.8447265625, 29.337890625, 31.8310546875, 34.32421875, 36.8173828125, 39.310546875, 41.8037109375, 44.296875, 46.7900390625, 49.283203125, 51.7763671875, 54.26953125, 56.7626953125, 59.255859375, 61.7490234375, 64.2421875, 66.7353515625, 69.228515625, 71.7216796875, 74.21484375, 76.7080078125, 79.201171875, 81.6943359375, 84.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 258.0, 662.0, 93.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.84001159667969, -62.19826889038086, -50.55652618408203, -38.91478729248047, -27.27304458618164, -15.631301879882812, -3.98956298828125, 7.652183532714844, 19.293922424316406, 30.935665130615234, 42.57740783691406, 54.219146728515625, 65.86088562011719, 77.50263214111328, 89.14437103271484, 100.78611755371094, 112.4278564453125, 124.06959533691406, 135.71133422851562, 147.35308837890625, 158.9948272705078, 170.63656616210938, 182.27830505371094, 193.9200439453125, 205.56179809570312, 217.2035369873047, 228.84527587890625, 240.48703002929688, 252.12876892089844, 263.7705078125, 275.4122314453125, 287.0539855957031, 298.6957092285156, 310.33746337890625, 321.97918701171875, 333.6209411621094, 345.2626647949219, 356.9044189453125, 368.546142578125, 380.1878967285156, 391.82965087890625, 403.4714050292969, 415.1131286621094, 426.7548828125, 438.3966064453125, 450.0383605957031, 461.68011474609375, 473.32183837890625, 484.96356201171875, 496.6053161621094, 508.2470397949219, 519.8887939453125, 531.530517578125, 543.1722412109375, 554.8140258789062, 566.4557495117188, 578.0975341796875, 589.7392578125, 601.3810424804688, 613.0227661132812, 624.6644897460938, 636.3062744140625, 647.947998046875, 659.5897216796875, 671.2314453125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 8.0, 5.0, 6.0, 13.0, 19.0, 23.0, 23.0, 26.0, 16.0, 23.0, 28.0, 36.0, 40.0, 41.0, 62.0, 43.0, 58.0, 41.0, 37.0, 47.0, 46.0, 43.0, 39.0, 29.0, 41.0, 31.0, 36.0, 25.0, 22.0, 21.0, 12.0, 7.0, 19.0, 9.0, 4.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.849853515625, -52.315155029296875, -50.78045654296875, -49.24576187133789, -47.711063385009766, -46.17636489868164, -44.64167022705078, -43.106971740722656, -41.57227325439453, -40.037574768066406, -38.50287628173828, -36.96818161010742, -35.4334831237793, -33.89878463745117, -32.36408996582031, -30.829391479492188, -29.294692993164062, -27.759994506835938, -26.225297927856445, -24.690601348876953, -23.155902862548828, -21.621204376220703, -20.08650779724121, -18.55181121826172, -17.017112731933594, -15.482415199279785, -13.947717666625977, -12.413020133972168, -10.87832260131836, -9.34362506866455, -7.808927536010742, -6.274230003356934, -4.739532470703125, -3.2048349380493164, -1.6701374053955078, -0.13543987274169922, 1.3992576599121094, 2.933955192565918, 4.468652725219727, 6.003350257873535, 7.538047790527344, 9.072745323181152, 10.607442855834961, 12.14214038848877, 13.676837921142578, 15.211535453796387, 16.746232986450195, 18.280929565429688, 19.815628051757812, 21.350326538085938, 22.88502311706543, 24.419719696044922, 25.954418182373047, 27.489116668701172, 29.023813247680664, 30.558509826660156, 32.09320831298828, 33.627906799316406, 35.16260528564453, 36.69729995727539, 38.231998443603516, 39.76669692993164, 41.3013916015625, 42.836090087890625, 44.37078857421875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 5.0, 4.0, 16.0, 11.0, 24.0, 16.0, 27.0, 18.0, 16.0, 28.0, 36.0, 29.0, 23.0, 31.0, 28.0, 39.0, 53.0, 36.0, 41.0, 46.0, 45.0, 26.0, 25.0, 33.0, 34.0, 32.0, 26.0, 27.0, 27.0, 16.0, 16.0, 21.0, 21.0, 21.0, 14.0, 14.0, 9.0, 6.0, 12.0, 10.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-6.33984375, -6.15875244140625, -5.9776611328125, -5.79656982421875, -5.615478515625, -5.43438720703125, -5.2532958984375, -5.07220458984375, -4.89111328125, -4.71002197265625, -4.5289306640625, -4.34783935546875, -4.166748046875, -3.98565673828125, -3.8045654296875, -3.62347412109375, -3.4423828125, -3.26129150390625, -3.0802001953125, -2.89910888671875, -2.718017578125, -2.53692626953125, -2.3558349609375, -2.17474365234375, -1.99365234375, -1.81256103515625, -1.6314697265625, -1.45037841796875, -1.269287109375, -1.08819580078125, -0.9071044921875, -0.72601318359375, -0.544921875, -0.36383056640625, -0.1827392578125, -0.00164794921875, 0.179443359375, 0.36053466796875, 0.5416259765625, 0.72271728515625, 0.90380859375, 1.08489990234375, 1.2659912109375, 1.44708251953125, 1.628173828125, 1.80926513671875, 1.9903564453125, 2.17144775390625, 2.3525390625, 2.53363037109375, 2.7147216796875, 2.89581298828125, 3.076904296875, 3.25799560546875, 3.4390869140625, 3.62017822265625, 3.80126953125, 3.98236083984375, 4.1634521484375, 4.34454345703125, 4.525634765625, 4.70672607421875, 4.8878173828125, 5.06890869140625, 5.25]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 15.0, 24.0, 35.0, 52.0, 71.0, 136.0, 174.0, 309.0, 441.0, 659.0, 1085.0, 1529.0, 2305.0, 3627.0, 5376.0, 7982.0, 12321.0, 18546.0, 28616.0, 44514.0, 71159.0, 116894.0, 207213.0, 208839.0, 117256.0, 70780.0, 44711.0, 28647.0, 18764.0, 12428.0, 8021.0, 5409.0, 3651.0, 2391.0, 1584.0, 1011.0, 656.0, 469.0, 310.0, 179.0, 137.0, 75.0, 53.0, 33.0, 25.0, 16.0, 7.0, 8.0, 5.0, 1.0, 0.0, 2.0], "bins": [-0.92431640625, -0.8979110717773438, -0.8715057373046875, -0.8451004028320312, -0.818695068359375, -0.7922897338867188, -0.7658843994140625, -0.7394790649414062, -0.71307373046875, -0.6866683959960938, -0.6602630615234375, -0.6338577270507812, -0.607452392578125, -0.5810470581054688, -0.5546417236328125, -0.5282363891601562, -0.5018310546875, -0.47542572021484375, -0.4490203857421875, -0.42261505126953125, -0.396209716796875, -0.36980438232421875, -0.3433990478515625, -0.31699371337890625, -0.29058837890625, -0.26418304443359375, -0.2377777099609375, -0.21137237548828125, -0.184967041015625, -0.15856170654296875, -0.1321563720703125, -0.10575103759765625, -0.079345703125, -0.05294036865234375, -0.0265350341796875, -0.00012969970703125, 0.026275634765625, 0.05268096923828125, 0.0790863037109375, 0.10549163818359375, 0.13189697265625, 0.15830230712890625, 0.1847076416015625, 0.21111297607421875, 0.237518310546875, 0.26392364501953125, 0.2903289794921875, 0.31673431396484375, 0.3431396484375, 0.36954498291015625, 0.3959503173828125, 0.42235565185546875, 0.448760986328125, 0.47516632080078125, 0.5015716552734375, 0.5279769897460938, 0.55438232421875, 0.5807876586914062, 0.6071929931640625, 0.6335983276367188, 0.660003662109375, 0.6864089965820312, 0.7128143310546875, 0.7392196655273438, 0.765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 4.0, 5.0, 6.0, 8.0, 17.0, 13.0, 16.0, 14.0, 18.0, 18.0, 23.0, 29.0, 29.0, 37.0, 34.0, 34.0, 35.0, 39.0, 34.0, 34.0, 1058.0, 41.0, 49.0, 47.0, 46.0, 41.0, 33.0, 36.0, 28.0, 34.0, 27.0, 22.0, 23.0, 16.0, 17.0, 9.0, 11.0, 9.0, 2.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.42578125, -4.29473876953125, -4.1636962890625, -4.03265380859375, -3.901611328125, -3.77056884765625, -3.6395263671875, -3.50848388671875, -3.37744140625, -3.24639892578125, -3.1153564453125, -2.98431396484375, -2.853271484375, -2.72222900390625, -2.5911865234375, -2.46014404296875, -2.3291015625, -2.19805908203125, -2.0670166015625, -1.93597412109375, -1.804931640625, -1.67388916015625, -1.5428466796875, -1.41180419921875, -1.28076171875, -1.14971923828125, -1.0186767578125, -0.88763427734375, -0.756591796875, -0.62554931640625, -0.4945068359375, -0.36346435546875, -0.232421875, -0.10137939453125, 0.0296630859375, 0.16070556640625, 0.291748046875, 0.42279052734375, 0.5538330078125, 0.68487548828125, 0.81591796875, 0.94696044921875, 1.0780029296875, 1.20904541015625, 1.340087890625, 1.47113037109375, 1.6021728515625, 1.73321533203125, 1.8642578125, 1.99530029296875, 2.1263427734375, 2.25738525390625, 2.388427734375, 2.51947021484375, 2.6505126953125, 2.78155517578125, 2.91259765625, 3.04364013671875, 3.1746826171875, 3.30572509765625, 3.436767578125, 3.56781005859375, 3.6988525390625, 3.82989501953125, 3.9609375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 13.0, 13.0, 14.0, 31.0, 28.0, 63.0, 58.0, 108.0, 148.0, 213.0, 294.0, 424.0, 657.0, 949.0, 1370.0, 2061.0, 3113.0, 4606.0, 6690.0, 10288.0, 15714.0, 25010.0, 40405.0, 68286.0, 118651.0, 245184.0, 1247725.0, 121382.0, 69535.0, 41066.0, 25315.0, 16271.0, 10417.0, 6846.0, 4583.0, 3128.0, 2043.0, 1364.0, 958.0, 665.0, 439.0, 288.0, 234.0, 138.0, 125.0, 63.0, 56.0, 41.0, 24.0, 17.0, 3.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.82080078125, -0.79345703125, -0.76611328125, -0.73876953125, -0.71142578125, -0.68408203125, -0.65673828125, -0.62939453125, -0.60205078125, -0.57470703125, -0.54736328125, -0.52001953125, -0.49267578125, -0.46533203125, -0.43798828125, -0.41064453125, -0.38330078125, -0.35595703125, -0.32861328125, -0.30126953125, -0.27392578125, -0.24658203125, -0.21923828125, -0.19189453125, -0.16455078125, -0.13720703125, -0.10986328125, -0.08251953125, -0.05517578125, -0.02783203125, -0.00048828125, 0.02685546875, 0.05419921875, 0.08154296875, 0.10888671875, 0.13623046875, 0.16357421875, 0.19091796875, 0.21826171875, 0.24560546875, 0.27294921875, 0.30029296875, 0.32763671875, 0.35498046875, 0.38232421875, 0.40966796875, 0.43701171875, 0.46435546875, 0.49169921875, 0.51904296875, 0.54638671875, 0.57373046875, 0.60107421875, 0.62841796875, 0.65576171875, 0.68310546875, 0.71044921875, 0.73779296875, 0.76513671875, 0.79248046875, 0.81982421875, 0.84716796875, 0.87451171875, 0.90185546875, 0.92919921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 3.0, 17.0, 10.0, 19.0, 26.0, 32.0, 35.0, 50.0, 50.0, 69.0, 61.0, 86.0, 79.0, 74.0, 54.0, 63.0, 61.0, 37.0, 29.0, 28.0, 24.0, 21.0, 19.0, 8.0, 13.0, 5.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011577606201171875, -0.0011221617460250854, -0.0010865628719329834, -0.0010509639978408813, -0.0010153651237487793, -0.0009797662496566772, -0.0009441673755645752, -0.0009085685014724731, -0.0008729696273803711, -0.000837370753288269, -0.000801771879196167, -0.0007661730051040649, -0.0007305741310119629, -0.0006949752569198608, -0.0006593763828277588, -0.0006237775087356567, -0.0005881786346435547, -0.0005525797605514526, -0.0005169808864593506, -0.00048138201236724854, -0.0004457831382751465, -0.00041018426418304443, -0.0003745853900909424, -0.00033898651599884033, -0.0003033876419067383, -0.00026778876781463623, -0.00023218989372253418, -0.00019659101963043213, -0.00016099214553833008, -0.00012539327144622803, -8.979439735412598e-05, -5.4195523262023926e-05, -1.8596649169921875e-05, 1.7002224922180176e-05, 5.2601099014282227e-05, 8.819997310638428e-05, 0.00012379884719848633, 0.00015939772129058838, 0.00019499659538269043, 0.00023059546947479248, 0.00026619434356689453, 0.0003017932176589966, 0.00033739209175109863, 0.0003729909658432007, 0.00040858983993530273, 0.0004441887140274048, 0.00047978758811950684, 0.0005153864622116089, 0.0005509853363037109, 0.000586584210395813, 0.000622183084487915, 0.0006577819585800171, 0.0006933808326721191, 0.0007289797067642212, 0.0007645785808563232, 0.0008001774549484253, 0.0008357763290405273, 0.0008713752031326294, 0.0009069740772247314, 0.0009425729513168335, 0.0009781718254089355, 0.0010137706995010376, 0.0010493695735931396, 0.0010849684476852417, 0.0011205673217773438]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 3.0, 5.0, 7.0, 15.0, 11.0, 21.0, 27.0, 26.0, 46.0, 41.0, 86.0, 171.0, 428.0, 2580.0, 1041289.0, 2850.0, 453.0, 164.0, 91.0, 60.0, 49.0, 32.0, 27.0, 21.0, 10.0, 17.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027587890625, -0.02662038803100586, -0.02565288543701172, -0.024685382843017578, -0.023717880249023438, -0.022750377655029297, -0.021782875061035156, -0.020815372467041016, -0.019847869873046875, -0.018880367279052734, -0.017912864685058594, -0.016945362091064453, -0.015977859497070312, -0.015010356903076172, -0.014042854309082031, -0.01307535171508789, -0.01210784912109375, -0.01114034652709961, -0.010172843933105469, -0.009205341339111328, -0.008237838745117188, -0.007270336151123047, -0.006302833557128906, -0.005335330963134766, -0.004367828369140625, -0.0034003257751464844, -0.0024328231811523438, -0.0014653205871582031, -0.0004978179931640625, 0.0004696846008300781, 0.0014371871948242188, 0.0024046897888183594, 0.0033721923828125, 0.004339694976806641, 0.005307197570800781, 0.006274700164794922, 0.0072422027587890625, 0.008209705352783203, 0.009177207946777344, 0.010144710540771484, 0.011112213134765625, 0.012079715728759766, 0.013047218322753906, 0.014014720916748047, 0.014982223510742188, 0.015949726104736328, 0.01691722869873047, 0.01788473129272461, 0.01885223388671875, 0.01981973648071289, 0.02078723907470703, 0.021754741668701172, 0.022722244262695312, 0.023689746856689453, 0.024657249450683594, 0.025624752044677734, 0.026592254638671875, 0.027559757232666016, 0.028527259826660156, 0.029494762420654297, 0.030462265014648438, 0.03142976760864258, 0.03239727020263672, 0.03336477279663086, 0.034332275390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 88.0, 569.0, 325.0, 27.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004656884353607893, -0.004557330626994371, -0.00445777690038085, -0.004358223639428616, -0.004258669912815094, -0.004159116186201572, -0.004059562459588051, -0.003960008732974529, -0.0038604550063610077, -0.003760901279747486, -0.003661347785964608, -0.0035617940593510866, -0.003462240332737565, -0.003362686838954687, -0.0032631331123411655, -0.003163579385727644, -0.003064025891944766, -0.0029644721653312445, -0.0028649186715483665, -0.002765364944934845, -0.0026658112183213234, -0.002566257491707802, -0.002466703997924924, -0.0023671502713114023, -0.0022675967775285244, -0.002168043050915003, -0.002068489557132125, -0.0019689358305186033, -0.0018693821039050817, -0.001769828493706882, -0.0016702748835086823, -0.0015707211568951607, -0.001471167430281639, -0.0013716138200834394, -0.0012720600934699178, -0.001172506483271718, -0.0010729527566581964, -0.0009733991464599967, -0.000873845536261797, -0.0007742918678559363, -0.0006747381994500756, -0.000575184531044215, -0.00047563089174218476, -0.00037607725244015455, -0.0002765235840342939, -0.00017696991562843323, -7.741630543023348e-05, 2.2137362975627184e-05, 0.00012169103138148785, 0.00022124468523543328, 0.0003207983390893787, 0.0004203519783914089, 0.0005199056467972696, 0.0006194593152031302, 0.00071901292540133, 0.0008185665938071907, 0.0009181202622130513, 0.001017673872411251, 0.0011172275990247726, 0.0012167812092229724, 0.0013163348194211721, 0.0014158885460346937, 0.0015154421562328935, 0.0016149957664310932, 0.0017145494930446148]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 13.0, 10.0, 11.0, 10.0, 8.0, 11.0, 11.0, 17.0, 22.0, 33.0, 34.0, 30.0, 28.0, 32.0, 33.0, 33.0, 39.0, 36.0, 52.0, 39.0, 44.0, 46.0, 39.0, 28.0, 31.0, 34.0, 22.0, 36.0, 30.0, 29.0, 29.0, 22.0, 21.0, 14.0, 16.0, 8.0, 7.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00044977664947509766, -0.00043544545769691467, -0.0004211142659187317, -0.0004067830741405487, -0.0003924518823623657, -0.00037812069058418274, -0.00036378949880599976, -0.00034945830702781677, -0.0003351271152496338, -0.0003207959234714508, -0.0003064647316932678, -0.00029213353991508484, -0.00027780234813690186, -0.00026347115635871887, -0.0002491399645805359, -0.0002348087728023529, -0.00022047758102416992, -0.00020614638924598694, -0.00019181519746780396, -0.00017748400568962097, -0.000163152813911438, -0.000148821622133255, -0.00013449043035507202, -0.00012015923857688904, -0.00010582804679870605, -9.149685502052307e-05, -7.716566324234009e-05, -6.28344714641571e-05, -4.850327968597412e-05, -3.417208790779114e-05, -1.9840896129608154e-05, -5.509704351425171e-06, 8.821487426757812e-06, 2.3152679204940796e-05, 3.748387098312378e-05, 5.181506276130676e-05, 6.614625453948975e-05, 8.047744631767273e-05, 9.480863809585571e-05, 0.0001091398298740387, 0.00012347102165222168, 0.00013780221343040466, 0.00015213340520858765, 0.00016646459698677063, 0.0001807957887649536, 0.0001951269805431366, 0.00020945817232131958, 0.00022378936409950256, 0.00023812055587768555, 0.00025245174765586853, 0.0002667829394340515, 0.0002811141312122345, 0.0002954453229904175, 0.00030977651476860046, 0.00032410770654678345, 0.00033843889832496643, 0.0003527700901031494, 0.0003671012818813324, 0.0003814324736595154, 0.00039576366543769836, 0.00041009485721588135, 0.00042442604899406433, 0.0004387572407722473, 0.0004530884325504303, 0.0004674196243286133]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 5.0, 4.0, 16.0, 11.0, 24.0, 16.0, 27.0, 18.0, 16.0, 28.0, 36.0, 29.0, 23.0, 31.0, 28.0, 39.0, 53.0, 36.0, 41.0, 46.0, 45.0, 26.0, 25.0, 33.0, 34.0, 32.0, 26.0, 27.0, 27.0, 16.0, 16.0, 21.0, 21.0, 21.0, 14.0, 14.0, 9.0, 6.0, 12.0, 10.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-6.33984375, -6.15875244140625, -5.9776611328125, -5.79656982421875, -5.615478515625, -5.43438720703125, -5.2532958984375, -5.07220458984375, -4.89111328125, -4.71002197265625, -4.5289306640625, -4.34783935546875, -4.166748046875, -3.98565673828125, -3.8045654296875, -3.62347412109375, -3.4423828125, -3.26129150390625, -3.0802001953125, -2.89910888671875, -2.718017578125, -2.53692626953125, -2.3558349609375, -2.17474365234375, -1.99365234375, -1.81256103515625, -1.6314697265625, -1.45037841796875, -1.269287109375, -1.08819580078125, -0.9071044921875, -0.72601318359375, -0.544921875, -0.36383056640625, -0.1827392578125, -0.00164794921875, 0.179443359375, 0.36053466796875, 0.5416259765625, 0.72271728515625, 0.90380859375, 1.08489990234375, 1.2659912109375, 1.44708251953125, 1.628173828125, 1.80926513671875, 1.9903564453125, 2.17144775390625, 2.3525390625, 2.53363037109375, 2.7147216796875, 2.89581298828125, 3.076904296875, 3.25799560546875, 3.4390869140625, 3.62017822265625, 3.80126953125, 3.98236083984375, 4.1634521484375, 4.34454345703125, 4.525634765625, 4.70672607421875, 4.8878173828125, 5.06890869140625, 5.25]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 11.0, 7.0, 11.0, 25.0, 16.0, 28.0, 33.0, 38.0, 66.0, 75.0, 123.0, 165.0, 226.0, 327.0, 490.0, 716.0, 1221.0, 2178.0, 3851.0, 7710.0, 15951.0, 35526.0, 82909.0, 210717.0, 390819.0, 169699.0, 67418.0, 29631.0, 13528.0, 6512.0, 3396.0, 1832.0, 1108.0, 683.0, 439.0, 293.0, 200.0, 148.0, 110.0, 63.0, 72.0, 50.0, 29.0, 26.0, 18.0, 14.0, 15.0, 8.0, 8.0, 6.0, 6.0, 4.0, 1.0, 0.0, 3.0], "bins": [-5.125, -4.97149658203125, -4.8179931640625, -4.66448974609375, -4.510986328125, -4.35748291015625, -4.2039794921875, -4.05047607421875, -3.89697265625, -3.74346923828125, -3.5899658203125, -3.43646240234375, -3.282958984375, -3.12945556640625, -2.9759521484375, -2.82244873046875, -2.6689453125, -2.51544189453125, -2.3619384765625, -2.20843505859375, -2.054931640625, -1.90142822265625, -1.7479248046875, -1.59442138671875, -1.44091796875, -1.28741455078125, -1.1339111328125, -0.98040771484375, -0.826904296875, -0.67340087890625, -0.5198974609375, -0.36639404296875, -0.212890625, -0.05938720703125, 0.0941162109375, 0.24761962890625, 0.401123046875, 0.55462646484375, 0.7081298828125, 0.86163330078125, 1.01513671875, 1.16864013671875, 1.3221435546875, 1.47564697265625, 1.629150390625, 1.78265380859375, 1.9361572265625, 2.08966064453125, 2.2431640625, 2.39666748046875, 2.5501708984375, 2.70367431640625, 2.857177734375, 3.01068115234375, 3.1641845703125, 3.31768798828125, 3.47119140625, 3.62469482421875, 3.7781982421875, 3.93170166015625, 4.085205078125, 4.23870849609375, 4.3922119140625, 4.54571533203125, 4.69921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 4.0, 1.0, 3.0, 6.0, 6.0, 14.0, 15.0, 12.0, 14.0, 23.0, 15.0, 16.0, 40.0, 23.0, 36.0, 44.0, 45.0, 47.0, 57.0, 61.0, 120.0, 355.0, 1460.0, 150.0, 78.0, 53.0, 38.0, 41.0, 41.0, 24.0, 28.0, 35.0, 26.0, 20.0, 17.0, 11.0, 19.0, 12.0, 8.0, 4.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.723876953125, -18.05712890625, -17.390380859375, -16.7236328125, -16.056884765625, -15.39013671875, -14.723388671875, -14.056640625, -13.389892578125, -12.72314453125, -12.056396484375, -11.3896484375, -10.722900390625, -10.05615234375, -9.389404296875, -8.72265625, -8.055908203125, -7.38916015625, -6.722412109375, -6.0556640625, -5.388916015625, -4.72216796875, -4.055419921875, -3.388671875, -2.721923828125, -2.05517578125, -1.388427734375, -0.7216796875, -0.054931640625, 0.61181640625, 1.278564453125, 1.9453125, 2.612060546875, 3.27880859375, 3.945556640625, 4.6123046875, 5.279052734375, 5.94580078125, 6.612548828125, 7.279296875, 7.946044921875, 8.61279296875, 9.279541015625, 9.9462890625, 10.613037109375, 11.27978515625, 11.946533203125, 12.61328125, 13.280029296875, 13.94677734375, 14.613525390625, 15.2802734375, 15.947021484375, 16.61376953125, 17.280517578125, 17.947265625, 18.614013671875, 19.28076171875, 19.947509765625, 20.6142578125, 21.281005859375, 21.94775390625, 22.614501953125, 23.28125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 9.0, 15.0, 23.0, 26.0, 46.0, 56.0, 88.0, 125.0, 178.0, 328.0, 628.0, 3091.0, 3109574.0, 29385.0, 1016.0, 403.0, 237.0, 130.0, 115.0, 68.0, 53.0, 47.0, 18.0, 13.0, 4.0, 17.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.1875, -56.580078125, -53.97265625, -51.365234375, -48.7578125, -46.150390625, -43.54296875, -40.935546875, -38.328125, -35.720703125, -33.11328125, -30.505859375, -27.8984375, -25.291015625, -22.68359375, -20.076171875, -17.46875, -14.861328125, -12.25390625, -9.646484375, -7.0390625, -4.431640625, -1.82421875, 0.783203125, 3.390625, 5.998046875, 8.60546875, 11.212890625, 13.8203125, 16.427734375, 19.03515625, 21.642578125, 24.25, 26.857421875, 29.46484375, 32.072265625, 34.6796875, 37.287109375, 39.89453125, 42.501953125, 45.109375, 47.716796875, 50.32421875, 52.931640625, 55.5390625, 58.146484375, 60.75390625, 63.361328125, 65.96875, 68.576171875, 71.18359375, 73.791015625, 76.3984375, 79.005859375, 81.61328125, 84.220703125, 86.828125, 89.435546875, 92.04296875, 94.650390625, 97.2578125, 99.865234375, 102.47265625, 105.080078125, 107.6875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 9.0, 24.0, 78.0, 134.0, 201.0, 206.0, 182.0, 100.0, 46.0, 12.0, 8.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.25172424316406, -45.908782958984375, -44.56583786010742, -43.222896575927734, -41.87995529174805, -40.537010192871094, -39.194068908691406, -37.85112762451172, -36.50818634033203, -35.165245056152344, -33.82229995727539, -32.4793586730957, -31.136417388916016, -29.793474197387695, -28.450531005859375, -27.107589721679688, -25.764644622802734, -24.421701431274414, -23.078760147094727, -21.735816955566406, -20.39287567138672, -19.0499324798584, -17.706989288330078, -16.36404800415039, -15.02110481262207, -13.678162574768066, -12.335220336914062, -10.992277145385742, -9.649334907531738, -8.306392669677734, -6.963449478149414, -5.62050724029541, -4.277565002441406, -2.9346225261688232, -1.5916800498962402, -0.24873733520507812, 1.0942049026489258, 2.4371471405029297, 3.78009033203125, 5.123032569885254, 6.465974807739258, 7.808917045593262, 9.151859283447266, 10.494802474975586, 11.83774471282959, 13.180686950683594, 14.523630142211914, 15.866572380065918, 17.209514617919922, 18.552457809448242, 19.89539909362793, 21.23834228515625, 22.581283569335938, 23.924226760864258, 25.267169952392578, 26.610111236572266, 27.953054428100586, 29.295997619628906, 30.638938903808594, 31.981882095336914, 33.324825286865234, 34.66776657104492, 36.010711669921875, 37.35365295410156, 38.69659423828125]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 11.0, 14.0, 24.0, 21.0, 20.0, 14.0, 18.0, 33.0, 43.0, 52.0, 29.0, 31.0, 46.0, 44.0, 45.0, 33.0, 56.0, 56.0, 43.0, 47.0, 30.0, 37.0, 32.0, 27.0, 30.0, 31.0, 15.0, 18.0, 14.0, 12.0, 10.0, 12.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.30511474609375, -67.20457458496094, -65.10403442382812, -63.00349426269531, -60.9029541015625, -58.80241394042969, -56.701873779296875, -54.60133361816406, -52.50079345703125, -50.40025329589844, -48.299713134765625, -46.19917297363281, -44.0986328125, -41.99809265136719, -39.897552490234375, -37.79701232910156, -35.69647216796875, -33.59593200683594, -31.495391845703125, -29.394851684570312, -27.2943115234375, -25.193771362304688, -23.093231201171875, -20.992691040039062, -18.89215087890625, -16.791610717773438, -14.691070556640625, -12.590530395507812, -10.489990234375, -8.389450073242188, -6.288909912109375, -4.1883697509765625, -2.08782958984375, 0.0127105712890625, 2.113250732421875, 4.2137908935546875, 6.3143310546875, 8.414871215820312, 10.515411376953125, 12.615951538085938, 14.71649169921875, 16.817031860351562, 18.917572021484375, 21.018112182617188, 23.11865234375, 25.219192504882812, 27.319732666015625, 29.420272827148438, 31.52081298828125, 33.62135314941406, 35.721893310546875, 37.82243347167969, 39.9229736328125, 42.02351379394531, 44.124053955078125, 46.22459411621094, 48.32513427734375, 50.42567443847656, 52.526214599609375, 54.62675476074219, 56.727294921875, 58.82783508300781, 60.928375244140625, 63.02891540527344, 65.12945556640625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 9.0, 5.0, 6.0, 10.0, 9.0, 19.0, 25.0, 20.0, 21.0, 31.0, 19.0, 21.0, 30.0, 26.0, 30.0, 30.0, 38.0, 33.0, 35.0, 47.0, 47.0, 41.0, 31.0, 42.0, 28.0, 30.0, 26.0, 24.0, 31.0, 22.0, 23.0, 22.0, 23.0, 26.0, 16.0, 12.0, 15.0, 9.0, 13.0, 7.0, 5.0, 10.0, 4.0, 3.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0], "bins": [-6.35546875, -6.16595458984375, -5.9764404296875, -5.78692626953125, -5.597412109375, -5.40789794921875, -5.2183837890625, -5.02886962890625, -4.83935546875, -4.64984130859375, -4.4603271484375, -4.27081298828125, -4.081298828125, -3.89178466796875, -3.7022705078125, -3.51275634765625, -3.3232421875, -3.13372802734375, -2.9442138671875, -2.75469970703125, -2.565185546875, -2.37567138671875, -2.1861572265625, -1.99664306640625, -1.80712890625, -1.61761474609375, -1.4281005859375, -1.23858642578125, -1.049072265625, -0.85955810546875, -0.6700439453125, -0.48052978515625, -0.291015625, -0.10150146484375, 0.0880126953125, 0.27752685546875, 0.467041015625, 0.65655517578125, 0.8460693359375, 1.03558349609375, 1.22509765625, 1.41461181640625, 1.6041259765625, 1.79364013671875, 1.983154296875, 2.17266845703125, 2.3621826171875, 2.55169677734375, 2.7412109375, 2.93072509765625, 3.1202392578125, 3.30975341796875, 3.499267578125, 3.68878173828125, 3.8782958984375, 4.06781005859375, 4.25732421875, 4.44683837890625, 4.6363525390625, 4.82586669921875, 5.015380859375, 5.20489501953125, 5.3944091796875, 5.58392333984375, 5.7734375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 11.0, 9.0, 4.0, 7.0, 11.0, 13.0, 21.0, 22.0, 20.0, 18.0, 28.0, 38.0, 43.0, 56.0, 109.0, 261.0, 718.0, 3344.0, 52477.0, 2282467.0, 1815702.0, 35080.0, 2593.0, 615.0, 220.0, 88.0, 45.0, 45.0, 17.0, 28.0, 27.0, 11.0, 24.0, 23.0, 16.0, 8.0, 15.0, 4.0, 8.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.3125, -24.56689453125, -23.8212890625, -23.07568359375, -22.330078125, -21.58447265625, -20.8388671875, -20.09326171875, -19.34765625, -18.60205078125, -17.8564453125, -17.11083984375, -16.365234375, -15.61962890625, -14.8740234375, -14.12841796875, -13.3828125, -12.63720703125, -11.8916015625, -11.14599609375, -10.400390625, -9.65478515625, -8.9091796875, -8.16357421875, -7.41796875, -6.67236328125, -5.9267578125, -5.18115234375, -4.435546875, -3.68994140625, -2.9443359375, -2.19873046875, -1.453125, -0.70751953125, 0.0380859375, 0.78369140625, 1.529296875, 2.27490234375, 3.0205078125, 3.76611328125, 4.51171875, 5.25732421875, 6.0029296875, 6.74853515625, 7.494140625, 8.23974609375, 8.9853515625, 9.73095703125, 10.4765625, 11.22216796875, 11.9677734375, 12.71337890625, 13.458984375, 14.20458984375, 14.9501953125, 15.69580078125, 16.44140625, 17.18701171875, 17.9326171875, 18.67822265625, 19.423828125, 20.16943359375, 20.9150390625, 21.66064453125, 22.40625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 2.0, 6.0, 12.0, 18.0, 25.0, 25.0, 45.0, 51.0, 59.0, 78.0, 132.0, 183.0, 264.0, 375.0, 439.0, 455.0, 476.0, 369.0, 273.0, 201.0, 164.0, 120.0, 86.0, 56.0, 34.0, 28.0, 26.0, 22.0, 12.0, 15.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.421875, -14.963623046875, -14.50537109375, -14.047119140625, -13.5888671875, -13.130615234375, -12.67236328125, -12.214111328125, -11.755859375, -11.297607421875, -10.83935546875, -10.381103515625, -9.9228515625, -9.464599609375, -9.00634765625, -8.548095703125, -8.08984375, -7.631591796875, -7.17333984375, -6.715087890625, -6.2568359375, -5.798583984375, -5.34033203125, -4.882080078125, -4.423828125, -3.965576171875, -3.50732421875, -3.049072265625, -2.5908203125, -2.132568359375, -1.67431640625, -1.216064453125, -0.7578125, -0.299560546875, 0.15869140625, 0.616943359375, 1.0751953125, 1.533447265625, 1.99169921875, 2.449951171875, 2.908203125, 3.366455078125, 3.82470703125, 4.282958984375, 4.7412109375, 5.199462890625, 5.65771484375, 6.115966796875, 6.57421875, 7.032470703125, 7.49072265625, 7.948974609375, 8.4072265625, 8.865478515625, 9.32373046875, 9.781982421875, 10.240234375, 10.698486328125, 11.15673828125, 11.614990234375, 12.0732421875, 12.531494140625, 12.98974609375, 13.447998046875, 13.90625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 5.0, 11.0, 20.0, 17.0, 26.0, 35.0, 38.0, 49.0, 59.0, 69.0, 110.0, 130.0, 204.0, 214.0, 333.0, 548.0, 1662.0, 220690.0, 3956637.0, 11069.0, 859.0, 403.0, 270.0, 187.0, 140.0, 92.0, 71.0, 67.0, 48.0, 44.0, 32.0, 35.0, 24.0, 17.0, 9.0, 16.0, 11.0, 8.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-67.0, -65.044921875, -63.08984375, -61.134765625, -59.1796875, -57.224609375, -55.26953125, -53.314453125, -51.359375, -49.404296875, -47.44921875, -45.494140625, -43.5390625, -41.583984375, -39.62890625, -37.673828125, -35.71875, -33.763671875, -31.80859375, -29.853515625, -27.8984375, -25.943359375, -23.98828125, -22.033203125, -20.078125, -18.123046875, -16.16796875, -14.212890625, -12.2578125, -10.302734375, -8.34765625, -6.392578125, -4.4375, -2.482421875, -0.52734375, 1.427734375, 3.3828125, 5.337890625, 7.29296875, 9.248046875, 11.203125, 13.158203125, 15.11328125, 17.068359375, 19.0234375, 20.978515625, 22.93359375, 24.888671875, 26.84375, 28.798828125, 30.75390625, 32.708984375, 34.6640625, 36.619140625, 38.57421875, 40.529296875, 42.484375, 44.439453125, 46.39453125, 48.349609375, 50.3046875, 52.259765625, 54.21484375, 56.169921875, 58.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 204.0, 678.0, 127.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-401.5618591308594, -390.8330383300781, -380.1042175292969, -369.3753662109375, -358.64654541015625, -347.917724609375, -337.18890380859375, -326.4600830078125, -315.73126220703125, -305.00244140625, -294.27362060546875, -283.5447998046875, -272.8159484863281, -262.0871276855469, -251.35830688476562, -240.62948608398438, -229.900634765625, -219.17181396484375, -208.44297790527344, -197.7141571044922, -186.98532104492188, -176.25650024414062, -165.52767944335938, -154.79885864257812, -144.0700225830078, -133.34120178222656, -122.61236572265625, -111.883544921875, -101.15471649169922, -90.42588806152344, -79.69706726074219, -68.9682388305664, -58.23944091796875, -47.51061248779297, -36.78178787231445, -26.052963256835938, -15.324134826660156, -4.595306396484375, 6.133514404296875, 16.862342834472656, 27.591171264648438, 38.31999969482422, 49.048824310302734, 59.77764892578125, 70.50647735595703, 81.23530578613281, 91.96412658691406, 102.69295501708984, 113.42178344726562, 124.1506118774414, 134.8794403076172, 145.60826110839844, 156.33709716796875, 167.06591796875, 177.79473876953125, 188.5235595703125, 199.2523956298828, 209.98121643066406, 220.71005249023438, 231.43887329101562, 242.16769409179688, 252.8965301513672, 263.6253662109375, 274.35418701171875, 285.0830078125]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 7.0, 15.0, 13.0, 14.0, 20.0, 23.0, 24.0, 19.0, 28.0, 37.0, 30.0, 31.0, 38.0, 38.0, 43.0, 56.0, 25.0, 57.0, 37.0, 41.0, 46.0, 28.0, 41.0, 36.0, 30.0, 18.0, 21.0, 31.0, 31.0, 17.0, 16.0, 14.0, 12.0, 8.0, 10.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-46.56011962890625, -45.138511657714844, -43.7169075012207, -42.2952995300293, -40.873695373535156, -39.45208740234375, -38.030479431152344, -36.6088752746582, -35.18727111816406, -33.765663146972656, -32.344058990478516, -30.92245101928711, -29.50084686279297, -28.079238891601562, -26.65763282775879, -25.236026763916016, -23.81441879272461, -22.392812728881836, -20.971206665039062, -19.549598693847656, -18.127994537353516, -16.70638656616211, -15.284780502319336, -13.863174438476562, -12.441568374633789, -11.019962310791016, -9.598356246948242, -8.176749229431152, -6.755143165588379, -5.3335371017456055, -3.9119300842285156, -2.490324020385742, -1.0687179565429688, 0.3528883457183838, 1.7744946479797363, 3.196101188659668, 4.617707252502441, 6.039313316345215, 7.460920333862305, 8.882526397705078, 10.304132461547852, 11.725738525390625, 13.147344589233398, 14.568951606750488, 15.990557670593262, 17.41216278076172, 18.833770751953125, 20.2553768157959, 21.676982879638672, 23.098588943481445, 24.52019500732422, 25.941802978515625, 27.363407135009766, 28.785015106201172, 30.206621170043945, 31.62822723388672, 33.049835205078125, 34.47144317626953, 35.89304733276367, 37.31465530395508, 38.73625946044922, 40.157867431640625, 41.57947540283203, 43.00107955932617, 44.42268371582031]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 6.0, 12.0, 11.0, 11.0, 13.0, 13.0, 19.0, 22.0, 23.0, 27.0, 25.0, 32.0, 22.0, 27.0, 37.0, 38.0, 52.0, 37.0, 48.0, 38.0, 47.0, 36.0, 45.0, 31.0, 34.0, 28.0, 32.0, 31.0, 27.0, 26.0, 18.0, 14.0, 24.0, 15.0, 9.0, 17.0, 12.0, 2.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.1453857421875, -5.943115234375, -5.7408447265625, -5.53857421875, -5.3363037109375, -5.134033203125, -4.9317626953125, -4.7294921875, -4.5272216796875, -4.324951171875, -4.1226806640625, -3.92041015625, -3.7181396484375, -3.515869140625, -3.3135986328125, -3.111328125, -2.9090576171875, -2.706787109375, -2.5045166015625, -2.30224609375, -2.0999755859375, -1.897705078125, -1.6954345703125, -1.4931640625, -1.2908935546875, -1.088623046875, -0.8863525390625, -0.68408203125, -0.4818115234375, -0.279541015625, -0.0772705078125, 0.125, 0.3272705078125, 0.529541015625, 0.7318115234375, 0.93408203125, 1.1363525390625, 1.338623046875, 1.5408935546875, 1.7431640625, 1.9454345703125, 2.147705078125, 2.3499755859375, 2.55224609375, 2.7545166015625, 2.956787109375, 3.1590576171875, 3.361328125, 3.5635986328125, 3.765869140625, 3.9681396484375, 4.17041015625, 4.3726806640625, 4.574951171875, 4.7772216796875, 4.9794921875, 5.1817626953125, 5.384033203125, 5.5863037109375, 5.78857421875, 5.9908447265625, 6.193115234375, 6.3953857421875, 6.59765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 7.0, 3.0, 6.0, 15.0, 22.0, 24.0, 44.0, 62.0, 97.0, 135.0, 213.0, 298.0, 412.0, 621.0, 862.0, 1325.0, 1979.0, 2855.0, 4173.0, 6228.0, 9422.0, 14571.0, 22277.0, 34406.0, 54101.0, 88463.0, 157372.0, 241166.0, 160647.0, 90469.0, 54829.0, 34624.0, 22562.0, 14749.0, 9731.0, 6531.0, 4249.0, 2893.0, 2009.0, 1270.0, 923.0, 613.0, 420.0, 292.0, 198.0, 133.0, 76.0, 57.0, 44.0, 23.0, 24.0, 19.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8647308349609375, -0.836395263671875, -0.8080596923828125, -0.77972412109375, -0.7513885498046875, -0.723052978515625, -0.6947174072265625, -0.6663818359375, -0.6380462646484375, -0.609710693359375, -0.5813751220703125, -0.55303955078125, -0.5247039794921875, -0.496368408203125, -0.4680328369140625, -0.439697265625, -0.4113616943359375, -0.383026123046875, -0.3546905517578125, -0.32635498046875, -0.2980194091796875, -0.269683837890625, -0.2413482666015625, -0.2130126953125, -0.1846771240234375, -0.156341552734375, -0.1280059814453125, -0.09967041015625, -0.0713348388671875, -0.042999267578125, -0.0146636962890625, 0.013671875, 0.0420074462890625, 0.070343017578125, 0.0986785888671875, 0.12701416015625, 0.1553497314453125, 0.183685302734375, 0.2120208740234375, 0.2403564453125, 0.2686920166015625, 0.297027587890625, 0.3253631591796875, 0.35369873046875, 0.3820343017578125, 0.410369873046875, 0.4387054443359375, 0.467041015625, 0.4953765869140625, 0.523712158203125, 0.5520477294921875, 0.58038330078125, 0.6087188720703125, 0.637054443359375, 0.6653900146484375, 0.6937255859375, 0.7220611572265625, 0.750396728515625, 0.7787322998046875, 0.80706787109375, 0.8354034423828125, 0.863739013671875, 0.8920745849609375, 0.92041015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 8.0, 12.0, 8.0, 8.0, 13.0, 17.0, 18.0, 16.0, 16.0, 23.0, 25.0, 23.0, 33.0, 28.0, 33.0, 35.0, 30.0, 36.0, 45.0, 35.0, 1068.0, 38.0, 34.0, 46.0, 26.0, 41.0, 38.0, 30.0, 24.0, 31.0, 35.0, 19.0, 22.0, 14.0, 12.0, 13.0, 17.0, 13.0, 6.0, 9.0, 6.0, 4.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.9453125, -3.81634521484375, -3.6873779296875, -3.55841064453125, -3.429443359375, -3.30047607421875, -3.1715087890625, -3.04254150390625, -2.91357421875, -2.78460693359375, -2.6556396484375, -2.52667236328125, -2.397705078125, -2.26873779296875, -2.1397705078125, -2.01080322265625, -1.8818359375, -1.75286865234375, -1.6239013671875, -1.49493408203125, -1.365966796875, -1.23699951171875, -1.1080322265625, -0.97906494140625, -0.85009765625, -0.72113037109375, -0.5921630859375, -0.46319580078125, -0.334228515625, -0.20526123046875, -0.0762939453125, 0.05267333984375, 0.181640625, 0.31060791015625, 0.4395751953125, 0.56854248046875, 0.697509765625, 0.82647705078125, 0.9554443359375, 1.08441162109375, 1.21337890625, 1.34234619140625, 1.4713134765625, 1.60028076171875, 1.729248046875, 1.85821533203125, 1.9871826171875, 2.11614990234375, 2.2451171875, 2.37408447265625, 2.5030517578125, 2.63201904296875, 2.760986328125, 2.88995361328125, 3.0189208984375, 3.14788818359375, 3.27685546875, 3.40582275390625, 3.5347900390625, 3.66375732421875, 3.792724609375, 3.92169189453125, 4.0506591796875, 4.17962646484375, 4.30859375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 15.0, 18.0, 28.0, 37.0, 58.0, 78.0, 122.0, 160.0, 249.0, 349.0, 499.0, 746.0, 1078.0, 1672.0, 2296.0, 3432.0, 4955.0, 7335.0, 10886.0, 16136.0, 25412.0, 40994.0, 66807.0, 114289.0, 204237.0, 1271100.0, 125743.0, 72803.0, 44340.0, 27524.0, 17688.0, 11611.0, 7836.0, 5216.0, 3604.0, 2397.0, 1712.0, 1118.0, 772.0, 555.0, 371.0, 240.0, 188.0, 124.0, 105.0, 55.0, 46.0, 27.0, 23.0, 16.0, 8.0, 9.0, 6.0, 1.0, 2.0], "bins": [-0.93896484375, -0.9114151000976562, -0.8838653564453125, -0.8563156127929688, -0.828765869140625, -0.8012161254882812, -0.7736663818359375, -0.7461166381835938, -0.71856689453125, -0.6910171508789062, -0.6634674072265625, -0.6359176635742188, -0.608367919921875, -0.5808181762695312, -0.5532684326171875, -0.5257186889648438, -0.4981689453125, -0.47061920166015625, -0.4430694580078125, -0.41551971435546875, -0.387969970703125, -0.36042022705078125, -0.3328704833984375, -0.30532073974609375, -0.27777099609375, -0.25022125244140625, -0.2226715087890625, -0.19512176513671875, -0.167572021484375, -0.14002227783203125, -0.1124725341796875, -0.08492279052734375, -0.057373046875, -0.02982330322265625, -0.0022735595703125, 0.02527618408203125, 0.052825927734375, 0.08037567138671875, 0.1079254150390625, 0.13547515869140625, 0.16302490234375, 0.19057464599609375, 0.2181243896484375, 0.24567413330078125, 0.273223876953125, 0.30077362060546875, 0.3283233642578125, 0.35587310791015625, 0.3834228515625, 0.41097259521484375, 0.4385223388671875, 0.46607208251953125, 0.493621826171875, 0.5211715698242188, 0.5487213134765625, 0.5762710571289062, 0.60382080078125, 0.6313705444335938, 0.6589202880859375, 0.6864700317382812, 0.714019775390625, 0.7415695190429688, 0.7691192626953125, 0.7966690063476562, 0.82421875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 8.0, 5.0, 14.0, 12.0, 13.0, 12.0, 19.0, 34.0, 40.0, 40.0, 51.0, 50.0, 73.0, 80.0, 77.0, 76.0, 65.0, 54.0, 40.0, 34.0, 37.0, 34.0, 17.0, 17.0, 9.0, 18.0, 14.0, 10.0, 4.0, 8.0, 6.0, 3.0, 5.0, 8.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0009431838989257812, -0.0009174048900604248, -0.0008916258811950684, -0.0008658468723297119, -0.0008400678634643555, -0.000814288854598999, -0.0007885098457336426, -0.0007627308368682861, -0.0007369518280029297, -0.0007111728191375732, -0.0006853938102722168, -0.0006596148014068604, -0.0006338357925415039, -0.0006080567836761475, -0.000582277774810791, -0.0005564987659454346, -0.0005307197570800781, -0.0005049407482147217, -0.00047916173934936523, -0.0004533827304840088, -0.00042760372161865234, -0.0004018247127532959, -0.00037604570388793945, -0.000350266695022583, -0.00032448768615722656, -0.0002987086772918701, -0.00027292966842651367, -0.0002471506595611572, -0.00022137165069580078, -0.00019559264183044434, -0.0001698136329650879, -0.00014403462409973145, -0.000118255615234375, -9.247660636901855e-05, -6.669759750366211e-05, -4.0918588638305664e-05, -1.5139579772949219e-05, 1.0639429092407227e-05, 3.641843795776367e-05, 6.219744682312012e-05, 8.797645568847656e-05, 0.00011375546455383301, 0.00013953447341918945, 0.0001653134822845459, 0.00019109249114990234, 0.0002168715000152588, 0.00024265050888061523, 0.0002684295177459717, 0.0002942085266113281, 0.00031998753547668457, 0.000345766544342041, 0.00037154555320739746, 0.0003973245620727539, 0.00042310357093811035, 0.0004488825798034668, 0.00047466158866882324, 0.0005004405975341797, 0.0005262196063995361, 0.0005519986152648926, 0.000577777624130249, 0.0006035566329956055, 0.0006293356418609619, 0.0006551146507263184, 0.0006808936595916748, 0.0007066726684570312]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 8.0, 4.0, 5.0, 13.0, 13.0, 14.0, 10.0, 20.0, 26.0, 35.0, 42.0, 49.0, 69.0, 128.0, 217.0, 495.0, 1865.0, 898333.0, 145092.0, 1116.0, 379.0, 226.0, 100.0, 83.0, 54.0, 39.0, 22.0, 21.0, 17.0, 8.0, 18.0, 5.0, 10.0, 6.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016143798828125, -0.015542745590209961, -0.014941692352294922, -0.014340639114379883, -0.013739585876464844, -0.013138532638549805, -0.012537479400634766, -0.011936426162719727, -0.011335372924804688, -0.010734319686889648, -0.01013326644897461, -0.00953221321105957, -0.008931159973144531, -0.008330106735229492, -0.007729053497314453, -0.007128000259399414, -0.006526947021484375, -0.005925893783569336, -0.005324840545654297, -0.004723787307739258, -0.004122734069824219, -0.0035216808319091797, -0.0029206275939941406, -0.0023195743560791016, -0.0017185211181640625, -0.0011174678802490234, -0.0005164146423339844, 8.463859558105469e-05, 0.0006856918334960938, 0.0012867450714111328, 0.0018877983093261719, 0.002488851547241211, 0.00308990478515625, 0.003690958023071289, 0.004292011260986328, 0.004893064498901367, 0.005494117736816406, 0.006095170974731445, 0.006696224212646484, 0.0072972774505615234, 0.007898330688476562, 0.008499383926391602, 0.00910043716430664, 0.00970149040222168, 0.010302543640136719, 0.010903596878051758, 0.011504650115966797, 0.012105703353881836, 0.012706756591796875, 0.013307809829711914, 0.013908863067626953, 0.014509916305541992, 0.015110969543457031, 0.01571202278137207, 0.01631307601928711, 0.01691412925720215, 0.017515182495117188, 0.018116235733032227, 0.018717288970947266, 0.019318342208862305, 0.019919395446777344, 0.020520448684692383, 0.021121501922607422, 0.02172255516052246, 0.0223236083984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 27.0, 71.0, 173.0, 238.0, 222.0, 139.0, 83.0, 31.0, 14.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008538862457498908, -0.0008196478011086583, -0.0007854094146750867, -0.0007511709700338542, -0.0007169325253926218, -0.0006826941389590502, -0.0006484556943178177, -0.0006142172496765852, -0.0005799788050353527, -0.0005457403603941202, -0.0005115019739605486, -0.00047726352931931615, -0.00044302508467808366, -0.0004087866691406816, -0.0003745482536032796, -0.0003403098089620471, -0.0003060714225284755, -0.0002718330069910735, -0.000237594562349841, -0.00020335614681243896, -0.0001691177167231217, -0.00013487928663380444, -0.0001006408710964024, -6.640244100708514e-05, -3.216401091776788e-05, 2.0744155335705727e-06, 3.631284198490903e-05, 7.055126479826868e-05, 0.00010478969488758594, 0.0001390281249769032, 0.00017326654051430523, 0.0002075049706036225, 0.00024174340069293976, 0.0002759818162303418, 0.0003102202608715743, 0.0003444586764089763, 0.0003786971210502088, 0.00041293553658761084, 0.0004471739521250129, 0.00048141239676624537, 0.0005156508414074779, 0.0005498892860487103, 0.0005841276724822819, 0.0006183661171235144, 0.0006526045617647469, 0.0006868429481983185, 0.000721081392839551, 0.0007553198374807835, 0.000789558223914355, 0.0008237966685555875, 0.0008580350549891591, 0.0008922734996303916, 0.0009265119442716241, 0.0009607503889128566, 0.0009949887171387672, 0.0010292271617799997, 0.0010634656064212322, 0.0010977040510624647, 0.0011319424957036972, 0.0011661809403449297, 0.0012004192685708404, 0.0012346577132120728, 0.0012688961578533053, 0.0013031346024945378, 0.0013373730471357703]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 4.0, 2.0, 4.0, 12.0, 8.0, 10.0, 19.0, 26.0, 17.0, 32.0, 20.0, 28.0, 41.0, 41.0, 44.0, 37.0, 51.0, 49.0, 46.0, 29.0, 36.0, 53.0, 36.0, 23.0, 42.0, 39.0, 41.0, 29.0, 38.0, 18.0, 27.0, 22.0, 7.0, 16.0, 9.0, 9.0, 7.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004254579544067383, -0.00041246507316827774, -0.0003994721919298172, -0.00038647931069135666, -0.0003734864294528961, -0.0003604935482144356, -0.00034750066697597504, -0.0003345077857375145, -0.00032151490449905396, -0.0003085220232605934, -0.0002955291420221329, -0.00028253626078367233, -0.0002695433795452118, -0.00025655049830675125, -0.0002435576170682907, -0.00023056473582983017, -0.00021757185459136963, -0.0002045789733529091, -0.00019158609211444855, -0.000178593210875988, -0.00016560032963752747, -0.00015260744839906693, -0.00013961456716060638, -0.00012662168592214584, -0.0001136288046836853, -0.00010063592344522476, -8.764304220676422e-05, -7.465016096830368e-05, -6.165727972984314e-05, -4.86643984913826e-05, -3.567151725292206e-05, -2.2678636014461517e-05, -9.685754776000977e-06, 3.307126462459564e-06, 1.6300007700920105e-05, 2.9292888939380646e-05, 4.2285770177841187e-05, 5.527865141630173e-05, 6.827153265476227e-05, 8.126441389322281e-05, 9.425729513168335e-05, 0.00010725017637014389, 0.00012024305760860443, 0.00013323593884706497, 0.0001462288200855255, 0.00015922170132398605, 0.0001722145825624466, 0.00018520746380090714, 0.00019820034503936768, 0.00021119322627782822, 0.00022418610751628876, 0.0002371789887547493, 0.00025017186999320984, 0.0002631647512316704, 0.0002761576324701309, 0.00028915051370859146, 0.000302143394947052, 0.00031513627618551254, 0.0003281291574239731, 0.0003411220386624336, 0.00035411491990089417, 0.0003671078011393547, 0.00038010068237781525, 0.0003930935636162758, 0.00040608644485473633]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 6.0, 12.0, 11.0, 11.0, 13.0, 13.0, 19.0, 22.0, 23.0, 27.0, 25.0, 32.0, 22.0, 27.0, 37.0, 38.0, 52.0, 37.0, 48.0, 38.0, 47.0, 36.0, 45.0, 31.0, 34.0, 28.0, 32.0, 31.0, 27.0, 26.0, 18.0, 14.0, 24.0, 15.0, 9.0, 17.0, 12.0, 2.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.1453857421875, -5.943115234375, -5.7408447265625, -5.53857421875, -5.3363037109375, -5.134033203125, -4.9317626953125, -4.7294921875, -4.5272216796875, -4.324951171875, -4.1226806640625, -3.92041015625, -3.7181396484375, -3.515869140625, -3.3135986328125, -3.111328125, -2.9090576171875, -2.706787109375, -2.5045166015625, -2.30224609375, -2.0999755859375, -1.897705078125, -1.6954345703125, -1.4931640625, -1.2908935546875, -1.088623046875, -0.8863525390625, -0.68408203125, -0.4818115234375, -0.279541015625, -0.0772705078125, 0.125, 0.3272705078125, 0.529541015625, 0.7318115234375, 0.93408203125, 1.1363525390625, 1.338623046875, 1.5408935546875, 1.7431640625, 1.9454345703125, 2.147705078125, 2.3499755859375, 2.55224609375, 2.7545166015625, 2.956787109375, 3.1590576171875, 3.361328125, 3.5635986328125, 3.765869140625, 3.9681396484375, 4.17041015625, 4.3726806640625, 4.574951171875, 4.7772216796875, 4.9794921875, 5.1817626953125, 5.384033203125, 5.5863037109375, 5.78857421875, 5.9908447265625, 6.193115234375, 6.3953857421875, 6.59765625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 16.0, 16.0, 21.0, 28.0, 39.0, 87.0, 99.0, 140.0, 241.0, 391.0, 602.0, 1051.0, 1849.0, 3541.0, 7350.0, 16840.0, 42698.0, 123980.0, 390116.0, 302704.0, 95459.0, 34321.0, 13585.0, 6271.0, 3109.0, 1574.0, 918.0, 549.0, 342.0, 226.0, 140.0, 83.0, 57.0, 35.0, 23.0, 29.0, 6.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.85076904296875, -5.6781005859375, -5.50543212890625, -5.332763671875, -5.16009521484375, -4.9874267578125, -4.81475830078125, -4.64208984375, -4.46942138671875, -4.2967529296875, -4.12408447265625, -3.951416015625, -3.77874755859375, -3.6060791015625, -3.43341064453125, -3.2607421875, -3.08807373046875, -2.9154052734375, -2.74273681640625, -2.570068359375, -2.39739990234375, -2.2247314453125, -2.05206298828125, -1.87939453125, -1.70672607421875, -1.5340576171875, -1.36138916015625, -1.188720703125, -1.01605224609375, -0.8433837890625, -0.67071533203125, -0.498046875, -0.32537841796875, -0.1527099609375, 0.01995849609375, 0.192626953125, 0.36529541015625, 0.5379638671875, 0.71063232421875, 0.88330078125, 1.05596923828125, 1.2286376953125, 1.40130615234375, 1.573974609375, 1.74664306640625, 1.9193115234375, 2.09197998046875, 2.2646484375, 2.43731689453125, 2.6099853515625, 2.78265380859375, 2.955322265625, 3.12799072265625, 3.3006591796875, 3.47332763671875, 3.64599609375, 3.81866455078125, 3.9913330078125, 4.16400146484375, 4.336669921875, 4.50933837890625, 4.6820068359375, 4.85467529296875, 5.02734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 8.0, 6.0, 7.0, 9.0, 10.0, 14.0, 10.0, 12.0, 16.0, 16.0, 34.0, 22.0, 35.0, 37.0, 35.0, 40.0, 42.0, 46.0, 87.0, 233.0, 1669.0, 170.0, 80.0, 53.0, 53.0, 42.0, 28.0, 42.0, 26.0, 25.0, 29.0, 24.0, 17.0, 12.0, 14.0, 10.0, 6.0, 5.0, 4.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.125, -24.41455078125, -23.7041015625, -22.99365234375, -22.283203125, -21.57275390625, -20.8623046875, -20.15185546875, -19.44140625, -18.73095703125, -18.0205078125, -17.31005859375, -16.599609375, -15.88916015625, -15.1787109375, -14.46826171875, -13.7578125, -13.04736328125, -12.3369140625, -11.62646484375, -10.916015625, -10.20556640625, -9.4951171875, -8.78466796875, -8.07421875, -7.36376953125, -6.6533203125, -5.94287109375, -5.232421875, -4.52197265625, -3.8115234375, -3.10107421875, -2.390625, -1.68017578125, -0.9697265625, -0.25927734375, 0.451171875, 1.16162109375, 1.8720703125, 2.58251953125, 3.29296875, 4.00341796875, 4.7138671875, 5.42431640625, 6.134765625, 6.84521484375, 7.5556640625, 8.26611328125, 8.9765625, 9.68701171875, 10.3974609375, 11.10791015625, 11.818359375, 12.52880859375, 13.2392578125, 13.94970703125, 14.66015625, 15.37060546875, 16.0810546875, 16.79150390625, 17.501953125, 18.21240234375, 18.9228515625, 19.63330078125, 20.34375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 13.0, 23.0, 18.0, 40.0, 53.0, 97.0, 135.0, 194.0, 270.0, 489.0, 1424.0, 2655421.0, 485123.0, 1104.0, 418.0, 274.0, 197.0, 112.0, 74.0, 62.0, 50.0, 27.0, 23.0, 15.0, 10.0, 10.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-93.75, -91.212890625, -88.67578125, -86.138671875, -83.6015625, -81.064453125, -78.52734375, -75.990234375, -73.453125, -70.916015625, -68.37890625, -65.841796875, -63.3046875, -60.767578125, -58.23046875, -55.693359375, -53.15625, -50.619140625, -48.08203125, -45.544921875, -43.0078125, -40.470703125, -37.93359375, -35.396484375, -32.859375, -30.322265625, -27.78515625, -25.248046875, -22.7109375, -20.173828125, -17.63671875, -15.099609375, -12.5625, -10.025390625, -7.48828125, -4.951171875, -2.4140625, 0.123046875, 2.66015625, 5.197265625, 7.734375, 10.271484375, 12.80859375, 15.345703125, 17.8828125, 20.419921875, 22.95703125, 25.494140625, 28.03125, 30.568359375, 33.10546875, 35.642578125, 38.1796875, 40.716796875, 43.25390625, 45.791015625, 48.328125, 50.865234375, 53.40234375, 55.939453125, 58.4765625, 61.013671875, 63.55078125, 66.087890625, 68.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 86.0, 566.0, 320.0, 38.0, 6.0], "bins": [-228.25588989257812, -224.502197265625, -220.7484893798828, -216.9947967529297, -213.2410888671875, -209.48739624023438, -205.73370361328125, -201.97999572753906, -198.22630310058594, -194.4726104736328, -190.71890258789062, -186.9652099609375, -183.2115020751953, -179.4578094482422, -175.7041015625, -171.95040893554688, -168.19671630859375, -164.44302368164062, -160.68931579589844, -156.9356231689453, -153.18191528320312, -149.42822265625, -145.67453002929688, -141.9208221435547, -138.1671142578125, -134.41342163085938, -130.6597137451172, -126.90602111816406, -123.1523208618164, -119.39862060546875, -115.6449203491211, -111.89122009277344, -108.13752746582031, -104.38382720947266, -100.630126953125, -96.87643432617188, -93.12273406982422, -89.36903381347656, -85.6153335571289, -81.86163330078125, -78.1079330444336, -74.35423278808594, -70.60053253173828, -66.84683227539062, -63.0931396484375, -59.339439392089844, -55.58573913574219, -51.83203887939453, -48.07834243774414, -44.324642181396484, -40.570945739746094, -36.81724548339844, -33.06354522705078, -29.30984878540039, -25.556148529052734, -21.80245018005371, -18.048751831054688, -14.295053482055664, -10.541354179382324, -6.787654876708984, -3.033956527709961, 0.7197418212890625, 4.473442077636719, 8.227140426635742, 11.98083782196045]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 8.0, 15.0, 8.0, 16.0, 15.0, 23.0, 21.0, 16.0, 20.0, 37.0, 24.0, 28.0, 26.0, 30.0, 36.0, 38.0, 43.0, 47.0, 43.0, 28.0, 34.0, 44.0, 24.0, 42.0, 37.0, 34.0, 29.0, 35.0, 22.0, 22.0, 28.0, 16.0, 21.0, 15.0, 15.0, 6.0, 9.0, 6.0, 7.0, 4.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-56.03406524658203, -54.16773986816406, -52.30141830444336, -50.43509292602539, -48.56876754760742, -46.70244598388672, -44.83612060546875, -42.96979522705078, -41.10346984863281, -39.237144470214844, -37.37082290649414, -35.50449752807617, -33.6381721496582, -31.771848678588867, -29.90552520751953, -28.039199829101562, -26.172876358032227, -24.30655288696289, -22.440227508544922, -20.573904037475586, -18.707578659057617, -16.84125518798828, -14.974930763244629, -13.108606338500977, -11.242281913757324, -9.375957489013672, -7.5096330642700195, -5.643309116363525, -3.776984691619873, -1.910660743713379, -0.04433631896972656, 1.8219881057739258, 3.688312530517578, 5.5546369552612305, 7.420961380004883, 9.287284851074219, 11.153610229492188, 13.019933700561523, 14.886258125305176, 16.752582550048828, 18.618907928466797, 20.485231399536133, 22.3515567779541, 24.217880249023438, 26.084205627441406, 27.950529098510742, 29.816852569580078, 31.683177947998047, 33.54949951171875, 35.41582489013672, 37.28214645385742, 39.14847183227539, 41.01479721069336, 42.88111877441406, 44.74744415283203, 46.61376953125, 48.48009490966797, 50.34642028808594, 52.21274185180664, 54.07906723022461, 55.94539260864258, 57.81171417236328, 59.67803955078125, 61.54436492919922, 63.41069030761719]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 11.0, 10.0, 10.0, 17.0, 13.0, 13.0, 20.0, 21.0, 25.0, 24.0, 25.0, 26.0, 36.0, 31.0, 26.0, 47.0, 36.0, 44.0, 43.0, 48.0, 51.0, 41.0, 39.0, 36.0, 26.0, 36.0, 32.0, 25.0, 24.0, 32.0, 17.0, 11.0, 14.0, 17.0, 12.0, 17.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.31427001953125, -6.0972900390625, -5.88031005859375, -5.663330078125, -5.44635009765625, -5.2293701171875, -5.01239013671875, -4.79541015625, -4.57843017578125, -4.3614501953125, -4.14447021484375, -3.927490234375, -3.71051025390625, -3.4935302734375, -3.27655029296875, -3.0595703125, -2.84259033203125, -2.6256103515625, -2.40863037109375, -2.191650390625, -1.97467041015625, -1.7576904296875, -1.54071044921875, -1.32373046875, -1.10675048828125, -0.8897705078125, -0.67279052734375, -0.455810546875, -0.23883056640625, -0.0218505859375, 0.19512939453125, 0.412109375, 0.62908935546875, 0.8460693359375, 1.06304931640625, 1.280029296875, 1.49700927734375, 1.7139892578125, 1.93096923828125, 2.14794921875, 2.36492919921875, 2.5819091796875, 2.79888916015625, 3.015869140625, 3.23284912109375, 3.4498291015625, 3.66680908203125, 3.8837890625, 4.10076904296875, 4.3177490234375, 4.53472900390625, 4.751708984375, 4.96868896484375, 5.1856689453125, 5.40264892578125, 5.61962890625, 5.83660888671875, 6.0535888671875, 6.27056884765625, 6.487548828125, 6.70452880859375, 6.9215087890625, 7.13848876953125, 7.35546875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 16.0, 17.0, 11.0, 12.0, 14.0, 20.0, 30.0, 30.0, 48.0, 63.0, 79.0, 148.0, 230.0, 589.0, 1791.0, 10489.0, 164380.0, 2238392.0, 1680218.0, 88372.0, 6813.0, 1342.0, 464.0, 216.0, 120.0, 71.0, 55.0, 47.0, 32.0, 24.0, 18.0, 20.0, 14.0, 14.0, 8.0, 11.0, 10.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.859375, -15.310791015625, -14.76220703125, -14.213623046875, -13.6650390625, -13.116455078125, -12.56787109375, -12.019287109375, -11.470703125, -10.922119140625, -10.37353515625, -9.824951171875, -9.2763671875, -8.727783203125, -8.17919921875, -7.630615234375, -7.08203125, -6.533447265625, -5.98486328125, -5.436279296875, -4.8876953125, -4.339111328125, -3.79052734375, -3.241943359375, -2.693359375, -2.144775390625, -1.59619140625, -1.047607421875, -0.4990234375, 0.049560546875, 0.59814453125, 1.146728515625, 1.6953125, 2.243896484375, 2.79248046875, 3.341064453125, 3.8896484375, 4.438232421875, 4.98681640625, 5.535400390625, 6.083984375, 6.632568359375, 7.18115234375, 7.729736328125, 8.2783203125, 8.826904296875, 9.37548828125, 9.924072265625, 10.47265625, 11.021240234375, 11.56982421875, 12.118408203125, 12.6669921875, 13.215576171875, 13.76416015625, 14.312744140625, 14.861328125, 15.409912109375, 15.95849609375, 16.507080078125, 17.0556640625, 17.604248046875, 18.15283203125, 18.701416015625, 19.25]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 13.0, 10.0, 17.0, 24.0, 27.0, 48.0, 70.0, 100.0, 114.0, 207.0, 261.0, 406.0, 496.0, 533.0, 490.0, 334.0, 298.0, 168.0, 123.0, 104.0, 67.0, 41.0, 47.0, 22.0, 14.0, 13.0, 12.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.1024169921875, -14.587646484375, -14.0728759765625, -13.55810546875, -13.0433349609375, -12.528564453125, -12.0137939453125, -11.4990234375, -10.9842529296875, -10.469482421875, -9.9547119140625, -9.43994140625, -8.9251708984375, -8.410400390625, -7.8956298828125, -7.380859375, -6.8660888671875, -6.351318359375, -5.8365478515625, -5.32177734375, -4.8070068359375, -4.292236328125, -3.7774658203125, -3.2626953125, -2.7479248046875, -2.233154296875, -1.7183837890625, -1.20361328125, -0.6888427734375, -0.174072265625, 0.3406982421875, 0.85546875, 1.3702392578125, 1.885009765625, 2.3997802734375, 2.91455078125, 3.4293212890625, 3.944091796875, 4.4588623046875, 4.9736328125, 5.4884033203125, 6.003173828125, 6.5179443359375, 7.03271484375, 7.5474853515625, 8.062255859375, 8.5770263671875, 9.091796875, 9.6065673828125, 10.121337890625, 10.6361083984375, 11.15087890625, 11.6656494140625, 12.180419921875, 12.6951904296875, 13.2099609375, 13.7247314453125, 14.239501953125, 14.7542724609375, 15.26904296875, 15.7838134765625, 16.298583984375, 16.8133544921875, 17.328125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 6.0, 9.0, 17.0, 32.0, 23.0, 34.0, 39.0, 54.0, 66.0, 108.0, 106.0, 168.0, 180.0, 261.0, 483.0, 1086.0, 43256.0, 4124590.0, 21383.0, 918.0, 421.0, 235.0, 186.0, 129.0, 89.0, 89.0, 73.0, 43.0, 50.0, 37.0, 13.0, 16.0, 15.0, 11.0, 6.0, 11.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-70.0, -67.8427734375, -65.685546875, -63.5283203125, -61.37109375, -59.2138671875, -57.056640625, -54.8994140625, -52.7421875, -50.5849609375, -48.427734375, -46.2705078125, -44.11328125, -41.9560546875, -39.798828125, -37.6416015625, -35.484375, -33.3271484375, -31.169921875, -29.0126953125, -26.85546875, -24.6982421875, -22.541015625, -20.3837890625, -18.2265625, -16.0693359375, -13.912109375, -11.7548828125, -9.59765625, -7.4404296875, -5.283203125, -3.1259765625, -0.96875, 1.1884765625, 3.345703125, 5.5029296875, 7.66015625, 9.8173828125, 11.974609375, 14.1318359375, 16.2890625, 18.4462890625, 20.603515625, 22.7607421875, 24.91796875, 27.0751953125, 29.232421875, 31.3896484375, 33.546875, 35.7041015625, 37.861328125, 40.0185546875, 42.17578125, 44.3330078125, 46.490234375, 48.6474609375, 50.8046875, 52.9619140625, 55.119140625, 57.2763671875, 59.43359375, 61.5908203125, 63.748046875, 65.9052734375, 68.0625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 14.0, 29.0, 48.0, 83.0, 136.0, 176.0, 192.0, 153.0, 78.0, 48.0, 31.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.90583801269531, -54.511817932128906, -52.117794036865234, -49.72377395629883, -47.329750061035156, -44.93572998046875, -42.541709899902344, -40.14768981933594, -37.753665924072266, -35.35964584350586, -32.96562194824219, -30.57160186767578, -28.177579879760742, -25.783557891845703, -23.389537811279297, -20.995515823364258, -18.60149383544922, -16.20747184753418, -13.813450813293457, -11.419429779052734, -9.025407791137695, -6.631385803222656, -4.237364768981934, -1.843343734741211, 0.5506782531738281, 2.944699764251709, 5.33872127532959, 7.732742786407471, 10.126764297485352, 12.52078628540039, 14.914807319641113, 17.308828353881836, 19.702842712402344, 22.096864700317383, 24.490886688232422, 26.884906768798828, 29.278928756713867, 31.672950744628906, 34.06697082519531, 36.46099090576172, 38.85501480102539, 41.2490348815918, 43.64305877685547, 46.037078857421875, 48.43109893798828, 50.82512283325195, 53.21914291381836, 55.61316680908203, 58.00718688964844, 60.401206970214844, 62.795230865478516, 65.18925476074219, 67.5832748413086, 69.977294921875, 72.3713150024414, 74.76533508300781, 77.15936279296875, 79.55338287353516, 81.94740295410156, 84.3414306640625, 86.7354507446289, 89.12947082519531, 91.52349090576172, 93.91751098632812, 96.31153106689453]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 10.0, 4.0, 7.0, 14.0, 6.0, 10.0, 12.0, 15.0, 14.0, 14.0, 15.0, 22.0, 22.0, 19.0, 33.0, 34.0, 31.0, 46.0, 38.0, 47.0, 36.0, 34.0, 34.0, 38.0, 32.0, 37.0, 37.0, 29.0, 23.0, 31.0, 36.0, 27.0, 28.0, 23.0, 19.0, 15.0, 15.0, 19.0, 8.0, 17.0, 12.0, 4.0, 12.0, 8.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-42.838348388671875, -41.569488525390625, -40.30063247680664, -39.031776428222656, -37.762916564941406, -36.494056701660156, -35.22520065307617, -33.95634460449219, -32.68748474121094, -31.41862678527832, -30.149768829345703, -28.880910873413086, -27.61205291748047, -26.34319496154785, -25.074337005615234, -23.805479049682617, -22.53662109375, -21.267763137817383, -19.998905181884766, -18.73004722595215, -17.46118927001953, -16.192331314086914, -14.923473358154297, -13.65461540222168, -12.385757446289062, -11.116899490356445, -9.848041534423828, -8.579183578491211, -7.310325622558594, -6.041467666625977, -4.772609710693359, -3.503751754760742, -2.234893798828125, -0.9660358428955078, 0.3028221130371094, 1.5716800689697266, 2.8405380249023438, 4.109395980834961, 5.378253936767578, 6.647111892700195, 7.9159698486328125, 9.18482780456543, 10.453685760498047, 11.722543716430664, 12.991401672363281, 14.260259628295898, 15.529117584228516, 16.797975540161133, 18.06683349609375, 19.335691452026367, 20.604549407958984, 21.8734073638916, 23.14226531982422, 24.411123275756836, 25.679981231689453, 26.94883918762207, 28.217697143554688, 29.486555099487305, 30.755413055419922, 32.024269104003906, 33.293128967285156, 34.561988830566406, 35.83084487915039, 37.099700927734375, 38.368560791015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 9.0, 9.0, 9.0, 10.0, 15.0, 10.0, 15.0, 8.0, 21.0, 28.0, 24.0, 22.0, 28.0, 27.0, 30.0, 33.0, 43.0, 42.0, 39.0, 45.0, 36.0, 46.0, 38.0, 41.0, 39.0, 21.0, 27.0, 31.0, 26.0, 25.0, 27.0, 15.0, 14.0, 23.0, 22.0, 18.0, 18.0, 6.0, 8.0, 12.0, 6.0, 9.0, 5.0, 8.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.4140625, -6.21856689453125, -6.0230712890625, -5.82757568359375, -5.632080078125, -5.43658447265625, -5.2410888671875, -5.04559326171875, -4.85009765625, -4.65460205078125, -4.4591064453125, -4.26361083984375, -4.068115234375, -3.87261962890625, -3.6771240234375, -3.48162841796875, -3.2861328125, -3.09063720703125, -2.8951416015625, -2.69964599609375, -2.504150390625, -2.30865478515625, -2.1131591796875, -1.91766357421875, -1.72216796875, -1.52667236328125, -1.3311767578125, -1.13568115234375, -0.940185546875, -0.74468994140625, -0.5491943359375, -0.35369873046875, -0.158203125, 0.03729248046875, 0.2327880859375, 0.42828369140625, 0.623779296875, 0.81927490234375, 1.0147705078125, 1.21026611328125, 1.40576171875, 1.60125732421875, 1.7967529296875, 1.99224853515625, 2.187744140625, 2.38323974609375, 2.5787353515625, 2.77423095703125, 2.9697265625, 3.16522216796875, 3.3607177734375, 3.55621337890625, 3.751708984375, 3.94720458984375, 4.1427001953125, 4.33819580078125, 4.53369140625, 4.72918701171875, 4.9246826171875, 5.12017822265625, 5.315673828125, 5.51116943359375, 5.7066650390625, 5.90216064453125, 6.09765625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 6.0, 17.0, 21.0, 31.0, 40.0, 76.0, 98.0, 146.0, 219.0, 366.0, 565.0, 830.0, 1343.0, 1986.0, 3228.0, 5024.0, 7914.0, 12724.0, 20166.0, 32853.0, 53796.0, 92283.0, 176035.0, 273240.0, 153975.0, 83070.0, 48774.0, 29736.0, 18356.0, 11511.0, 7263.0, 4578.0, 2901.0, 1890.0, 1182.0, 783.0, 533.0, 335.0, 220.0, 121.0, 102.0, 70.0, 40.0, 27.0, 28.0, 19.0, 10.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0201568603515625, -0.986602783203125, -0.9530487060546875, -0.91949462890625, -0.8859405517578125, -0.852386474609375, -0.8188323974609375, -0.7852783203125, -0.7517242431640625, -0.718170166015625, -0.6846160888671875, -0.65106201171875, -0.6175079345703125, -0.583953857421875, -0.5503997802734375, -0.516845703125, -0.4832916259765625, -0.449737548828125, -0.4161834716796875, -0.38262939453125, -0.3490753173828125, -0.315521240234375, -0.2819671630859375, -0.2484130859375, -0.2148590087890625, -0.181304931640625, -0.1477508544921875, -0.11419677734375, -0.0806427001953125, -0.047088623046875, -0.0135345458984375, 0.02001953125, 0.0535736083984375, 0.087127685546875, 0.1206817626953125, 0.15423583984375, 0.1877899169921875, 0.221343994140625, 0.2548980712890625, 0.2884521484375, 0.3220062255859375, 0.355560302734375, 0.3891143798828125, 0.42266845703125, 0.4562225341796875, 0.489776611328125, 0.5233306884765625, 0.556884765625, 0.5904388427734375, 0.623992919921875, 0.6575469970703125, 0.69110107421875, 0.7246551513671875, 0.758209228515625, 0.7917633056640625, 0.8253173828125, 0.8588714599609375, 0.892425537109375, 0.9259796142578125, 0.95953369140625, 0.9930877685546875, 1.026641845703125, 1.0601959228515625, 1.09375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 14.0, 11.0, 15.0, 14.0, 12.0, 23.0, 14.0, 24.0, 30.0, 30.0, 33.0, 44.0, 50.0, 40.0, 52.0, 39.0, 1079.0, 49.0, 45.0, 45.0, 43.0, 34.0, 40.0, 38.0, 30.0, 32.0, 24.0, 12.0, 16.0, 14.0, 14.0, 3.0, 8.0, 5.0, 10.0, 10.0, 3.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.943603515625, -4.79345703125, -4.643310546875, -4.4931640625, -4.343017578125, -4.19287109375, -4.042724609375, -3.892578125, -3.742431640625, -3.59228515625, -3.442138671875, -3.2919921875, -3.141845703125, -2.99169921875, -2.841552734375, -2.69140625, -2.541259765625, -2.39111328125, -2.240966796875, -2.0908203125, -1.940673828125, -1.79052734375, -1.640380859375, -1.490234375, -1.340087890625, -1.18994140625, -1.039794921875, -0.8896484375, -0.739501953125, -0.58935546875, -0.439208984375, -0.2890625, -0.138916015625, 0.01123046875, 0.161376953125, 0.3115234375, 0.461669921875, 0.61181640625, 0.761962890625, 0.912109375, 1.062255859375, 1.21240234375, 1.362548828125, 1.5126953125, 1.662841796875, 1.81298828125, 1.963134765625, 2.11328125, 2.263427734375, 2.41357421875, 2.563720703125, 2.7138671875, 2.864013671875, 3.01416015625, 3.164306640625, 3.314453125, 3.464599609375, 3.61474609375, 3.764892578125, 3.9150390625, 4.065185546875, 4.21533203125, 4.365478515625, 4.515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 11.0, 4.0, 11.0, 19.0, 26.0, 54.0, 55.0, 92.0, 154.0, 241.0, 329.0, 478.0, 722.0, 1066.0, 1614.0, 2397.0, 3716.0, 5435.0, 8166.0, 12297.0, 19321.0, 31890.0, 54862.0, 98508.0, 189174.0, 1315032.0, 150559.0, 80677.0, 45399.0, 26613.0, 16509.0, 10503.0, 7118.0, 4640.0, 3135.0, 2060.0, 1390.0, 920.0, 610.0, 462.0, 294.0, 219.0, 120.0, 76.0, 59.0, 37.0, 25.0, 12.0, 7.0, 3.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.91650390625, -0.8862838745117188, -0.8560638427734375, -0.8258438110351562, -0.795623779296875, -0.7654037475585938, -0.7351837158203125, -0.7049636840820312, -0.67474365234375, -0.6445236206054688, -0.6143035888671875, -0.5840835571289062, -0.553863525390625, -0.5236434936523438, -0.4934234619140625, -0.46320343017578125, -0.4329833984375, -0.40276336669921875, -0.3725433349609375, -0.34232330322265625, -0.312103271484375, -0.28188323974609375, -0.2516632080078125, -0.22144317626953125, -0.19122314453125, -0.16100311279296875, -0.1307830810546875, -0.10056304931640625, -0.070343017578125, -0.04012298583984375, -0.0099029541015625, 0.02031707763671875, 0.050537109375, 0.08075714111328125, 0.1109771728515625, 0.14119720458984375, 0.171417236328125, 0.20163726806640625, 0.2318572998046875, 0.26207733154296875, 0.29229736328125, 0.32251739501953125, 0.3527374267578125, 0.38295745849609375, 0.413177490234375, 0.44339752197265625, 0.4736175537109375, 0.5038375854492188, 0.5340576171875, 0.5642776489257812, 0.5944976806640625, 0.6247177124023438, 0.654937744140625, 0.6851577758789062, 0.7153778076171875, 0.7455978393554688, 0.77581787109375, 0.8060379028320312, 0.8362579345703125, 0.8664779663085938, 0.896697998046875, 0.9269180297851562, 0.9571380615234375, 0.9873580932617188, 1.017578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 6.0, 11.0, 10.0, 20.0, 27.0, 36.0, 34.0, 40.0, 55.0, 70.0, 68.0, 93.0, 89.0, 86.0, 64.0, 67.0, 58.0, 32.0, 25.0, 24.0, 11.0, 23.0, 12.0, 14.0, 8.0, 8.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001232147216796875, -0.0011951923370361328, -0.0011582374572753906, -0.0011212825775146484, -0.0010843276977539062, -0.001047372817993164, -0.0010104179382324219, -0.0009734630584716797, -0.0009365081787109375, -0.0008995532989501953, -0.0008625984191894531, -0.0008256435394287109, -0.0007886886596679688, -0.0007517337799072266, -0.0007147789001464844, -0.0006778240203857422, -0.000640869140625, -0.0006039142608642578, -0.0005669593811035156, -0.0005300045013427734, -0.0004930496215820312, -0.00045609474182128906, -0.0004191398620605469, -0.0003821849822998047, -0.0003452301025390625, -0.0003082752227783203, -0.0002713203430175781, -0.00023436546325683594, -0.00019741058349609375, -0.00016045570373535156, -0.00012350082397460938, -8.654594421386719e-05, -4.9591064453125e-05, -1.2636184692382812e-05, 2.4318695068359375e-05, 6.127357482910156e-05, 9.822845458984375e-05, 0.00013518333435058594, 0.00017213821411132812, 0.0002090930938720703, 0.0002460479736328125, 0.0002830028533935547, 0.0003199577331542969, 0.00035691261291503906, 0.00039386749267578125, 0.00043082237243652344, 0.0004677772521972656, 0.0005047321319580078, 0.00054168701171875, 0.0005786418914794922, 0.0006155967712402344, 0.0006525516510009766, 0.0006895065307617188, 0.0007264614105224609, 0.0007634162902832031, 0.0008003711700439453, 0.0008373260498046875, 0.0008742809295654297, 0.0009112358093261719, 0.0009481906890869141, 0.0009851455688476562, 0.0010221004486083984, 0.0010590553283691406, 0.0010960102081298828, 0.001132965087890625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 10.0, 7.0, 8.0, 16.0, 16.0, 16.0, 24.0, 25.0, 34.0, 55.0, 63.0, 124.0, 190.0, 569.0, 4427.0, 1039107.0, 2807.0, 472.0, 198.0, 123.0, 60.0, 52.0, 32.0, 28.0, 23.0, 12.0, 16.0, 8.0, 9.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0271453857421875, -0.026253938674926758, -0.025362491607666016, -0.024471044540405273, -0.02357959747314453, -0.02268815040588379, -0.021796703338623047, -0.020905256271362305, -0.020013809204101562, -0.01912236213684082, -0.018230915069580078, -0.017339468002319336, -0.016448020935058594, -0.015556573867797852, -0.01466512680053711, -0.013773679733276367, -0.012882232666015625, -0.011990785598754883, -0.01109933853149414, -0.010207891464233398, -0.009316444396972656, -0.008424997329711914, -0.007533550262451172, -0.00664210319519043, -0.0057506561279296875, -0.004859209060668945, -0.003967761993408203, -0.003076314926147461, -0.0021848678588867188, -0.0012934207916259766, -0.0004019737243652344, 0.0004894733428955078, 0.00138092041015625, 0.002272367477416992, 0.0031638145446777344, 0.0040552616119384766, 0.004946708679199219, 0.005838155746459961, 0.006729602813720703, 0.007621049880981445, 0.008512496948242188, 0.00940394401550293, 0.010295391082763672, 0.011186838150024414, 0.012078285217285156, 0.012969732284545898, 0.01386117935180664, 0.014752626419067383, 0.015644073486328125, 0.016535520553588867, 0.01742696762084961, 0.01831841468811035, 0.019209861755371094, 0.020101308822631836, 0.020992755889892578, 0.02188420295715332, 0.022775650024414062, 0.023667097091674805, 0.024558544158935547, 0.02544999122619629, 0.02634143829345703, 0.027232885360717773, 0.028124332427978516, 0.029015779495239258, 0.0299072265625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 45.0, 257.0, 470.0, 206.0, 27.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003547140397131443, -0.0034739698749035597, -0.0034007993526756763, -0.003327628830447793, -0.0032544583082199097, -0.0031812877859920263, -0.003108117263764143, -0.0030349469743669033, -0.0029617762193083763, -0.002888605697080493, -0.0028154351748526096, -0.0027422646526247263, -0.002669094130396843, -0.0025959236081689596, -0.0025227530859410763, -0.0024495827965438366, -0.0023764122743159533, -0.00230324175208807, -0.0022300712298601866, -0.0021569007076323032, -0.00208373018540442, -0.0020105596631765366, -0.001937389257363975, -0.0018642187351360917, -0.0017910482129082084, -0.001717877690680325, -0.0016447071684524417, -0.0015715366462245584, -0.0014983662404119968, -0.0014251957181841135, -0.0013520251959562302, -0.0012788546737283468, -0.0012056839186698198, -0.0011325133964419365, -0.0010593428742140532, -0.0009861723519861698, -0.0009130018879659474, -0.000839831365738064, -0.0007666609017178416, -0.0006934903794899583, -0.000620319857262075, -0.0005471493350341916, -0.0004739788419101387, -0.00040080834878608584, -0.0003276378265582025, -0.00025446730433031917, -0.00018129681120626628, -0.0001081263180822134, -3.495579585433006e-05, 3.821471182163805e-05, 0.00011138521949760616, 0.00018455572717357427, 0.0002577262348495424, 0.0003308967570774257, 0.0004040672502014786, 0.0004772377433255315, 0.0005504082655534148, 0.0006235787877812982, 0.0006967493100091815, 0.0007699197740294039, 0.0008430902962572873, 0.0009162608184851706, 0.000989431282505393, 0.0010626018047332764, 0.0011357723269611597]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 11.0, 5.0, 7.0, 15.0, 15.0, 20.0, 21.0, 20.0, 23.0, 25.0, 37.0, 28.0, 28.0, 36.0, 40.0, 37.0, 38.0, 31.0, 32.0, 36.0, 39.0, 36.0, 42.0, 46.0, 32.0, 36.0, 30.0, 34.0, 20.0, 28.0, 21.0, 17.0, 17.0, 12.0, 12.0, 8.0, 12.0, 15.0, 6.0, 6.0, 7.0, 6.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00040394067764282227, -0.00039034057408571243, -0.0003767404705286026, -0.00036314036697149277, -0.00034954026341438293, -0.0003359401598572731, -0.00032234005630016327, -0.00030873995274305344, -0.0002951398491859436, -0.00028153974562883377, -0.00026793964207172394, -0.0002543395385146141, -0.00024073943495750427, -0.00022713933140039444, -0.0002135392278432846, -0.00019993912428617477, -0.00018633902072906494, -0.0001727389171719551, -0.00015913881361484528, -0.00014553871005773544, -0.0001319386065006256, -0.00011833850294351578, -0.00010473839938640594, -9.113829582929611e-05, -7.753819227218628e-05, -6.393808871507645e-05, -5.0337985157966614e-05, -3.673788160085678e-05, -2.3137778043746948e-05, -9.537674486637115e-06, 4.062429070472717e-06, 1.766253262758255e-05, 3.126263618469238e-05, 4.4862739741802216e-05, 5.846284329891205e-05, 7.206294685602188e-05, 8.566305041313171e-05, 9.926315397024155e-05, 0.00011286325752735138, 0.0001264633610844612, 0.00014006346464157104, 0.00015366356819868088, 0.0001672636717557907, 0.00018086377531290054, 0.00019446387887001038, 0.0002080639824271202, 0.00022166408598423004, 0.00023526418954133987, 0.0002488642930984497, 0.00026246439665555954, 0.00027606450021266937, 0.0002896646037697792, 0.00030326470732688904, 0.00031686481088399887, 0.0003304649144411087, 0.00034406501799821854, 0.00035766512155532837, 0.0003712652251124382, 0.00038486532866954803, 0.00039846543222665787, 0.0004120655357837677, 0.00042566563934087753, 0.00043926574289798737, 0.0004528658464550972, 0.00046646595001220703]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 8.0, 9.0, 9.0, 9.0, 10.0, 15.0, 10.0, 15.0, 8.0, 21.0, 28.0, 24.0, 22.0, 28.0, 27.0, 30.0, 33.0, 43.0, 42.0, 38.0, 46.0, 36.0, 46.0, 38.0, 41.0, 39.0, 21.0, 27.0, 31.0, 26.0, 25.0, 27.0, 15.0, 14.0, 23.0, 22.0, 18.0, 18.0, 6.0, 8.0, 12.0, 6.0, 9.0, 5.0, 8.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.4140625, -6.21856689453125, -6.0230712890625, -5.82757568359375, -5.632080078125, -5.43658447265625, -5.2410888671875, -5.04559326171875, -4.85009765625, -4.65460205078125, -4.4591064453125, -4.26361083984375, -4.068115234375, -3.87261962890625, -3.6771240234375, -3.48162841796875, -3.2861328125, -3.09063720703125, -2.8951416015625, -2.69964599609375, -2.504150390625, -2.30865478515625, -2.1131591796875, -1.91766357421875, -1.72216796875, -1.52667236328125, -1.3311767578125, -1.13568115234375, -0.940185546875, -0.74468994140625, -0.5491943359375, -0.35369873046875, -0.158203125, 0.03729248046875, 0.2327880859375, 0.42828369140625, 0.623779296875, 0.81927490234375, 1.0147705078125, 1.21026611328125, 1.40576171875, 1.60125732421875, 1.7967529296875, 1.99224853515625, 2.187744140625, 2.38323974609375, 2.5787353515625, 2.77423095703125, 2.9697265625, 3.16522216796875, 3.3607177734375, 3.55621337890625, 3.751708984375, 3.94720458984375, 4.1427001953125, 4.33819580078125, 4.53369140625, 4.72918701171875, 4.9246826171875, 5.12017822265625, 5.315673828125, 5.51116943359375, 5.7066650390625, 5.90216064453125, 6.09765625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 7.0, 16.0, 19.0, 21.0, 22.0, 38.0, 38.0, 78.0, 111.0, 116.0, 196.0, 321.0, 602.0, 1132.0, 2301.0, 5287.0, 13756.0, 42784.0, 164256.0, 521268.0, 212988.0, 54312.0, 16874.0, 6341.0, 2670.0, 1243.0, 643.0, 332.0, 225.0, 132.0, 103.0, 72.0, 57.0, 43.0, 36.0, 18.0, 16.0, 14.0, 10.0, 13.0, 7.0, 7.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-6.546875, -6.35198974609375, -6.1571044921875, -5.96221923828125, -5.767333984375, -5.57244873046875, -5.3775634765625, -5.18267822265625, -4.98779296875, -4.79290771484375, -4.5980224609375, -4.40313720703125, -4.208251953125, -4.01336669921875, -3.8184814453125, -3.62359619140625, -3.4287109375, -3.23382568359375, -3.0389404296875, -2.84405517578125, -2.649169921875, -2.45428466796875, -2.2593994140625, -2.06451416015625, -1.86962890625, -1.67474365234375, -1.4798583984375, -1.28497314453125, -1.090087890625, -0.89520263671875, -0.7003173828125, -0.50543212890625, -0.310546875, -0.11566162109375, 0.0792236328125, 0.27410888671875, 0.468994140625, 0.66387939453125, 0.8587646484375, 1.05364990234375, 1.24853515625, 1.44342041015625, 1.6383056640625, 1.83319091796875, 2.028076171875, 2.22296142578125, 2.4178466796875, 2.61273193359375, 2.8076171875, 3.00250244140625, 3.1973876953125, 3.39227294921875, 3.587158203125, 3.78204345703125, 3.9769287109375, 4.17181396484375, 4.36669921875, 4.56158447265625, 4.7564697265625, 4.95135498046875, 5.146240234375, 5.34112548828125, 5.5360107421875, 5.73089599609375, 5.92578125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 6.0, 12.0, 16.0, 22.0, 20.0, 27.0, 29.0, 37.0, 34.0, 37.0, 28.0, 45.0, 60.0, 89.0, 1604.0, 427.0, 87.0, 45.0, 41.0, 53.0, 34.0, 29.0, 39.0, 44.0, 36.0, 18.0, 21.0, 16.0, 14.0, 13.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -22.109619140625, -21.34423828125, -20.578857421875, -19.8134765625, -19.048095703125, -18.28271484375, -17.517333984375, -16.751953125, -15.986572265625, -15.22119140625, -14.455810546875, -13.6904296875, -12.925048828125, -12.15966796875, -11.394287109375, -10.62890625, -9.863525390625, -9.09814453125, -8.332763671875, -7.5673828125, -6.802001953125, -6.03662109375, -5.271240234375, -4.505859375, -3.740478515625, -2.97509765625, -2.209716796875, -1.4443359375, -0.678955078125, 0.08642578125, 0.851806640625, 1.6171875, 2.382568359375, 3.14794921875, 3.913330078125, 4.6787109375, 5.444091796875, 6.20947265625, 6.974853515625, 7.740234375, 8.505615234375, 9.27099609375, 10.036376953125, 10.8017578125, 11.567138671875, 12.33251953125, 13.097900390625, 13.86328125, 14.628662109375, 15.39404296875, 16.159423828125, 16.9248046875, 17.690185546875, 18.45556640625, 19.220947265625, 19.986328125, 20.751708984375, 21.51708984375, 22.282470703125, 23.0478515625, 23.813232421875, 24.57861328125, 25.343994140625, 26.109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 17.0, 17.0, 22.0, 22.0, 30.0, 38.0, 54.0, 106.0, 125.0, 171.0, 258.0, 432.0, 884.0, 10558.0, 3120362.0, 10502.0, 878.0, 389.0, 244.0, 171.0, 102.0, 77.0, 73.0, 35.0, 31.0, 21.0, 11.0, 13.0, 10.0, 11.0, 6.0, 2.0, 10.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.1875, -63.181640625, -61.17578125, -59.169921875, -57.1640625, -55.158203125, -53.15234375, -51.146484375, -49.140625, -47.134765625, -45.12890625, -43.123046875, -41.1171875, -39.111328125, -37.10546875, -35.099609375, -33.09375, -31.087890625, -29.08203125, -27.076171875, -25.0703125, -23.064453125, -21.05859375, -19.052734375, -17.046875, -15.041015625, -13.03515625, -11.029296875, -9.0234375, -7.017578125, -5.01171875, -3.005859375, -1.0, 1.005859375, 3.01171875, 5.017578125, 7.0234375, 9.029296875, 11.03515625, 13.041015625, 15.046875, 17.052734375, 19.05859375, 21.064453125, 23.0703125, 25.076171875, 27.08203125, 29.087890625, 31.09375, 33.099609375, 35.10546875, 37.111328125, 39.1171875, 41.123046875, 43.12890625, 45.134765625, 47.140625, 49.146484375, 51.15234375, 53.158203125, 55.1640625, 57.169921875, 59.17578125, 61.181640625, 63.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 68.0, 451.0, 422.0, 70.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.95098876953125, -129.3613739013672, -126.77175903320312, -124.18214416503906, -121.592529296875, -119.00291442871094, -116.41329956054688, -113.82368469238281, -111.23406982421875, -108.64445495605469, -106.05484008789062, -103.46522521972656, -100.8756103515625, -98.28599548339844, -95.69638061523438, -93.10676574707031, -90.51715087890625, -87.92753601074219, -85.33792114257812, -82.74830627441406, -80.15869140625, -77.56907653808594, -74.97946166992188, -72.38984680175781, -69.80023193359375, -67.21061706542969, -64.62100219726562, -62.03138732910156, -59.4417724609375, -56.85215759277344, -54.262542724609375, -51.67292785644531, -49.083309173583984, -46.49369430541992, -43.90407943725586, -41.3144645690918, -38.724849700927734, -36.13523483276367, -33.54561996459961, -30.956005096435547, -28.366390228271484, -25.776775360107422, -23.18716049194336, -20.597545623779297, -18.007930755615234, -15.418315887451172, -12.82870101928711, -10.239086151123047, -7.649471282958984, -5.059856414794922, -2.4702415466308594, 0.11937332153320312, 2.7089881896972656, 5.298603057861328, 7.888217926025391, 10.477832794189453, 13.067447662353516, 15.657062530517578, 18.24667739868164, 20.836292266845703, 23.425907135009766, 26.015522003173828, 28.60513687133789, 31.194751739501953, 33.784366607666016]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 7.0, 6.0, 30.0, 20.0, 23.0, 22.0, 26.0, 23.0, 26.0, 43.0, 42.0, 39.0, 50.0, 61.0, 49.0, 56.0, 50.0, 52.0, 42.0, 51.0, 29.0, 32.0, 25.0, 35.0, 26.0, 23.0, 30.0, 10.0, 14.0, 12.0, 8.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.52313232421875, -70.36395263671875, -68.20476531982422, -66.04558563232422, -63.88640213012695, -61.72721862792969, -59.56803894042969, -57.40885543823242, -55.249671936035156, -53.09048843383789, -50.931304931640625, -48.772125244140625, -46.61294174194336, -44.453758239746094, -42.294578552246094, -40.13539505004883, -37.97621154785156, -35.8170280456543, -33.65784454345703, -31.49866485595703, -29.339481353759766, -27.1802978515625, -25.021116256713867, -22.861934661865234, -20.70275115966797, -18.543567657470703, -16.38438606262207, -14.225203514099121, -12.066020965576172, -9.906838417053223, -7.747655868530273, -5.588473320007324, -3.429290771484375, -1.2701082229614258, 0.8890743255615234, 3.0482568740844727, 5.207439422607422, 7.366621971130371, 9.52580451965332, 11.68498706817627, 13.844169616699219, 16.003353118896484, 18.162534713745117, 20.32171630859375, 22.480899810791016, 24.64008331298828, 26.799264907836914, 28.958446502685547, 31.117630004882812, 33.27681350708008, 35.435997009277344, 37.595176696777344, 39.75436019897461, 41.913543701171875, 44.072723388671875, 46.23190689086914, 48.391090393066406, 50.55027389526367, 52.70945739746094, 54.86863708496094, 57.0278205871582, 59.18700408935547, 61.34618377685547, 63.505367279052734, 65.66455078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 9.0, 11.0, 13.0, 9.0, 12.0, 19.0, 18.0, 26.0, 27.0, 17.0, 24.0, 42.0, 37.0, 31.0, 29.0, 47.0, 43.0, 36.0, 34.0, 45.0, 36.0, 39.0, 29.0, 26.0, 36.0, 32.0, 21.0, 22.0, 20.0, 25.0, 16.0, 14.0, 16.0, 16.0, 22.0, 10.0, 11.0, 8.0, 11.0, 9.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.15234375, -5.9581298828125, -5.763916015625, -5.5697021484375, -5.37548828125, -5.1812744140625, -4.987060546875, -4.7928466796875, -4.5986328125, -4.4044189453125, -4.210205078125, -4.0159912109375, -3.82177734375, -3.6275634765625, -3.433349609375, -3.2391357421875, -3.044921875, -2.8507080078125, -2.656494140625, -2.4622802734375, -2.26806640625, -2.0738525390625, -1.879638671875, -1.6854248046875, -1.4912109375, -1.2969970703125, -1.102783203125, -0.9085693359375, -0.71435546875, -0.5201416015625, -0.325927734375, -0.1317138671875, 0.0625, 0.2567138671875, 0.450927734375, 0.6451416015625, 0.83935546875, 1.0335693359375, 1.227783203125, 1.4219970703125, 1.6162109375, 1.8104248046875, 2.004638671875, 2.1988525390625, 2.39306640625, 2.5872802734375, 2.781494140625, 2.9757080078125, 3.169921875, 3.3641357421875, 3.558349609375, 3.7525634765625, 3.94677734375, 4.1409912109375, 4.335205078125, 4.5294189453125, 4.7236328125, 4.9178466796875, 5.112060546875, 5.3062744140625, 5.50048828125, 5.6947021484375, 5.888916015625, 6.0831298828125, 6.27734375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 8.0, 6.0, 9.0, 18.0, 13.0, 26.0, 21.0, 26.0, 32.0, 35.0, 38.0, 38.0, 55.0, 57.0, 85.0, 139.0, 185.0, 386.0, 767.0, 2154.0, 12987.0, 210779.0, 2263625.0, 1592925.0, 99152.0, 7502.0, 1588.0, 584.0, 264.0, 179.0, 115.0, 79.0, 52.0, 55.0, 39.0, 49.0, 38.0, 31.0, 26.0, 22.0, 14.0, 18.0, 14.0, 10.0, 12.0, 7.0, 3.0, 0.0, 4.0, 7.0, 1.0, 2.0, 1.0, 3.0], "bins": [-17.171875, -16.649658203125, -16.12744140625, -15.605224609375, -15.0830078125, -14.560791015625, -14.03857421875, -13.516357421875, -12.994140625, -12.471923828125, -11.94970703125, -11.427490234375, -10.9052734375, -10.383056640625, -9.86083984375, -9.338623046875, -8.81640625, -8.294189453125, -7.77197265625, -7.249755859375, -6.7275390625, -6.205322265625, -5.68310546875, -5.160888671875, -4.638671875, -4.116455078125, -3.59423828125, -3.072021484375, -2.5498046875, -2.027587890625, -1.50537109375, -0.983154296875, -0.4609375, 0.061279296875, 0.58349609375, 1.105712890625, 1.6279296875, 2.150146484375, 2.67236328125, 3.194580078125, 3.716796875, 4.239013671875, 4.76123046875, 5.283447265625, 5.8056640625, 6.327880859375, 6.85009765625, 7.372314453125, 7.89453125, 8.416748046875, 8.93896484375, 9.461181640625, 9.9833984375, 10.505615234375, 11.02783203125, 11.550048828125, 12.072265625, 12.594482421875, 13.11669921875, 13.638916015625, 14.1611328125, 14.683349609375, 15.20556640625, 15.727783203125, 16.25]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 10.0, 15.0, 21.0, 20.0, 31.0, 49.0, 71.0, 94.0, 145.0, 180.0, 252.0, 333.0, 439.0, 498.0, 472.0, 393.0, 275.0, 219.0, 162.0, 113.0, 67.0, 52.0, 48.0, 24.0, 20.0, 18.0, 9.0, 12.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8359375, -15.380126953125, -14.92431640625, -14.468505859375, -14.0126953125, -13.556884765625, -13.10107421875, -12.645263671875, -12.189453125, -11.733642578125, -11.27783203125, -10.822021484375, -10.3662109375, -9.910400390625, -9.45458984375, -8.998779296875, -8.54296875, -8.087158203125, -7.63134765625, -7.175537109375, -6.7197265625, -6.263916015625, -5.80810546875, -5.352294921875, -4.896484375, -4.440673828125, -3.98486328125, -3.529052734375, -3.0732421875, -2.617431640625, -2.16162109375, -1.705810546875, -1.25, -0.794189453125, -0.33837890625, 0.117431640625, 0.5732421875, 1.029052734375, 1.48486328125, 1.940673828125, 2.396484375, 2.852294921875, 3.30810546875, 3.763916015625, 4.2197265625, 4.675537109375, 5.13134765625, 5.587158203125, 6.04296875, 6.498779296875, 6.95458984375, 7.410400390625, 7.8662109375, 8.322021484375, 8.77783203125, 9.233642578125, 9.689453125, 10.145263671875, 10.60107421875, 11.056884765625, 11.5126953125, 11.968505859375, 12.42431640625, 12.880126953125, 13.3359375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 16.0, 14.0, 33.0, 46.0, 55.0, 61.0, 107.0, 112.0, 147.0, 222.0, 335.0, 483.0, 1267.0, 1233519.0, 2954339.0, 1720.0, 540.0, 340.0, 241.0, 165.0, 138.0, 108.0, 59.0, 43.0, 44.0, 34.0, 26.0, 17.0, 12.0, 8.0, 3.0, 2.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.5625, -77.0, -74.4375, -71.875, -69.3125, -66.75, -64.1875, -61.625, -59.0625, -56.5, -53.9375, -51.375, -48.8125, -46.25, -43.6875, -41.125, -38.5625, -36.0, -33.4375, -30.875, -28.3125, -25.75, -23.1875, -20.625, -18.0625, -15.5, -12.9375, -10.375, -7.8125, -5.25, -2.6875, -0.125, 2.4375, 5.0, 7.5625, 10.125, 12.6875, 15.25, 17.8125, 20.375, 22.9375, 25.5, 28.0625, 30.625, 33.1875, 35.75, 38.3125, 40.875, 43.4375, 46.0, 48.5625, 51.125, 53.6875, 56.25, 58.8125, 61.375, 63.9375, 66.5, 69.0625, 71.625, 74.1875, 76.75, 79.3125, 81.875, 84.4375]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 8.0, 60.0, 340.0, 475.0, 122.0, 9.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.8811950683594, -258.9228820800781, -251.96458435058594, -245.0062713623047, -238.0479736328125, -231.08966064453125, -224.13134765625, -217.17303466796875, -210.21473693847656, -203.2564239501953, -196.29812622070312, -189.33981323242188, -182.38150024414062, -175.42320251464844, -168.4648895263672, -161.506591796875, -154.54827880859375, -147.5899658203125, -140.6316680908203, -133.67335510253906, -126.71504974365234, -119.75674438476562, -112.79843139648438, -105.84012603759766, -98.88182067871094, -91.92351531982422, -84.9652099609375, -78.00689697265625, -71.04859161376953, -64.09028625488281, -57.13197708129883, -50.173667907714844, -43.21534729003906, -36.257041931152344, -29.29873275756836, -22.340425491333008, -15.382118225097656, -8.423812866210938, -1.4655036926269531, 5.492805480957031, 12.45111083984375, 19.4094181060791, 26.367725372314453, 33.32603454589844, 40.284339904785156, 47.242645263671875, 54.20095443725586, 61.159263610839844, 68.11756896972656, 75.07587432861328, 82.0341796875, 88.99249267578125, 95.95079803466797, 102.90910339355469, 109.86741638183594, 116.82572174072266, 123.78402709960938, 130.74234008789062, 137.7006378173828, 144.65895080566406, 151.61724853515625, 158.5755615234375, 165.53387451171875, 172.4921875, 179.4504852294922]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 15.0, 5.0, 12.0, 12.0, 18.0, 9.0, 25.0, 24.0, 26.0, 31.0, 29.0, 29.0, 51.0, 27.0, 32.0, 35.0, 38.0, 41.0, 43.0, 32.0, 41.0, 40.0, 44.0, 38.0, 36.0, 26.0, 36.0, 32.0, 20.0, 25.0, 20.0, 27.0, 10.0, 8.0, 3.0, 5.0, 10.0, 10.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-40.64363098144531, -39.27654266357422, -37.90945053100586, -36.542362213134766, -35.17527389526367, -33.80818176269531, -32.44109344482422, -31.074005126953125, -29.7069149017334, -28.339824676513672, -26.972736358642578, -25.60564613342285, -24.238555908203125, -22.87146759033203, -21.504377365112305, -20.137287139892578, -18.770198822021484, -17.403108596801758, -16.036020278930664, -14.668930053710938, -13.301840782165527, -11.934751510620117, -10.56766128540039, -9.20057201385498, -7.83348274230957, -6.46639347076416, -5.099303722381592, -3.7322139739990234, -2.3651247024536133, -0.9980354309082031, 0.36905479431152344, 1.7361440658569336, 3.1032333374023438, 4.470322608947754, 5.837412357330322, 7.204502105712891, 8.5715913772583, 9.938680648803711, 11.305770874023438, 12.672860145568848, 14.039949417114258, 15.407038688659668, 16.774127960205078, 18.141218185424805, 19.50830841064453, 20.875396728515625, 22.24248695373535, 23.609577178955078, 24.976665496826172, 26.3437557220459, 27.710844039916992, 29.07793426513672, 30.445022583007812, 31.81211280822754, 33.179203033447266, 34.54629135131836, 35.91338348388672, 37.28047180175781, 38.64756393432617, 40.014652252197266, 41.38174057006836, 42.74883270263672, 44.11592102050781, 45.483009338378906, 46.85009765625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 4.0, 10.0, 5.0, 9.0, 8.0, 5.0, 10.0, 10.0, 15.0, 12.0, 12.0, 23.0, 23.0, 31.0, 28.0, 23.0, 35.0, 25.0, 44.0, 36.0, 43.0, 39.0, 31.0, 37.0, 47.0, 47.0, 47.0, 29.0, 27.0, 27.0, 19.0, 24.0, 20.0, 23.0, 26.0, 14.0, 22.0, 10.0, 16.0, 15.0, 6.0, 15.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.0546875, -5.863525390625, -5.67236328125, -5.481201171875, -5.2900390625, -5.098876953125, -4.90771484375, -4.716552734375, -4.525390625, -4.334228515625, -4.14306640625, -3.951904296875, -3.7607421875, -3.569580078125, -3.37841796875, -3.187255859375, -2.99609375, -2.804931640625, -2.61376953125, -2.422607421875, -2.2314453125, -2.040283203125, -1.84912109375, -1.657958984375, -1.466796875, -1.275634765625, -1.08447265625, -0.893310546875, -0.7021484375, -0.510986328125, -0.31982421875, -0.128662109375, 0.0625, 0.253662109375, 0.44482421875, 0.635986328125, 0.8271484375, 1.018310546875, 1.20947265625, 1.400634765625, 1.591796875, 1.782958984375, 1.97412109375, 2.165283203125, 2.3564453125, 2.547607421875, 2.73876953125, 2.929931640625, 3.12109375, 3.312255859375, 3.50341796875, 3.694580078125, 3.8857421875, 4.076904296875, 4.26806640625, 4.459228515625, 4.650390625, 4.841552734375, 5.03271484375, 5.223876953125, 5.4150390625, 5.606201171875, 5.79736328125, 5.988525390625, 6.1796875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 9.0, 11.0, 22.0, 32.0, 34.0, 45.0, 96.0, 149.0, 180.0, 324.0, 455.0, 604.0, 942.0, 1359.0, 2022.0, 2778.0, 4158.0, 6123.0, 9039.0, 13366.0, 19972.0, 30629.0, 48657.0, 80541.0, 141765.0, 254051.0, 174662.0, 95245.0, 56141.0, 35059.0, 22961.0, 14886.0, 10100.0, 7046.0, 4813.0, 3245.0, 2212.0, 1539.0, 1048.0, 688.0, 507.0, 341.0, 226.0, 155.0, 116.0, 68.0, 41.0, 43.0, 21.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.923828125, -0.895538330078125, -0.86724853515625, -0.838958740234375, -0.8106689453125, -0.782379150390625, -0.75408935546875, -0.725799560546875, -0.697509765625, -0.669219970703125, -0.64093017578125, -0.612640380859375, -0.5843505859375, -0.556060791015625, -0.52777099609375, -0.499481201171875, -0.47119140625, -0.442901611328125, -0.41461181640625, -0.386322021484375, -0.3580322265625, -0.329742431640625, -0.30145263671875, -0.273162841796875, -0.244873046875, -0.216583251953125, -0.18829345703125, -0.160003662109375, -0.1317138671875, -0.103424072265625, -0.07513427734375, -0.046844482421875, -0.0185546875, 0.009735107421875, 0.03802490234375, 0.066314697265625, 0.0946044921875, 0.122894287109375, 0.15118408203125, 0.179473876953125, 0.207763671875, 0.236053466796875, 0.26434326171875, 0.292633056640625, 0.3209228515625, 0.349212646484375, 0.37750244140625, 0.405792236328125, 0.43408203125, 0.462371826171875, 0.49066162109375, 0.518951416015625, 0.5472412109375, 0.575531005859375, 0.60382080078125, 0.632110595703125, 0.660400390625, 0.688690185546875, 0.71697998046875, 0.745269775390625, 0.7735595703125, 0.801849365234375, 0.83013916015625, 0.858428955078125, 0.88671875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 6.0, 9.0, 2.0, 8.0, 7.0, 8.0, 13.0, 14.0, 26.0, 19.0, 28.0, 30.0, 26.0, 27.0, 30.0, 34.0, 29.0, 39.0, 38.0, 35.0, 35.0, 1077.0, 48.0, 46.0, 33.0, 30.0, 24.0, 29.0, 37.0, 36.0, 27.0, 24.0, 28.0, 14.0, 15.0, 20.0, 12.0, 11.0, 14.0, 9.0, 5.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.02734375, -3.89544677734375, -3.7635498046875, -3.63165283203125, -3.499755859375, -3.36785888671875, -3.2359619140625, -3.10406494140625, -2.97216796875, -2.84027099609375, -2.7083740234375, -2.57647705078125, -2.444580078125, -2.31268310546875, -2.1807861328125, -2.04888916015625, -1.9169921875, -1.78509521484375, -1.6531982421875, -1.52130126953125, -1.389404296875, -1.25750732421875, -1.1256103515625, -0.99371337890625, -0.86181640625, -0.72991943359375, -0.5980224609375, -0.46612548828125, -0.334228515625, -0.20233154296875, -0.0704345703125, 0.06146240234375, 0.193359375, 0.32525634765625, 0.4571533203125, 0.58905029296875, 0.720947265625, 0.85284423828125, 0.9847412109375, 1.11663818359375, 1.24853515625, 1.38043212890625, 1.5123291015625, 1.64422607421875, 1.776123046875, 1.90802001953125, 2.0399169921875, 2.17181396484375, 2.3037109375, 2.43560791015625, 2.5675048828125, 2.69940185546875, 2.831298828125, 2.96319580078125, 3.0950927734375, 3.22698974609375, 3.35888671875, 3.49078369140625, 3.6226806640625, 3.75457763671875, 3.886474609375, 4.01837158203125, 4.1502685546875, 4.28216552734375, 4.4140625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 4.0, 7.0, 11.0, 9.0, 24.0, 22.0, 39.0, 57.0, 52.0, 95.0, 118.0, 179.0, 252.0, 328.0, 531.0, 712.0, 980.0, 1396.0, 2009.0, 2805.0, 3967.0, 5840.0, 8585.0, 12795.0, 18651.0, 28430.0, 43980.0, 69110.0, 112430.0, 197508.0, 1256053.0, 118733.0, 73218.0, 46055.0, 29915.0, 19781.0, 13134.0, 8961.0, 6092.0, 4159.0, 3100.0, 2088.0, 1455.0, 1039.0, 678.0, 484.0, 341.0, 256.0, 191.0, 140.0, 93.0, 66.0, 59.0, 34.0, 29.0, 31.0, 9.0, 9.0, 9.0, 3.0, 2.0, 2.0], "bins": [-0.82861328125, -0.802764892578125, -0.77691650390625, -0.751068115234375, -0.7252197265625, -0.699371337890625, -0.67352294921875, -0.647674560546875, -0.621826171875, -0.595977783203125, -0.57012939453125, -0.544281005859375, -0.5184326171875, -0.492584228515625, -0.46673583984375, -0.440887451171875, -0.4150390625, -0.389190673828125, -0.36334228515625, -0.337493896484375, -0.3116455078125, -0.285797119140625, -0.25994873046875, -0.234100341796875, -0.208251953125, -0.182403564453125, -0.15655517578125, -0.130706787109375, -0.1048583984375, -0.079010009765625, -0.05316162109375, -0.027313232421875, -0.00146484375, 0.024383544921875, 0.05023193359375, 0.076080322265625, 0.1019287109375, 0.127777099609375, 0.15362548828125, 0.179473876953125, 0.205322265625, 0.231170654296875, 0.25701904296875, 0.282867431640625, 0.3087158203125, 0.334564208984375, 0.36041259765625, 0.386260986328125, 0.412109375, 0.437957763671875, 0.46380615234375, 0.489654541015625, 0.5155029296875, 0.541351318359375, 0.56719970703125, 0.593048095703125, 0.618896484375, 0.644744873046875, 0.67059326171875, 0.696441650390625, 0.7222900390625, 0.748138427734375, 0.77398681640625, 0.799835205078125, 0.82568359375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 6.0, 9.0, 8.0, 7.0, 5.0, 15.0, 13.0, 12.0, 26.0, 34.0, 41.0, 34.0, 58.0, 67.0, 73.0, 81.0, 84.0, 65.0, 75.0, 59.0, 48.0, 31.0, 27.0, 19.0, 17.0, 17.0, 9.0, 14.0, 6.0, 5.0, 8.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0015478134155273438, -0.001505047082901001, -0.0014622807502746582, -0.0014195144176483154, -0.0013767480850219727, -0.0013339817523956299, -0.0012912154197692871, -0.0012484490871429443, -0.0012056827545166016, -0.0011629164218902588, -0.001120150089263916, -0.0010773837566375732, -0.0010346174240112305, -0.0009918510913848877, -0.0009490847587585449, -0.0009063184261322021, -0.0008635520935058594, -0.0008207857608795166, -0.0007780194282531738, -0.0007352530956268311, -0.0006924867630004883, -0.0006497204303741455, -0.0006069540977478027, -0.00056418776512146, -0.0005214214324951172, -0.0004786550998687744, -0.00043588876724243164, -0.00039312243461608887, -0.0003503561019897461, -0.0003075897693634033, -0.00026482343673706055, -0.00022205710411071777, -0.000179290771484375, -0.00013652443885803223, -9.375810623168945e-05, -5.099177360534668e-05, -8.225440979003906e-06, 3.454089164733887e-05, 7.730722427368164e-05, 0.00012007355690002441, 0.0001628398895263672, 0.00020560622215270996, 0.00024837255477905273, 0.0002911388874053955, 0.0003339052200317383, 0.00037667155265808105, 0.00041943788528442383, 0.0004622042179107666, 0.0005049705505371094, 0.0005477368831634521, 0.0005905032157897949, 0.0006332695484161377, 0.0006760358810424805, 0.0007188022136688232, 0.000761568546295166, 0.0008043348789215088, 0.0008471012115478516, 0.0008898675441741943, 0.0009326338768005371, 0.0009754002094268799, 0.0010181665420532227, 0.0010609328746795654, 0.0011036992073059082, 0.001146465539932251, 0.0011892318725585938]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 8.0, 4.0, 1.0, 10.0, 15.0, 13.0, 20.0, 32.0, 24.0, 46.0, 71.0, 88.0, 193.0, 454.0, 2956.0, 1041356.0, 2228.0, 460.0, 191.0, 82.0, 73.0, 55.0, 41.0, 27.0, 23.0, 14.0, 12.0, 10.0, 6.0, 9.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02984619140625, -0.028797626495361328, -0.027749061584472656, -0.026700496673583984, -0.025651931762695312, -0.02460336685180664, -0.02355480194091797, -0.022506237030029297, -0.021457672119140625, -0.020409107208251953, -0.01936054229736328, -0.01831197738647461, -0.017263412475585938, -0.016214847564697266, -0.015166282653808594, -0.014117717742919922, -0.01306915283203125, -0.012020587921142578, -0.010972023010253906, -0.009923458099365234, -0.008874893188476562, -0.00782632827758789, -0.006777763366699219, -0.005729198455810547, -0.004680633544921875, -0.003632068634033203, -0.0025835037231445312, -0.0015349388122558594, -0.0004863739013671875, 0.0005621910095214844, 0.0016107559204101562, 0.002659320831298828, 0.0037078857421875, 0.004756450653076172, 0.005805015563964844, 0.006853580474853516, 0.007902145385742188, 0.00895071029663086, 0.009999275207519531, 0.011047840118408203, 0.012096405029296875, 0.013144969940185547, 0.014193534851074219, 0.01524209976196289, 0.016290664672851562, 0.017339229583740234, 0.018387794494628906, 0.019436359405517578, 0.02048492431640625, 0.021533489227294922, 0.022582054138183594, 0.023630619049072266, 0.024679183959960938, 0.02572774887084961, 0.02677631378173828, 0.027824878692626953, 0.028873443603515625, 0.029922008514404297, 0.03097057342529297, 0.03201913833618164, 0.03306770324707031, 0.034116268157958984, 0.035164833068847656, 0.03621339797973633, 0.037261962890625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 84.0, 348.0, 452.0, 114.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005578746204264462, -0.00047948287101462483, -0.000401091092498973, -0.0003226993139833212, -0.0002443075645714998, -0.00016591581515967846, -8.752403664402664e-05, -9.132258128374815e-06, 6.925949128344655e-05, 0.00014765125524718314, 0.00022604301921091974, 0.00030443479772657156, 0.0003828265471383929, 0.0004612182965502143, 0.0005396100459620357, 0.0006180018535815179, 0.0006963936029933393, 0.0007747853524051607, 0.0008531771600246429, 0.0009315689094364643, 0.0010099606588482857, 0.001088352408260107, 0.0011667441576719284, 0.0012451359070837498, 0.0013235276564955711, 0.0014019194059073925, 0.0014803111553192139, 0.0015587029047310352, 0.0016370946541428566, 0.001715486403554678, 0.0017938782693818212, 0.0018722700187936425, 0.001950661651790142, 0.0020290534012019634, 0.002107445150613785, 0.002185836900025606, 0.0022642286494374275, 0.002342620398849249, 0.0024210121482610703, 0.0024994038976728916, 0.002577795647084713, 0.0026561873964965343, 0.0027345791459083557, 0.002812970895320177, 0.0028913626447319984, 0.00296975439414382, 0.003048146143555641, 0.0031265378929674625, 0.0032049298752099276, 0.003283321624621749, 0.0033617133740335703, 0.0034401051234453917, 0.003518496872857213, 0.0035968886222690344, 0.0036752803716808558, 0.0037536723539233208, 0.003832064103335142, 0.0039104558527469635, 0.003988847602158785, 0.004067239351570606, 0.004145631100982428, 0.004224022850394249, 0.00430241459980607, 0.004380806349217892, 0.004459198098629713]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 6.0, 8.0, 9.0, 16.0, 5.0, 16.0, 18.0, 17.0, 27.0, 25.0, 17.0, 29.0, 36.0, 36.0, 34.0, 31.0, 39.0, 43.0, 53.0, 45.0, 37.0, 42.0, 35.0, 44.0, 36.0, 39.0, 38.0, 24.0, 23.0, 19.0, 24.0, 22.0, 22.0, 17.0, 13.0, 12.0, 9.0, 11.0, 4.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006906390190124512, -0.0006702588871121407, -0.0006498787552118301, -0.0006294986233115196, -0.0006091184914112091, -0.0005887383595108986, -0.0005683582276105881, -0.0005479780957102776, -0.000527597963809967, -0.0005072178319096565, -0.000486837700009346, -0.0004664575681090355, -0.000446077436208725, -0.00042569730430841446, -0.00040531717240810394, -0.0003849370405077934, -0.0003645569086074829, -0.0003441767767071724, -0.0003237966448068619, -0.00030341651290655136, -0.00028303638100624084, -0.00026265624910593033, -0.0002422761172056198, -0.0002218959853053093, -0.00020151585340499878, -0.00018113572150468826, -0.00016075558960437775, -0.00014037545770406723, -0.00011999532580375671, -9.96151939034462e-05, -7.923506200313568e-05, -5.8854930102825165e-05, -3.847479820251465e-05, -1.8094666302204132e-05, 2.2854655981063843e-06, 2.26655974984169e-05, 4.304572939872742e-05, 6.342586129903793e-05, 8.380599319934845e-05, 0.00010418612509965897, 0.00012456625699996948, 0.00014494638890028, 0.00016532652080059052, 0.00018570665270090103, 0.00020608678460121155, 0.00022646691650152206, 0.0002468470484018326, 0.0002672271803021431, 0.0002876073122024536, 0.00030798744410276413, 0.00032836757600307465, 0.00034874770790338516, 0.0003691278398036957, 0.0003895079717040062, 0.0004098881036043167, 0.00043026823550462723, 0.00045064836740493774, 0.00047102849930524826, 0.0004914086312055588, 0.0005117887631058693, 0.0005321688950061798, 0.0005525490269064903, 0.0005729291588068008, 0.0005933092907071114, 0.0006136894226074219]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 4.0, 10.0, 5.0, 9.0, 8.0, 5.0, 10.0, 10.0, 15.0, 12.0, 12.0, 23.0, 23.0, 31.0, 28.0, 23.0, 35.0, 25.0, 44.0, 36.0, 43.0, 39.0, 31.0, 37.0, 47.0, 47.0, 47.0, 29.0, 27.0, 27.0, 19.0, 24.0, 20.0, 23.0, 26.0, 14.0, 22.0, 10.0, 16.0, 15.0, 6.0, 15.0, 14.0, 6.0, 6.0, 7.0, 6.0, 2.0, 5.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.0546875, -5.863525390625, -5.67236328125, -5.481201171875, -5.2900390625, -5.098876953125, -4.90771484375, -4.716552734375, -4.525390625, -4.334228515625, -4.14306640625, -3.951904296875, -3.7607421875, -3.569580078125, -3.37841796875, -3.187255859375, -2.99609375, -2.804931640625, -2.61376953125, -2.422607421875, -2.2314453125, -2.040283203125, -1.84912109375, -1.657958984375, -1.466796875, -1.275634765625, -1.08447265625, -0.893310546875, -0.7021484375, -0.510986328125, -0.31982421875, -0.128662109375, 0.0625, 0.253662109375, 0.44482421875, 0.635986328125, 0.8271484375, 1.018310546875, 1.20947265625, 1.400634765625, 1.591796875, 1.782958984375, 1.97412109375, 2.165283203125, 2.3564453125, 2.547607421875, 2.73876953125, 2.929931640625, 3.12109375, 3.312255859375, 3.50341796875, 3.694580078125, 3.8857421875, 4.076904296875, 4.26806640625, 4.459228515625, 4.650390625, 4.841552734375, 5.03271484375, 5.223876953125, 5.4150390625, 5.606201171875, 5.79736328125, 5.988525390625, 6.1796875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 7.0, 9.0, 16.0, 8.0, 20.0, 31.0, 58.0, 80.0, 119.0, 170.0, 285.0, 487.0, 784.0, 1448.0, 2649.0, 4947.0, 9264.0, 17693.0, 35725.0, 76083.0, 172759.0, 354895.0, 200598.0, 87414.0, 40511.0, 19767.0, 10390.0, 5504.0, 2875.0, 1614.0, 915.0, 542.0, 324.0, 162.0, 118.0, 84.0, 48.0, 45.0, 28.0, 13.0, 14.0, 12.0, 7.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.1796875, -4.04736328125, -3.9150390625, -3.78271484375, -3.650390625, -3.51806640625, -3.3857421875, -3.25341796875, -3.12109375, -2.98876953125, -2.8564453125, -2.72412109375, -2.591796875, -2.45947265625, -2.3271484375, -2.19482421875, -2.0625, -1.93017578125, -1.7978515625, -1.66552734375, -1.533203125, -1.40087890625, -1.2685546875, -1.13623046875, -1.00390625, -0.87158203125, -0.7392578125, -0.60693359375, -0.474609375, -0.34228515625, -0.2099609375, -0.07763671875, 0.0546875, 0.18701171875, 0.3193359375, 0.45166015625, 0.583984375, 0.71630859375, 0.8486328125, 0.98095703125, 1.11328125, 1.24560546875, 1.3779296875, 1.51025390625, 1.642578125, 1.77490234375, 1.9072265625, 2.03955078125, 2.171875, 2.30419921875, 2.4365234375, 2.56884765625, 2.701171875, 2.83349609375, 2.9658203125, 3.09814453125, 3.23046875, 3.36279296875, 3.4951171875, 3.62744140625, 3.759765625, 3.89208984375, 4.0244140625, 4.15673828125, 4.2890625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 12.0, 12.0, 12.0, 23.0, 22.0, 18.0, 21.0, 26.0, 43.0, 26.0, 36.0, 51.0, 42.0, 52.0, 86.0, 219.0, 1620.0, 203.0, 80.0, 53.0, 48.0, 33.0, 42.0, 26.0, 31.0, 30.0, 27.0, 16.0, 24.0, 16.0, 17.0, 6.0, 7.0, 9.0, 7.0, 6.0, 2.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.859375, -21.163330078125, -20.46728515625, -19.771240234375, -19.0751953125, -18.379150390625, -17.68310546875, -16.987060546875, -16.291015625, -15.594970703125, -14.89892578125, -14.202880859375, -13.5068359375, -12.810791015625, -12.11474609375, -11.418701171875, -10.72265625, -10.026611328125, -9.33056640625, -8.634521484375, -7.9384765625, -7.242431640625, -6.54638671875, -5.850341796875, -5.154296875, -4.458251953125, -3.76220703125, -3.066162109375, -2.3701171875, -1.674072265625, -0.97802734375, -0.281982421875, 0.4140625, 1.110107421875, 1.80615234375, 2.502197265625, 3.1982421875, 3.894287109375, 4.59033203125, 5.286376953125, 5.982421875, 6.678466796875, 7.37451171875, 8.070556640625, 8.7666015625, 9.462646484375, 10.15869140625, 10.854736328125, 11.55078125, 12.246826171875, 12.94287109375, 13.638916015625, 14.3349609375, 15.031005859375, 15.72705078125, 16.423095703125, 17.119140625, 17.815185546875, 18.51123046875, 19.207275390625, 19.9033203125, 20.599365234375, 21.29541015625, 21.991455078125, 22.6875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 5.0, 10.0, 8.0, 10.0, 12.0, 16.0, 26.0, 36.0, 29.0, 49.0, 51.0, 77.0, 77.0, 134.0, 142.0, 203.0, 298.0, 569.0, 1941.0, 168968.0, 2964987.0, 5904.0, 703.0, 359.0, 245.0, 175.0, 137.0, 118.0, 83.0, 72.0, 50.0, 36.0, 31.0, 32.0, 14.0, 19.0, 12.0, 8.0, 9.0, 6.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-52.8125, -51.171875, -49.53125, -47.890625, -46.25, -44.609375, -42.96875, -41.328125, -39.6875, -38.046875, -36.40625, -34.765625, -33.125, -31.484375, -29.84375, -28.203125, -26.5625, -24.921875, -23.28125, -21.640625, -20.0, -18.359375, -16.71875, -15.078125, -13.4375, -11.796875, -10.15625, -8.515625, -6.875, -5.234375, -3.59375, -1.953125, -0.3125, 1.328125, 2.96875, 4.609375, 6.25, 7.890625, 9.53125, 11.171875, 12.8125, 14.453125, 16.09375, 17.734375, 19.375, 21.015625, 22.65625, 24.296875, 25.9375, 27.578125, 29.21875, 30.859375, 32.5, 34.140625, 35.78125, 37.421875, 39.0625, 40.703125, 42.34375, 43.984375, 45.625, 47.265625, 48.90625, 50.546875, 52.1875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 82.0, 469.0, 419.0, 39.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.46463012695312, -150.38973999023438, -147.31483459472656, -144.23992919921875, -141.1650390625, -138.09014892578125, -135.01524353027344, -131.94033813476562, -128.86544799804688, -125.7905502319336, -122.71565246582031, -119.64075469970703, -116.56585693359375, -113.49095916748047, -110.41606140136719, -107.3411636352539, -104.26626586914062, -101.19136810302734, -98.11647033691406, -95.04157257080078, -91.9666748046875, -88.89177703857422, -85.81687927246094, -82.74198150634766, -79.66708374023438, -76.5921859741211, -73.51728820800781, -70.44239044189453, -67.36749267578125, -64.29259490966797, -61.21769714355469, -58.142799377441406, -55.067901611328125, -51.993003845214844, -48.91810607910156, -45.84320831298828, -42.768310546875, -39.69341278076172, -36.61851501464844, -33.543617248535156, -30.468719482421875, -27.393821716308594, -24.318923950195312, -21.24402618408203, -18.16912841796875, -15.094230651855469, -12.019332885742188, -8.944435119628906, -5.869537353515625, -2.7946395874023438, 0.2802581787109375, 3.3551559448242188, 6.4300537109375, 9.504951477050781, 12.579849243164062, 15.654747009277344, 18.729644775390625, 21.804542541503906, 24.879440307617188, 27.95433807373047, 31.02923583984375, 34.10413360595703, 37.17903137207031, 40.253929138183594, 43.328826904296875]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 1.0, 5.0, 4.0, 12.0, 6.0, 10.0, 8.0, 21.0, 20.0, 24.0, 22.0, 30.0, 28.0, 29.0, 33.0, 37.0, 33.0, 33.0, 36.0, 41.0, 40.0, 46.0, 38.0, 48.0, 45.0, 36.0, 29.0, 38.0, 32.0, 32.0, 35.0, 16.0, 18.0, 22.0, 11.0, 12.0, 12.0, 11.0, 5.0, 8.0, 13.0, 3.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-61.41435241699219, -59.62894058227539, -57.843528747558594, -56.05811309814453, -54.272701263427734, -52.48728942871094, -50.70187759399414, -48.916465759277344, -47.13105010986328, -45.345638275146484, -43.56022644042969, -41.774810791015625, -39.98939895629883, -38.20398712158203, -36.418575286865234, -34.63316345214844, -32.84775161743164, -31.062339782714844, -29.276926040649414, -27.491514205932617, -25.706100463867188, -23.92068862915039, -22.135276794433594, -20.349864959716797, -18.564451217651367, -16.77903938293457, -14.99362564086914, -13.208213806152344, -11.42280101776123, -9.637388229370117, -7.85197639465332, -6.066563606262207, -4.281150817871094, -2.4957382678985596, -0.7103257179260254, 1.0750865936279297, 2.860499382019043, 4.645912170410156, 6.431324005126953, 8.216736793518066, 10.00214958190918, 11.787562370300293, 13.572975158691406, 15.358386993408203, 17.143798828125, 18.92921257019043, 20.714624404907227, 22.500038146972656, 24.285449981689453, 26.07086181640625, 27.85627555847168, 29.641687393188477, 31.427101135253906, 33.2125129699707, 34.9979248046875, 36.7833366394043, 38.568748474121094, 40.35416030883789, 42.13957214355469, 43.92498779296875, 45.71039962768555, 47.495811462402344, 49.28122329711914, 51.06663513183594, 52.85205078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 10.0, 7.0, 2.0, 13.0, 7.0, 11.0, 13.0, 14.0, 21.0, 11.0, 20.0, 26.0, 26.0, 33.0, 29.0, 31.0, 36.0, 38.0, 37.0, 34.0, 41.0, 46.0, 40.0, 43.0, 43.0, 30.0, 36.0, 36.0, 23.0, 28.0, 21.0, 25.0, 17.0, 14.0, 23.0, 19.0, 14.0, 15.0, 12.0, 11.0, 5.0, 9.0, 8.0, 9.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1953125, -5.99005126953125, -5.7847900390625, -5.57952880859375, -5.374267578125, -5.16900634765625, -4.9637451171875, -4.75848388671875, -4.55322265625, -4.34796142578125, -4.1427001953125, -3.93743896484375, -3.732177734375, -3.52691650390625, -3.3216552734375, -3.11639404296875, -2.9111328125, -2.70587158203125, -2.5006103515625, -2.29534912109375, -2.090087890625, -1.88482666015625, -1.6795654296875, -1.47430419921875, -1.26904296875, -1.06378173828125, -0.8585205078125, -0.65325927734375, -0.447998046875, -0.24273681640625, -0.0374755859375, 0.16778564453125, 0.373046875, 0.57830810546875, 0.7835693359375, 0.98883056640625, 1.194091796875, 1.39935302734375, 1.6046142578125, 1.80987548828125, 2.01513671875, 2.22039794921875, 2.4256591796875, 2.63092041015625, 2.836181640625, 3.04144287109375, 3.2467041015625, 3.45196533203125, 3.6572265625, 3.86248779296875, 4.0677490234375, 4.27301025390625, 4.478271484375, 4.68353271484375, 4.8887939453125, 5.09405517578125, 5.29931640625, 5.50457763671875, 5.7098388671875, 5.91510009765625, 6.120361328125, 6.32562255859375, 6.5308837890625, 6.73614501953125, 6.94140625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 8.0, 9.0, 5.0, 11.0, 13.0, 13.0, 12.0, 15.0, 22.0, 15.0, 19.0, 37.0, 46.0, 59.0, 93.0, 204.0, 415.0, 1123.0, 4694.0, 75602.0, 2581227.0, 1496227.0, 29918.0, 2841.0, 807.0, 328.0, 148.0, 92.0, 55.0, 36.0, 23.0, 24.0, 21.0, 26.0, 13.0, 15.0, 9.0, 11.0, 9.0, 9.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.28125, -22.52734375, -21.7734375, -21.01953125, -20.265625, -19.51171875, -18.7578125, -18.00390625, -17.25, -16.49609375, -15.7421875, -14.98828125, -14.234375, -13.48046875, -12.7265625, -11.97265625, -11.21875, -10.46484375, -9.7109375, -8.95703125, -8.203125, -7.44921875, -6.6953125, -5.94140625, -5.1875, -4.43359375, -3.6796875, -2.92578125, -2.171875, -1.41796875, -0.6640625, 0.08984375, 0.84375, 1.59765625, 2.3515625, 3.10546875, 3.859375, 4.61328125, 5.3671875, 6.12109375, 6.875, 7.62890625, 8.3828125, 9.13671875, 9.890625, 10.64453125, 11.3984375, 12.15234375, 12.90625, 13.66015625, 14.4140625, 15.16796875, 15.921875, 16.67578125, 17.4296875, 18.18359375, 18.9375, 19.69140625, 20.4453125, 21.19921875, 21.953125, 22.70703125, 23.4609375, 24.21484375, 24.96875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 11.0, 9.0, 9.0, 18.0, 27.0, 54.0, 42.0, 69.0, 85.0, 101.0, 152.0, 161.0, 263.0, 295.0, 376.0, 468.0, 424.0, 363.0, 289.0, 217.0, 159.0, 112.0, 103.0, 62.0, 53.0, 45.0, 17.0, 19.0, 15.0, 12.0, 11.0, 5.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.6220703125, -14.212890625, -13.8037109375, -13.39453125, -12.9853515625, -12.576171875, -12.1669921875, -11.7578125, -11.3486328125, -10.939453125, -10.5302734375, -10.12109375, -9.7119140625, -9.302734375, -8.8935546875, -8.484375, -8.0751953125, -7.666015625, -7.2568359375, -6.84765625, -6.4384765625, -6.029296875, -5.6201171875, -5.2109375, -4.8017578125, -4.392578125, -3.9833984375, -3.57421875, -3.1650390625, -2.755859375, -2.3466796875, -1.9375, -1.5283203125, -1.119140625, -0.7099609375, -0.30078125, 0.1083984375, 0.517578125, 0.9267578125, 1.3359375, 1.7451171875, 2.154296875, 2.5634765625, 2.97265625, 3.3818359375, 3.791015625, 4.2001953125, 4.609375, 5.0185546875, 5.427734375, 5.8369140625, 6.24609375, 6.6552734375, 7.064453125, 7.4736328125, 7.8828125, 8.2919921875, 8.701171875, 9.1103515625, 9.51953125, 9.9287109375, 10.337890625, 10.7470703125, 11.15625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 13.0, 17.0, 19.0, 20.0, 33.0, 27.0, 35.0, 66.0, 72.0, 93.0, 122.0, 135.0, 217.0, 248.0, 356.0, 595.0, 2898.0, 2345116.0, 1839590.0, 2551.0, 570.0, 313.0, 262.0, 188.0, 150.0, 121.0, 115.0, 93.0, 45.0, 50.0, 34.0, 28.0, 17.0, 14.0, 14.0, 14.0, 4.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-59.78125, -57.64501953125, -55.5087890625, -53.37255859375, -51.236328125, -49.10009765625, -46.9638671875, -44.82763671875, -42.69140625, -40.55517578125, -38.4189453125, -36.28271484375, -34.146484375, -32.01025390625, -29.8740234375, -27.73779296875, -25.6015625, -23.46533203125, -21.3291015625, -19.19287109375, -17.056640625, -14.92041015625, -12.7841796875, -10.64794921875, -8.51171875, -6.37548828125, -4.2392578125, -2.10302734375, 0.033203125, 2.16943359375, 4.3056640625, 6.44189453125, 8.578125, 10.71435546875, 12.8505859375, 14.98681640625, 17.123046875, 19.25927734375, 21.3955078125, 23.53173828125, 25.66796875, 27.80419921875, 29.9404296875, 32.07666015625, 34.212890625, 36.34912109375, 38.4853515625, 40.62158203125, 42.7578125, 44.89404296875, 47.0302734375, 49.16650390625, 51.302734375, 53.43896484375, 55.5751953125, 57.71142578125, 59.84765625, 61.98388671875, 64.1201171875, 66.25634765625, 68.392578125, 70.52880859375, 72.6650390625, 74.80126953125, 76.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 27.0, 136.0, 328.0, 311.0, 158.0, 48.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.14505004882812, -75.45402526855469, -70.76300048828125, -66.07197570800781, -61.380950927734375, -56.68992614746094, -51.9989013671875, -47.30787658691406, -42.616851806640625, -37.92582702636719, -33.23480224609375, -28.543777465820312, -23.852752685546875, -19.161727905273438, -14.470703125, -9.779678344726562, -5.088653564453125, -0.3976287841796875, 4.29339599609375, 8.984420776367188, 13.675445556640625, 18.366470336914062, 23.0574951171875, 27.748519897460938, 32.439544677734375, 37.13056945800781, 41.82159423828125, 46.51261901855469, 51.203643798828125, 55.89466857910156, 60.585693359375, 65.27671813964844, 69.96774291992188, 74.65876770019531, 79.34979248046875, 84.04081726074219, 88.73184204101562, 93.42286682128906, 98.1138916015625, 102.80491638183594, 107.49594116210938, 112.18696594238281, 116.87799072265625, 121.56901550292969, 126.26004028320312, 130.95106506347656, 135.64208984375, 140.33311462402344, 145.02413940429688, 149.7151641845703, 154.40618896484375, 159.0972137451172, 163.78823852539062, 168.47926330566406, 173.1702880859375, 177.86131286621094, 182.55233764648438, 187.2433624267578, 191.93438720703125, 196.6254119873047, 201.31643676757812, 206.00746154785156, 210.698486328125, 215.38951110839844, 220.08053588867188]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 4.0, 8.0, 15.0, 10.0, 9.0, 17.0, 18.0, 15.0, 18.0, 21.0, 22.0, 29.0, 40.0, 45.0, 32.0, 38.0, 40.0, 37.0, 30.0, 37.0, 47.0, 41.0, 41.0, 40.0, 43.0, 32.0, 26.0, 37.0, 22.0, 25.0, 22.0, 22.0, 26.0, 16.0, 13.0, 15.0, 8.0, 13.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-44.460479736328125, -43.14581298828125, -41.83115005493164, -40.516483306884766, -39.201820373535156, -37.88715362548828, -36.572486877441406, -35.25782012939453, -33.94315719604492, -32.62849044799805, -31.313827514648438, -29.999160766601562, -28.68449592590332, -27.369831085205078, -26.055164337158203, -24.74049949645996, -23.42583465576172, -22.111169815063477, -20.796504974365234, -19.48183822631836, -18.167173385620117, -16.852508544921875, -15.537842750549316, -14.223176956176758, -12.908512115478516, -11.593847274780273, -10.279181480407715, -8.964515686035156, -7.649850845336914, -6.335185527801514, -5.020520210266113, -3.7058544158935547, -2.3911895751953125, -1.076524257659912, 0.23814105987548828, 1.5528063774108887, 2.867471694946289, 4.1821370124816895, 5.49680233001709, 6.811468124389648, 8.12613296508789, 9.440797805786133, 10.755463600158691, 12.07012939453125, 13.384794235229492, 14.699459075927734, 16.01412582397461, 17.32879066467285, 18.643455505371094, 19.958120346069336, 21.272785186767578, 22.587451934814453, 23.902116775512695, 25.216781616210938, 26.531448364257812, 27.846113204956055, 29.160778045654297, 30.47544288635254, 31.79010772705078, 33.104774475097656, 34.41944122314453, 35.73410415649414, 37.048770904541016, 38.363433837890625, 39.6781005859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 8.0, 1.0, 5.0, 4.0, 9.0, 6.0, 11.0, 11.0, 10.0, 11.0, 16.0, 18.0, 21.0, 25.0, 25.0, 27.0, 37.0, 32.0, 27.0, 36.0, 36.0, 44.0, 48.0, 34.0, 43.0, 34.0, 43.0, 33.0, 44.0, 35.0, 32.0, 37.0, 26.0, 31.0, 21.0, 22.0, 18.0, 12.0, 14.0, 6.0, 8.0, 10.0, 6.0, 8.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.03125, -5.81744384765625, -5.6036376953125, -5.38983154296875, -5.176025390625, -4.96221923828125, -4.7484130859375, -4.53460693359375, -4.32080078125, -4.10699462890625, -3.8931884765625, -3.67938232421875, -3.465576171875, -3.25177001953125, -3.0379638671875, -2.82415771484375, -2.6103515625, -2.39654541015625, -2.1827392578125, -1.96893310546875, -1.755126953125, -1.54132080078125, -1.3275146484375, -1.11370849609375, -0.89990234375, -0.68609619140625, -0.4722900390625, -0.25848388671875, -0.044677734375, 0.16912841796875, 0.3829345703125, 0.59674072265625, 0.810546875, 1.02435302734375, 1.2381591796875, 1.45196533203125, 1.665771484375, 1.87957763671875, 2.0933837890625, 2.30718994140625, 2.52099609375, 2.73480224609375, 2.9486083984375, 3.16241455078125, 3.376220703125, 3.59002685546875, 3.8038330078125, 4.01763916015625, 4.2314453125, 4.44525146484375, 4.6590576171875, 4.87286376953125, 5.086669921875, 5.30047607421875, 5.5142822265625, 5.72808837890625, 5.94189453125, 6.15570068359375, 6.3695068359375, 6.58331298828125, 6.797119140625, 7.01092529296875, 7.2247314453125, 7.43853759765625, 7.65234375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 12.0, 23.0, 40.0, 51.0, 73.0, 113.0, 198.0, 277.0, 405.0, 605.0, 849.0, 1197.0, 1712.0, 2394.0, 3600.0, 5445.0, 8703.0, 12970.0, 19877.0, 31918.0, 52619.0, 88357.0, 158043.0, 251662.0, 166024.0, 93206.0, 54604.0, 33152.0, 20892.0, 13254.0, 8708.0, 5614.0, 3812.0, 2580.0, 1683.0, 1246.0, 826.0, 570.0, 408.0, 280.0, 193.0, 134.0, 69.0, 48.0, 42.0, 22.0, 11.0, 7.0, 10.0, 5.0, 9.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.95263671875, -0.9224319458007812, -0.8922271728515625, -0.8620223999023438, -0.831817626953125, -0.8016128540039062, -0.7714080810546875, -0.7412033081054688, -0.71099853515625, -0.6807937622070312, -0.6505889892578125, -0.6203842163085938, -0.590179443359375, -0.5599746704101562, -0.5297698974609375, -0.49956512451171875, -0.4693603515625, -0.43915557861328125, -0.4089508056640625, -0.37874603271484375, -0.348541259765625, -0.31833648681640625, -0.2881317138671875, -0.25792694091796875, -0.22772216796875, -0.19751739501953125, -0.1673126220703125, -0.13710784912109375, -0.106903076171875, -0.07669830322265625, -0.0464935302734375, -0.01628875732421875, 0.013916015625, 0.04412078857421875, 0.0743255615234375, 0.10453033447265625, 0.134735107421875, 0.16493988037109375, 0.1951446533203125, 0.22534942626953125, 0.25555419921875, 0.28575897216796875, 0.3159637451171875, 0.34616851806640625, 0.376373291015625, 0.40657806396484375, 0.4367828369140625, 0.46698760986328125, 0.4971923828125, 0.5273971557617188, 0.5576019287109375, 0.5878067016601562, 0.618011474609375, 0.6482162475585938, 0.6784210205078125, 0.7086257934570312, 0.73883056640625, 0.7690353393554688, 0.7992401123046875, 0.8294448852539062, 0.859649658203125, 0.8898544311523438, 0.9200592041015625, 0.9502639770507812, 0.98046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 9.0, 5.0, 10.0, 20.0, 14.0, 18.0, 13.0, 14.0, 19.0, 25.0, 31.0, 35.0, 35.0, 39.0, 50.0, 48.0, 35.0, 34.0, 27.0, 1064.0, 43.0, 34.0, 38.0, 43.0, 30.0, 36.0, 42.0, 30.0, 25.0, 19.0, 13.0, 18.0, 18.0, 14.0, 7.0, 14.0, 1.0, 13.0, 5.0, 7.0, 4.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.962890625, -3.826690673828125, -3.69049072265625, -3.554290771484375, -3.4180908203125, -3.281890869140625, -3.14569091796875, -3.009490966796875, -2.873291015625, -2.737091064453125, -2.60089111328125, -2.464691162109375, -2.3284912109375, -2.192291259765625, -2.05609130859375, -1.919891357421875, -1.78369140625, -1.647491455078125, -1.51129150390625, -1.375091552734375, -1.2388916015625, -1.102691650390625, -0.96649169921875, -0.830291748046875, -0.694091796875, -0.557891845703125, -0.42169189453125, -0.285491943359375, -0.1492919921875, -0.013092041015625, 0.12310791015625, 0.259307861328125, 0.3955078125, 0.531707763671875, 0.66790771484375, 0.804107666015625, 0.9403076171875, 1.076507568359375, 1.21270751953125, 1.348907470703125, 1.485107421875, 1.621307373046875, 1.75750732421875, 1.893707275390625, 2.0299072265625, 2.166107177734375, 2.30230712890625, 2.438507080078125, 2.57470703125, 2.710906982421875, 2.84710693359375, 2.983306884765625, 3.1195068359375, 3.255706787109375, 3.39190673828125, 3.528106689453125, 3.664306640625, 3.800506591796875, 3.93670654296875, 4.072906494140625, 4.2091064453125, 4.345306396484375, 4.48150634765625, 4.617706298828125, 4.75390625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 6.0, 13.0, 20.0, 12.0, 21.0, 39.0, 38.0, 62.0, 75.0, 115.0, 155.0, 212.0, 336.0, 465.0, 687.0, 945.0, 1363.0, 1903.0, 2736.0, 3936.0, 5711.0, 8466.0, 12200.0, 18327.0, 28623.0, 46407.0, 76832.0, 129685.0, 1267157.0, 193477.0, 112331.0, 66640.0, 40691.0, 25285.0, 16632.0, 10928.0, 7460.0, 5099.0, 3554.0, 2492.0, 1752.0, 1217.0, 871.0, 621.0, 450.0, 349.0, 205.0, 162.0, 114.0, 76.0, 73.0, 37.0, 25.0, 15.0, 18.0, 8.0, 3.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.86669921875, -0.8395004272460938, -0.8123016357421875, -0.7851028442382812, -0.757904052734375, -0.7307052612304688, -0.7035064697265625, -0.6763076782226562, -0.64910888671875, -0.6219100952148438, -0.5947113037109375, -0.5675125122070312, -0.540313720703125, -0.5131149291992188, -0.4859161376953125, -0.45871734619140625, -0.4315185546875, -0.40431976318359375, -0.3771209716796875, -0.34992218017578125, -0.322723388671875, -0.29552459716796875, -0.2683258056640625, -0.24112701416015625, -0.21392822265625, -0.18672943115234375, -0.1595306396484375, -0.13233184814453125, -0.105133056640625, -0.07793426513671875, -0.0507354736328125, -0.02353668212890625, 0.003662109375, 0.03086090087890625, 0.0580596923828125, 0.08525848388671875, 0.112457275390625, 0.13965606689453125, 0.1668548583984375, 0.19405364990234375, 0.22125244140625, 0.24845123291015625, 0.2756500244140625, 0.30284881591796875, 0.330047607421875, 0.35724639892578125, 0.3844451904296875, 0.41164398193359375, 0.4388427734375, 0.46604156494140625, 0.4932403564453125, 0.5204391479492188, 0.547637939453125, 0.5748367309570312, 0.6020355224609375, 0.6292343139648438, 0.65643310546875, 0.6836318969726562, 0.7108306884765625, 0.7380294799804688, 0.765228271484375, 0.7924270629882812, 0.8196258544921875, 0.8468246459960938, 0.8740234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 8.0, 7.0, 6.0, 7.0, 5.0, 5.0, 6.0, 5.0, 12.0, 18.0, 26.0, 26.0, 35.0, 38.0, 36.0, 43.0, 55.0, 73.0, 65.0, 77.0, 65.0, 52.0, 57.0, 40.0, 54.0, 29.0, 28.0, 26.0, 14.0, 15.0, 10.0, 13.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0012912750244140625, -0.0012529492378234863, -0.0012146234512329102, -0.001176297664642334, -0.0011379718780517578, -0.0010996460914611816, -0.0010613203048706055, -0.0010229945182800293, -0.0009846687316894531, -0.000946342945098877, -0.0009080171585083008, -0.0008696913719177246, -0.0008313655853271484, -0.0007930397987365723, -0.0007547140121459961, -0.0007163882255554199, -0.0006780624389648438, -0.0006397366523742676, -0.0006014108657836914, -0.0005630850791931152, -0.0005247592926025391, -0.0004864335060119629, -0.0004481077194213867, -0.00040978193283081055, -0.0003714561462402344, -0.0003331303596496582, -0.00029480457305908203, -0.00025647878646850586, -0.0002181529998779297, -0.00017982721328735352, -0.00014150142669677734, -0.00010317564010620117, -6.4849853515625e-05, -2.6524066925048828e-05, 1.1801719665527344e-05, 5.0127506256103516e-05, 8.845329284667969e-05, 0.00012677907943725586, 0.00016510486602783203, 0.0002034306526184082, 0.00024175643920898438, 0.00028008222579956055, 0.0003184080123901367, 0.0003567337989807129, 0.00039505958557128906, 0.00043338537216186523, 0.0004717111587524414, 0.0005100369453430176, 0.0005483627319335938, 0.0005866885185241699, 0.0006250143051147461, 0.0006633400917053223, 0.0007016658782958984, 0.0007399916648864746, 0.0007783174514770508, 0.000816643238067627, 0.0008549690246582031, 0.0008932948112487793, 0.0009316205978393555, 0.0009699463844299316, 0.0010082721710205078, 0.001046597957611084, 0.0010849237442016602, 0.0011232495307922363, 0.0011615753173828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 3.0, 4.0, 4.0, 6.0, 4.0, 8.0, 10.0, 14.0, 19.0, 20.0, 28.0, 36.0, 51.0, 63.0, 97.0, 150.0, 337.0, 913.0, 315342.0, 729353.0, 1068.0, 353.0, 180.0, 114.0, 90.0, 57.0, 56.0, 29.0, 23.0, 13.0, 15.0, 16.0, 13.0, 11.0, 10.0, 7.0, 5.0, 7.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.02752685546875, -0.026610612869262695, -0.02569437026977539, -0.024778127670288086, -0.02386188507080078, -0.022945642471313477, -0.022029399871826172, -0.021113157272338867, -0.020196914672851562, -0.019280672073364258, -0.018364429473876953, -0.01744818687438965, -0.016531944274902344, -0.015615701675415039, -0.014699459075927734, -0.01378321647644043, -0.012866973876953125, -0.01195073127746582, -0.011034488677978516, -0.010118246078491211, -0.009202003479003906, -0.008285760879516602, -0.007369518280029297, -0.006453275680541992, -0.0055370330810546875, -0.004620790481567383, -0.003704547882080078, -0.0027883052825927734, -0.0018720626831054688, -0.0009558200836181641, -3.9577484130859375e-05, 0.0008766651153564453, 0.00179290771484375, 0.0027091503143310547, 0.0036253929138183594, 0.004541635513305664, 0.005457878112792969, 0.0063741207122802734, 0.007290363311767578, 0.008206605911254883, 0.009122848510742188, 0.010039091110229492, 0.010955333709716797, 0.011871576309204102, 0.012787818908691406, 0.013704061508178711, 0.014620304107666016, 0.01553654670715332, 0.016452789306640625, 0.01736903190612793, 0.018285274505615234, 0.01920151710510254, 0.020117759704589844, 0.02103400230407715, 0.021950244903564453, 0.022866487503051758, 0.023782730102539062, 0.024698972702026367, 0.025615215301513672, 0.026531457901000977, 0.02744770050048828, 0.028363943099975586, 0.02928018569946289, 0.030196428298950195, 0.0311126708984375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 55.0, 825.0, 130.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004903407301753759, -0.0047256825491786, -0.004547957796603441, -0.004370233044028282, -0.004192508291453123, -0.004014783538877964, -0.0038370590191334486, -0.003659334499388933, -0.003481609746813774, -0.003303884994238615, -0.003126160241663456, -0.002948435489088297, -0.0027707109693437815, -0.0025929862167686224, -0.0024152614641934633, -0.002237536944448948, -0.002059811959043145, -0.001882087206467986, -0.0017043625703081489, -0.0015266378177329898, -0.0013489131815731525, -0.0011711884289979935, -0.0009934636764228344, -0.0008157390402629972, -0.0006380142876878381, -0.0004602895933203399, -0.0002825648698490113, -0.00010484014637768269, 7.288454798981547e-05, 0.00025060924235731363, 0.0004283339949324727, 0.00060605863109231, 0.000783783383667469, 0.0009615080780349672, 0.0011392327724024653, 0.0013169575249776244, 0.0014946821611374617, 0.0016724069137126207, 0.0018501316662877798, 0.0020278561860322952, 0.0022055809386074543, 0.0023833056911826134, 0.0025610304437577724, 0.0027387551963329315, 0.002916479716077447, 0.003094204468652606, 0.003271929221227765, 0.0034496537409722805, 0.0036273787263780832, 0.0038051034789532423, 0.003982827998697758, 0.004160552751272917, 0.004338277503848076, 0.004516002256423235, 0.004693727008998394, 0.004871451761573553, 0.005049176514148712, 0.005226901266723871, 0.00540462601929903, 0.005582350771874189, 0.0057600755244493484, 0.00593779981136322, 0.006115525029599667, 0.006293249316513538, 0.006470974069088697]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 7.0, 5.0, 6.0, 7.0, 11.0, 18.0, 24.0, 20.0, 19.0, 14.0, 25.0, 26.0, 38.0, 30.0, 27.0, 22.0, 30.0, 28.0, 36.0, 28.0, 29.0, 41.0, 26.0, 39.0, 31.0, 35.0, 32.0, 23.0, 27.0, 40.0, 25.0, 30.0, 28.0, 33.0, 14.0, 14.0, 16.0, 13.0, 11.0, 11.0, 10.0, 8.0, 14.0, 2.0, 6.0, 6.0, 6.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0005882382392883301, -0.0005705226212739944, -0.0005528070032596588, -0.0005350913852453232, -0.0005173757672309875, -0.0004996601492166519, -0.0004819445312023163, -0.00046422891318798065, -0.000446513295173645, -0.0004287976771593094, -0.00041108205914497375, -0.0003933664411306381, -0.0003756508231163025, -0.00035793520510196686, -0.0003402195870876312, -0.0003225039690732956, -0.00030478835105895996, -0.00028707273304462433, -0.0002693571150302887, -0.00025164149701595306, -0.00023392587900161743, -0.0002162102609872818, -0.00019849464297294617, -0.00018077902495861053, -0.0001630634069442749, -0.00014534778892993927, -0.00012763217091560364, -0.000109916552901268, -9.220093488693237e-05, -7.448531687259674e-05, -5.676969885826111e-05, -3.9054080843925476e-05, -2.1338462829589844e-05, -3.6228448152542114e-06, 1.4092773199081421e-05, 3.180839121341705e-05, 4.9524009227752686e-05, 6.723962724208832e-05, 8.495524525642395e-05, 0.00010267086327075958, 0.00012038648128509521, 0.00013810209929943085, 0.00015581771731376648, 0.0001735333353281021, 0.00019124895334243774, 0.00020896457135677338, 0.000226680189371109, 0.00024439580738544464, 0.0002621114253997803, 0.0002798270434141159, 0.00029754266142845154, 0.00031525827944278717, 0.0003329738974571228, 0.00035068951547145844, 0.00036840513348579407, 0.0003861207515001297, 0.00040383636951446533, 0.00042155198752880096, 0.0004392676055431366, 0.00045698322355747223, 0.00047469884157180786, 0.0004924144595861435, 0.0005101300776004791, 0.0005278456956148148, 0.0005455613136291504]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 8.0, 1.0, 5.0, 4.0, 9.0, 6.0, 11.0, 11.0, 10.0, 11.0, 16.0, 18.0, 21.0, 24.0, 26.0, 27.0, 37.0, 32.0, 27.0, 36.0, 36.0, 44.0, 48.0, 34.0, 43.0, 34.0, 43.0, 33.0, 44.0, 35.0, 32.0, 37.0, 26.0, 31.0, 21.0, 22.0, 18.0, 12.0, 14.0, 6.0, 8.0, 10.0, 6.0, 8.0, 9.0, 3.0, 5.0, 3.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.03125, -5.81744384765625, -5.6036376953125, -5.38983154296875, -5.176025390625, -4.96221923828125, -4.7484130859375, -4.53460693359375, -4.32080078125, -4.10699462890625, -3.8931884765625, -3.67938232421875, -3.465576171875, -3.25177001953125, -3.0379638671875, -2.82415771484375, -2.6103515625, -2.39654541015625, -2.1827392578125, -1.96893310546875, -1.755126953125, -1.54132080078125, -1.3275146484375, -1.11370849609375, -0.89990234375, -0.68609619140625, -0.4722900390625, -0.25848388671875, -0.044677734375, 0.16912841796875, 0.3829345703125, 0.59674072265625, 0.810546875, 1.02435302734375, 1.2381591796875, 1.45196533203125, 1.665771484375, 1.87957763671875, 2.0933837890625, 2.30718994140625, 2.52099609375, 2.73480224609375, 2.9486083984375, 3.16241455078125, 3.376220703125, 3.59002685546875, 3.8038330078125, 4.01763916015625, 4.2314453125, 4.44525146484375, 4.6590576171875, 4.87286376953125, 5.086669921875, 5.30047607421875, 5.5142822265625, 5.72808837890625, 5.94189453125, 6.15570068359375, 6.3695068359375, 6.58331298828125, 6.797119140625, 7.01092529296875, 7.2247314453125, 7.43853759765625, 7.65234375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 8.0, 14.0, 11.0, 16.0, 26.0, 29.0, 34.0, 54.0, 54.0, 84.0, 84.0, 112.0, 174.0, 250.0, 436.0, 843.0, 2047.0, 5594.0, 15977.0, 45917.0, 136777.0, 441136.0, 268898.0, 84166.0, 28850.0, 10120.0, 3641.0, 1376.0, 616.0, 340.0, 226.0, 159.0, 105.0, 84.0, 57.0, 40.0, 43.0, 29.0, 25.0, 21.0, 15.0, 13.0, 11.0, 11.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.002685546875, -5.78662109375, -5.570556640625, -5.3544921875, -5.138427734375, -4.92236328125, -4.706298828125, -4.490234375, -4.274169921875, -4.05810546875, -3.842041015625, -3.6259765625, -3.409912109375, -3.19384765625, -2.977783203125, -2.76171875, -2.545654296875, -2.32958984375, -2.113525390625, -1.8974609375, -1.681396484375, -1.46533203125, -1.249267578125, -1.033203125, -0.817138671875, -0.60107421875, -0.385009765625, -0.1689453125, 0.047119140625, 0.26318359375, 0.479248046875, 0.6953125, 0.911376953125, 1.12744140625, 1.343505859375, 1.5595703125, 1.775634765625, 1.99169921875, 2.207763671875, 2.423828125, 2.639892578125, 2.85595703125, 3.072021484375, 3.2880859375, 3.504150390625, 3.72021484375, 3.936279296875, 4.15234375, 4.368408203125, 4.58447265625, 4.800537109375, 5.0166015625, 5.232666015625, 5.44873046875, 5.664794921875, 5.880859375, 6.096923828125, 6.31298828125, 6.529052734375, 6.7451171875, 6.961181640625, 7.17724609375, 7.393310546875, 7.609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 3.0, 5.0, 6.0, 4.0, 8.0, 19.0, 9.0, 15.0, 12.0, 22.0, 31.0, 34.0, 27.0, 28.0, 34.0, 52.0, 53.0, 64.0, 92.0, 378.0, 1610.0, 108.0, 45.0, 52.0, 41.0, 46.0, 31.0, 33.0, 30.0, 22.0, 20.0, 16.0, 22.0, 19.0, 8.0, 5.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-25.609375, -24.859130859375, -24.10888671875, -23.358642578125, -22.6083984375, -21.858154296875, -21.10791015625, -20.357666015625, -19.607421875, -18.857177734375, -18.10693359375, -17.356689453125, -16.6064453125, -15.856201171875, -15.10595703125, -14.355712890625, -13.60546875, -12.855224609375, -12.10498046875, -11.354736328125, -10.6044921875, -9.854248046875, -9.10400390625, -8.353759765625, -7.603515625, -6.853271484375, -6.10302734375, -5.352783203125, -4.6025390625, -3.852294921875, -3.10205078125, -2.351806640625, -1.6015625, -0.851318359375, -0.10107421875, 0.649169921875, 1.3994140625, 2.149658203125, 2.89990234375, 3.650146484375, 4.400390625, 5.150634765625, 5.90087890625, 6.651123046875, 7.4013671875, 8.151611328125, 8.90185546875, 9.652099609375, 10.40234375, 11.152587890625, 11.90283203125, 12.653076171875, 13.4033203125, 14.153564453125, 14.90380859375, 15.654052734375, 16.404296875, 17.154541015625, 17.90478515625, 18.655029296875, 19.4052734375, 20.155517578125, 20.90576171875, 21.656005859375, 22.40625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 5.0, 6.0, 14.0, 6.0, 10.0, 9.0, 21.0, 22.0, 25.0, 31.0, 38.0, 53.0, 59.0, 74.0, 123.0, 169.0, 273.0, 424.0, 993.0, 5113.0, 3017120.0, 117215.0, 2033.0, 655.0, 340.0, 211.0, 153.0, 100.0, 86.0, 77.0, 44.0, 35.0, 39.0, 24.0, 20.0, 10.0, 13.0, 9.0, 12.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-64.5625, -62.75830078125, -60.9541015625, -59.14990234375, -57.345703125, -55.54150390625, -53.7373046875, -51.93310546875, -50.12890625, -48.32470703125, -46.5205078125, -44.71630859375, -42.912109375, -41.10791015625, -39.3037109375, -37.49951171875, -35.6953125, -33.89111328125, -32.0869140625, -30.28271484375, -28.478515625, -26.67431640625, -24.8701171875, -23.06591796875, -21.26171875, -19.45751953125, -17.6533203125, -15.84912109375, -14.044921875, -12.24072265625, -10.4365234375, -8.63232421875, -6.828125, -5.02392578125, -3.2197265625, -1.41552734375, 0.388671875, 2.19287109375, 3.9970703125, 5.80126953125, 7.60546875, 9.40966796875, 11.2138671875, 13.01806640625, 14.822265625, 16.62646484375, 18.4306640625, 20.23486328125, 22.0390625, 23.84326171875, 25.6474609375, 27.45166015625, 29.255859375, 31.06005859375, 32.8642578125, 34.66845703125, 36.47265625, 38.27685546875, 40.0810546875, 41.88525390625, 43.689453125, 45.49365234375, 47.2978515625, 49.10205078125, 50.90625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 442.0, 562.0, 10.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.49967193603516, -60.99116134643555, -55.48264694213867, -49.97413635253906, -44.46562194824219, -38.95711135864258, -33.44860076904297, -27.940086364746094, -22.431575775146484, -16.923063278198242, -11.414551734924316, -5.906040191650391, -0.39752769470214844, 5.110984802246094, 10.619495391845703, 16.128009796142578, 21.636520385742188, 27.14503288269043, 32.65354537963867, 38.16205596923828, 43.670570373535156, 49.179080963134766, 54.687591552734375, 60.19610595703125, 65.70462036132812, 71.213134765625, 76.72164154052734, 82.23015594482422, 87.7386703491211, 93.24717712402344, 98.75569152832031, 104.26420593261719, 109.77272033691406, 115.28123474121094, 120.78974151611328, 126.29825592041016, 131.8067626953125, 137.31527709960938, 142.82379150390625, 148.33230590820312, 153.8408203125, 159.34933471679688, 164.85784912109375, 170.36636352539062, 175.87486267089844, 181.3833770751953, 186.8918914794922, 192.40040588378906, 197.90890502929688, 203.41741943359375, 208.92593383789062, 214.4344482421875, 219.9429473876953, 225.4514617919922, 230.95997619628906, 236.46849060058594, 241.9770050048828, 247.4855194091797, 252.99403381347656, 258.5025329589844, 264.01104736328125, 269.5195617675781, 275.028076171875, 280.5365905761719, 286.04510498046875]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 7.0, 3.0, 8.0, 6.0, 11.0, 14.0, 12.0, 17.0, 19.0, 16.0, 14.0, 22.0, 19.0, 18.0, 33.0, 31.0, 38.0, 39.0, 24.0, 40.0, 43.0, 37.0, 46.0, 42.0, 23.0, 34.0, 37.0, 29.0, 28.0, 33.0, 18.0, 27.0, 32.0, 24.0, 27.0, 21.0, 17.0, 20.0, 11.0, 11.0, 10.0, 3.0, 5.0, 10.0, 7.0, 1.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0], "bins": [-53.88520431518555, -52.26403045654297, -50.64285659790039, -49.02168273925781, -47.40050506591797, -45.779335021972656, -44.15815734863281, -42.536983489990234, -40.915809631347656, -39.29463577270508, -37.6734619140625, -36.05228805541992, -34.431114196777344, -32.8099365234375, -31.188762664794922, -29.567588806152344, -27.946414947509766, -26.325241088867188, -24.70406723022461, -23.0828914642334, -21.46171760559082, -19.840543746948242, -18.21936798095703, -16.598194122314453, -14.977020263671875, -13.355846405029297, -11.734671592712402, -10.113496780395508, -8.49232292175293, -6.871149063110352, -5.249974250793457, -3.6287994384765625, -2.0076217651367188, -0.3864474296569824, 1.234726905822754, 2.8559012413024902, 4.477075576782227, 6.098249435424805, 7.719424247741699, 9.340599060058594, 10.961772918701172, 12.58294677734375, 14.204121589660645, 15.825296401977539, 17.446470260620117, 19.067644119262695, 20.688819885253906, 22.309993743896484, 23.931167602539062, 25.55234146118164, 27.17351531982422, 28.79469108581543, 30.415864944458008, 32.03704071044922, 33.6582145690918, 35.279388427734375, 36.90056228637695, 38.52173614501953, 40.14291000366211, 41.76408386230469, 43.38526153564453, 45.006431579589844, 46.62760925292969, 48.248783111572266, 49.869956970214844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 6.0, 4.0, 6.0, 2.0, 2.0, 9.0, 8.0, 13.0, 16.0, 15.0, 8.0, 17.0, 24.0, 22.0, 27.0, 20.0, 34.0, 37.0, 33.0, 38.0, 33.0, 45.0, 44.0, 41.0, 44.0, 50.0, 29.0, 41.0, 43.0, 38.0, 29.0, 27.0, 31.0, 23.0, 28.0, 13.0, 16.0, 13.0, 14.0, 12.0, 7.0, 12.0, 3.0, 8.0, 7.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.6171875, -6.38983154296875, -6.1624755859375, -5.93511962890625, -5.707763671875, -5.48040771484375, -5.2530517578125, -5.02569580078125, -4.79833984375, -4.57098388671875, -4.3436279296875, -4.11627197265625, -3.888916015625, -3.66156005859375, -3.4342041015625, -3.20684814453125, -2.9794921875, -2.75213623046875, -2.5247802734375, -2.29742431640625, -2.070068359375, -1.84271240234375, -1.6153564453125, -1.38800048828125, -1.16064453125, -0.93328857421875, -0.7059326171875, -0.47857666015625, -0.251220703125, -0.02386474609375, 0.2034912109375, 0.43084716796875, 0.658203125, 0.88555908203125, 1.1129150390625, 1.34027099609375, 1.567626953125, 1.79498291015625, 2.0223388671875, 2.24969482421875, 2.47705078125, 2.70440673828125, 2.9317626953125, 3.15911865234375, 3.386474609375, 3.61383056640625, 3.8411865234375, 4.06854248046875, 4.2958984375, 4.52325439453125, 4.7506103515625, 4.97796630859375, 5.205322265625, 5.43267822265625, 5.6600341796875, 5.88739013671875, 6.11474609375, 6.34210205078125, 6.5694580078125, 6.79681396484375, 7.024169921875, 7.25152587890625, 7.4788818359375, 7.70623779296875, 7.93359375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 4.0, 4.0, 5.0, 11.0, 9.0, 8.0, 18.0, 15.0, 14.0, 24.0, 25.0, 34.0, 35.0, 52.0, 88.0, 100.0, 138.0, 267.0, 477.0, 1594.0, 14201.0, 730152.0, 3306988.0, 132911.0, 5077.0, 930.0, 356.0, 216.0, 133.0, 68.0, 82.0, 48.0, 35.0, 33.0, 20.0, 14.0, 23.0, 16.0, 9.0, 9.0, 8.0, 7.0, 3.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.375, -22.577392578125, -21.77978515625, -20.982177734375, -20.1845703125, -19.386962890625, -18.58935546875, -17.791748046875, -16.994140625, -16.196533203125, -15.39892578125, -14.601318359375, -13.8037109375, -13.006103515625, -12.20849609375, -11.410888671875, -10.61328125, -9.815673828125, -9.01806640625, -8.220458984375, -7.4228515625, -6.625244140625, -5.82763671875, -5.030029296875, -4.232421875, -3.434814453125, -2.63720703125, -1.839599609375, -1.0419921875, -0.244384765625, 0.55322265625, 1.350830078125, 2.1484375, 2.946044921875, 3.74365234375, 4.541259765625, 5.3388671875, 6.136474609375, 6.93408203125, 7.731689453125, 8.529296875, 9.326904296875, 10.12451171875, 10.922119140625, 11.7197265625, 12.517333984375, 13.31494140625, 14.112548828125, 14.91015625, 15.707763671875, 16.50537109375, 17.302978515625, 18.1005859375, 18.898193359375, 19.69580078125, 20.493408203125, 21.291015625, 22.088623046875, 22.88623046875, 23.683837890625, 24.4814453125, 25.279052734375, 26.07666015625, 26.874267578125, 27.671875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 13.0, 5.0, 15.0, 20.0, 28.0, 30.0, 43.0, 69.0, 73.0, 119.0, 155.0, 220.0, 285.0, 384.0, 407.0, 481.0, 401.0, 342.0, 247.0, 203.0, 144.0, 100.0, 55.0, 46.0, 49.0, 26.0, 24.0, 20.0, 12.0, 8.0, 8.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6171875, -12.2010498046875, -11.784912109375, -11.3687744140625, -10.95263671875, -10.5364990234375, -10.120361328125, -9.7042236328125, -9.2880859375, -8.8719482421875, -8.455810546875, -8.0396728515625, -7.62353515625, -7.2073974609375, -6.791259765625, -6.3751220703125, -5.958984375, -5.5428466796875, -5.126708984375, -4.7105712890625, -4.29443359375, -3.8782958984375, -3.462158203125, -3.0460205078125, -2.6298828125, -2.2137451171875, -1.797607421875, -1.3814697265625, -0.96533203125, -0.5491943359375, -0.133056640625, 0.2830810546875, 0.69921875, 1.1153564453125, 1.531494140625, 1.9476318359375, 2.36376953125, 2.7799072265625, 3.196044921875, 3.6121826171875, 4.0283203125, 4.4444580078125, 4.860595703125, 5.2767333984375, 5.69287109375, 6.1090087890625, 6.525146484375, 6.9412841796875, 7.357421875, 7.7735595703125, 8.189697265625, 8.6058349609375, 9.02197265625, 9.4381103515625, 9.854248046875, 10.2703857421875, 10.6865234375, 11.1026611328125, 11.518798828125, 11.9349365234375, 12.35107421875, 12.7672119140625, 13.183349609375, 13.5994873046875, 14.015625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 7.0, 7.0, 8.0, 20.0, 17.0, 30.0, 40.0, 49.0, 50.0, 66.0, 90.0, 108.0, 126.0, 222.0, 261.0, 384.0, 647.0, 12865.0, 4121463.0, 55243.0, 912.0, 438.0, 275.0, 226.0, 172.0, 133.0, 103.0, 69.0, 68.0, 45.0, 25.0, 23.0, 20.0, 13.0, 10.0, 10.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-83.625, -81.13671875, -78.6484375, -76.16015625, -73.671875, -71.18359375, -68.6953125, -66.20703125, -63.71875, -61.23046875, -58.7421875, -56.25390625, -53.765625, -51.27734375, -48.7890625, -46.30078125, -43.8125, -41.32421875, -38.8359375, -36.34765625, -33.859375, -31.37109375, -28.8828125, -26.39453125, -23.90625, -21.41796875, -18.9296875, -16.44140625, -13.953125, -11.46484375, -8.9765625, -6.48828125, -4.0, -1.51171875, 0.9765625, 3.46484375, 5.953125, 8.44140625, 10.9296875, 13.41796875, 15.90625, 18.39453125, 20.8828125, 23.37109375, 25.859375, 28.34765625, 30.8359375, 33.32421875, 35.8125, 38.30078125, 40.7890625, 43.27734375, 45.765625, 48.25390625, 50.7421875, 53.23046875, 55.71875, 58.20703125, 60.6953125, 63.18359375, 65.671875, 68.16015625, 70.6484375, 73.13671875, 75.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 34.0, 80.0, 120.0, 168.0, 200.0, 189.0, 108.0, 55.0, 26.0, 13.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.26085662841797, -66.63582611083984, -64.01079559326172, -61.38576126098633, -58.7607307434082, -56.13570022583008, -53.51066589355469, -50.88563537597656, -48.26060485839844, -45.63557434082031, -43.01054382324219, -40.3855094909668, -37.76047897338867, -35.13544845581055, -32.510414123535156, -29.88538360595703, -27.260353088378906, -24.63532257080078, -22.010290145874023, -19.385257720947266, -16.76022720336914, -14.1351957321167, -11.510164260864258, -8.8851318359375, -6.260101318359375, -3.6350698471069336, -1.0100383758544922, 1.6149930953979492, 4.240024566650391, 6.865056037902832, 9.490087509155273, 12.115119934082031, 14.740142822265625, 17.36517333984375, 19.990205764770508, 22.615238189697266, 25.24026870727539, 27.865299224853516, 30.490331649780273, 33.11536407470703, 35.740394592285156, 38.36542510986328, 40.990455627441406, 43.6154899597168, 46.24052047729492, 48.86555099487305, 51.49058532714844, 54.11561584472656, 56.74064636230469, 59.36567687988281, 61.99070739746094, 64.61573791503906, 67.24076843261719, 69.86580657958984, 72.49083709716797, 75.1158676147461, 77.74089813232422, 80.36592864990234, 82.99095916748047, 85.6159896850586, 88.24102783203125, 90.86605834960938, 93.4910888671875, 96.11611938476562, 98.74114990234375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 8.0, 10.0, 14.0, 16.0, 22.0, 23.0, 18.0, 27.0, 30.0, 29.0, 32.0, 40.0, 30.0, 41.0, 44.0, 44.0, 39.0, 40.0, 34.0, 45.0, 49.0, 33.0, 41.0, 29.0, 21.0, 26.0, 27.0, 22.0, 20.0, 22.0, 21.0, 14.0, 11.0, 9.0, 2.0, 6.0, 7.0, 9.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.578460693359375, -40.11146545410156, -38.644474029541016, -37.1774787902832, -35.710487365722656, -34.243492126464844, -32.77649688720703, -31.309505462646484, -29.842512130737305, -28.375518798828125, -26.908525466918945, -25.441532135009766, -23.974536895751953, -22.507545471191406, -21.040550231933594, -19.573556900024414, -18.106563568115234, -16.639570236206055, -15.172576904296875, -13.705582618713379, -12.2385892868042, -10.77159595489502, -9.304601669311523, -7.837608337402344, -6.370615005493164, -4.903621673583984, -3.4366278648376465, -1.9696340560913086, -0.5026407241821289, 0.9643526077270508, 2.431346893310547, 3.8983402252197266, 5.365333557128906, 6.832326889038086, 8.299320220947266, 9.766314506530762, 11.233307838439941, 12.700301170349121, 14.167295455932617, 15.634288787841797, 17.101282119750977, 18.568275451660156, 20.035268783569336, 21.502262115478516, 22.969257354736328, 24.436248779296875, 25.903244018554688, 27.370237350463867, 28.837230682373047, 30.304224014282227, 31.771217346191406, 33.23821258544922, 34.705204010009766, 36.17219924926758, 37.639190673828125, 39.10618591308594, 40.57318115234375, 42.04017639160156, 43.50716781616211, 44.97416305541992, 46.44115447998047, 47.90814971923828, 49.375144958496094, 50.84213638305664, 52.30912780761719]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 6.0, 17.0, 11.0, 21.0, 20.0, 16.0, 16.0, 24.0, 37.0, 36.0, 43.0, 45.0, 50.0, 54.0, 38.0, 46.0, 46.0, 50.0, 47.0, 51.0, 35.0, 37.0, 41.0, 33.0, 31.0, 22.0, 18.0, 22.0, 10.0, 13.0, 7.0, 13.0, 7.0, 7.0, 10.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.7794189453125, -7.511962890625, -7.2445068359375, -6.97705078125, -6.7095947265625, -6.442138671875, -6.1746826171875, -5.9072265625, -5.6397705078125, -5.372314453125, -5.1048583984375, -4.83740234375, -4.5699462890625, -4.302490234375, -4.0350341796875, -3.767578125, -3.5001220703125, -3.232666015625, -2.9652099609375, -2.69775390625, -2.4302978515625, -2.162841796875, -1.8953857421875, -1.6279296875, -1.3604736328125, -1.093017578125, -0.8255615234375, -0.55810546875, -0.2906494140625, -0.023193359375, 0.2442626953125, 0.51171875, 0.7791748046875, 1.046630859375, 1.3140869140625, 1.58154296875, 1.8489990234375, 2.116455078125, 2.3839111328125, 2.6513671875, 2.9188232421875, 3.186279296875, 3.4537353515625, 3.72119140625, 3.9886474609375, 4.256103515625, 4.5235595703125, 4.791015625, 5.0584716796875, 5.325927734375, 5.5933837890625, 5.86083984375, 6.1282958984375, 6.395751953125, 6.6632080078125, 6.9306640625, 7.1981201171875, 7.465576171875, 7.7330322265625, 8.00048828125, 8.2679443359375, 8.535400390625, 8.8028564453125, 9.0703125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 10.0, 27.0, 33.0, 53.0, 75.0, 91.0, 182.0, 265.0, 383.0, 567.0, 881.0, 1364.0, 2079.0, 3332.0, 5083.0, 8262.0, 13789.0, 23274.0, 41377.0, 75666.0, 144572.0, 276613.0, 209175.0, 105922.0, 56878.0, 31307.0, 18109.0, 10858.0, 6676.0, 4122.0, 2599.0, 1720.0, 1104.0, 681.0, 465.0, 292.0, 224.0, 141.0, 95.0, 62.0, 53.0, 26.0, 19.0, 7.0, 13.0, 9.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.3173828125, -1.2783660888671875, -1.239349365234375, -1.2003326416015625, -1.16131591796875, -1.1222991943359375, -1.083282470703125, -1.0442657470703125, -1.0052490234375, -0.9662322998046875, -0.927215576171875, -0.8881988525390625, -0.84918212890625, -0.8101654052734375, -0.771148681640625, -0.7321319580078125, -0.693115234375, -0.6540985107421875, -0.615081787109375, -0.5760650634765625, -0.53704833984375, -0.4980316162109375, -0.459014892578125, -0.4199981689453125, -0.3809814453125, -0.3419647216796875, -0.302947998046875, -0.2639312744140625, -0.22491455078125, -0.1858978271484375, -0.146881103515625, -0.1078643798828125, -0.06884765625, -0.0298309326171875, 0.009185791015625, 0.0482025146484375, 0.08721923828125, 0.1262359619140625, 0.165252685546875, 0.2042694091796875, 0.2432861328125, 0.2823028564453125, 0.321319580078125, 0.3603363037109375, 0.39935302734375, 0.4383697509765625, 0.477386474609375, 0.5164031982421875, 0.555419921875, 0.5944366455078125, 0.633453369140625, 0.6724700927734375, 0.71148681640625, 0.7505035400390625, 0.789520263671875, 0.8285369873046875, 0.8675537109375, 0.9065704345703125, 0.945587158203125, 0.9846038818359375, 1.02362060546875, 1.0626373291015625, 1.101654052734375, 1.1406707763671875, 1.1796875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 7.0, 4.0, 13.0, 10.0, 16.0, 11.0, 12.0, 16.0, 24.0, 26.0, 18.0, 28.0, 34.0, 23.0, 39.0, 31.0, 42.0, 43.0, 47.0, 52.0, 1070.0, 59.0, 43.0, 47.0, 33.0, 34.0, 30.0, 21.0, 31.0, 18.0, 27.0, 17.0, 21.0, 6.0, 11.0, 10.0, 6.0, 10.0, 11.0, 5.0, 6.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.16070556640625, -4.0089111328125, -3.85711669921875, -3.705322265625, -3.55352783203125, -3.4017333984375, -3.24993896484375, -3.09814453125, -2.94635009765625, -2.7945556640625, -2.64276123046875, -2.490966796875, -2.33917236328125, -2.1873779296875, -2.03558349609375, -1.8837890625, -1.73199462890625, -1.5802001953125, -1.42840576171875, -1.276611328125, -1.12481689453125, -0.9730224609375, -0.82122802734375, -0.66943359375, -0.51763916015625, -0.3658447265625, -0.21405029296875, -0.062255859375, 0.08953857421875, 0.2413330078125, 0.39312744140625, 0.544921875, 0.69671630859375, 0.8485107421875, 1.00030517578125, 1.152099609375, 1.30389404296875, 1.4556884765625, 1.60748291015625, 1.75927734375, 1.91107177734375, 2.0628662109375, 2.21466064453125, 2.366455078125, 2.51824951171875, 2.6700439453125, 2.82183837890625, 2.9736328125, 3.12542724609375, 3.2772216796875, 3.42901611328125, 3.580810546875, 3.73260498046875, 3.8843994140625, 4.03619384765625, 4.18798828125, 4.33978271484375, 4.4915771484375, 4.64337158203125, 4.795166015625, 4.94696044921875, 5.0987548828125, 5.25054931640625, 5.40234375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 3.0, 7.0, 7.0, 16.0, 26.0, 24.0, 35.0, 50.0, 79.0, 116.0, 182.0, 234.0, 379.0, 567.0, 798.0, 1095.0, 1648.0, 2450.0, 3618.0, 5267.0, 7742.0, 11308.0, 16718.0, 26366.0, 42562.0, 70083.0, 124694.0, 1289563.0, 209976.0, 109761.0, 62560.0, 37747.0, 23914.0, 15293.0, 10170.0, 6928.0, 4813.0, 3264.0, 2270.0, 1451.0, 984.0, 718.0, 538.0, 342.0, 247.0, 176.0, 120.0, 80.0, 46.0, 28.0, 21.0, 20.0, 13.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.97607421875, -0.945465087890625, -0.91485595703125, -0.884246826171875, -0.8536376953125, -0.823028564453125, -0.79241943359375, -0.761810302734375, -0.731201171875, -0.700592041015625, -0.66998291015625, -0.639373779296875, -0.6087646484375, -0.578155517578125, -0.54754638671875, -0.516937255859375, -0.486328125, -0.455718994140625, -0.42510986328125, -0.394500732421875, -0.3638916015625, -0.333282470703125, -0.30267333984375, -0.272064208984375, -0.241455078125, -0.210845947265625, -0.18023681640625, -0.149627685546875, -0.1190185546875, -0.088409423828125, -0.05780029296875, -0.027191162109375, 0.00341796875, 0.034027099609375, 0.06463623046875, 0.095245361328125, 0.1258544921875, 0.156463623046875, 0.18707275390625, 0.217681884765625, 0.248291015625, 0.278900146484375, 0.30950927734375, 0.340118408203125, 0.3707275390625, 0.401336669921875, 0.43194580078125, 0.462554931640625, 0.4931640625, 0.523773193359375, 0.55438232421875, 0.584991455078125, 0.6156005859375, 0.646209716796875, 0.67681884765625, 0.707427978515625, 0.738037109375, 0.768646240234375, 0.79925537109375, 0.829864501953125, 0.8604736328125, 0.891082763671875, 0.92169189453125, 0.952301025390625, 0.98291015625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 6.0, 8.0, 10.0, 15.0, 13.0, 27.0, 42.0, 25.0, 35.0, 41.0, 34.0, 56.0, 52.0, 47.0, 52.0, 52.0, 52.0, 45.0, 51.0, 50.0, 40.0, 33.0, 31.0, 26.0, 25.0, 20.0, 18.0, 13.0, 15.0, 14.0, 2.0, 11.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010833740234375, -0.0010501593351364136, -0.0010169446468353271, -0.0009837299585342407, -0.0009505152702331543, -0.0009173005819320679, -0.0008840858936309814, -0.000850871205329895, -0.0008176565170288086, -0.0007844418287277222, -0.0007512271404266357, -0.0007180124521255493, -0.0006847977638244629, -0.0006515830755233765, -0.00061836838722229, -0.0005851536989212036, -0.0005519390106201172, -0.0005187243223190308, -0.00048550963401794434, -0.0004522949457168579, -0.0004190802574157715, -0.00038586556911468506, -0.00035265088081359863, -0.0003194361925125122, -0.0002862215042114258, -0.00025300681591033936, -0.00021979212760925293, -0.0001865774393081665, -0.00015336275100708008, -0.00012014806270599365, -8.693337440490723e-05, -5.37186861038208e-05, -2.0503997802734375e-05, 1.271069049835205e-05, 4.5925378799438477e-05, 7.91400671005249e-05, 0.00011235475540161133, 0.00014556944370269775, 0.00017878413200378418, 0.0002119988203048706, 0.00024521350860595703, 0.00027842819690704346, 0.0003116428852081299, 0.0003448575735092163, 0.00037807226181030273, 0.00041128695011138916, 0.0004445016384124756, 0.000477716326713562, 0.0005109310150146484, 0.0005441457033157349, 0.0005773603916168213, 0.0006105750799179077, 0.0006437897682189941, 0.0006770044565200806, 0.000710219144821167, 0.0007434338331222534, 0.0007766485214233398, 0.0008098632097244263, 0.0008430778980255127, 0.0008762925863265991, 0.0009095072746276855, 0.000942721962928772, 0.0009759366512298584, 0.0010091513395309448, 0.0010423660278320312]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 10.0, 8.0, 11.0, 15.0, 22.0, 23.0, 20.0, 35.0, 40.0, 53.0, 72.0, 97.0, 161.0, 330.0, 1004.0, 522379.0, 522302.0, 1045.0, 292.0, 171.0, 114.0, 88.0, 46.0, 49.0, 44.0, 28.0, 24.0, 17.0, 14.0, 5.0, 6.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02789306640625, -0.027021408081054688, -0.026149749755859375, -0.025278091430664062, -0.02440643310546875, -0.023534774780273438, -0.022663116455078125, -0.021791458129882812, -0.0209197998046875, -0.020048141479492188, -0.019176483154296875, -0.018304824829101562, -0.01743316650390625, -0.016561508178710938, -0.015689849853515625, -0.014818191528320312, -0.013946533203125, -0.013074874877929688, -0.012203216552734375, -0.011331558227539062, -0.01045989990234375, -0.009588241577148438, -0.008716583251953125, -0.007844924926757812, -0.0069732666015625, -0.0061016082763671875, -0.005229949951171875, -0.0043582916259765625, -0.00348663330078125, -0.0026149749755859375, -0.001743316650390625, -0.0008716583251953125, 0.0, 0.0008716583251953125, 0.001743316650390625, 0.0026149749755859375, 0.00348663330078125, 0.0043582916259765625, 0.005229949951171875, 0.0061016082763671875, 0.0069732666015625, 0.007844924926757812, 0.008716583251953125, 0.009588241577148438, 0.01045989990234375, 0.011331558227539062, 0.012203216552734375, 0.013074874877929688, 0.013946533203125, 0.014818191528320312, 0.015689849853515625, 0.016561508178710938, 0.01743316650390625, 0.018304824829101562, 0.019176483154296875, 0.020048141479492188, 0.0209197998046875, 0.021791458129882812, 0.022663116455078125, 0.023534774780273438, 0.02440643310546875, 0.025278091430664062, 0.026149749755859375, 0.027021408081054688, 0.02789306640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 56.0, 288.0, 465.0, 174.0, 27.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038274978287518024, -0.003754319390282035, -0.003681141184642911, -0.0036079627461731434, -0.003534784307703376, -0.0034616058692336082, -0.0033884276635944843, -0.0033152492251247168, -0.003242070786654949, -0.0031688923481851816, -0.0030957141425460577, -0.00302253570407629, -0.0029493572656065226, -0.002876178827136755, -0.002803000621497631, -0.0027298221830278635, -0.002656643744558096, -0.0025834653060883284, -0.0025102871004492044, -0.002437108661979437, -0.0023639302235096693, -0.0022907517850399017, -0.002217573579400778, -0.0021443951409310102, -0.0020712169352918863, -0.0019980384968221188, -0.001924860174767673, -0.0018516818527132273, -0.0017785034142434597, -0.001705325092189014, -0.0016321467701345682, -0.0015589683316648006, -0.001485789893195033, -0.0014126115711405873, -0.0013394331326708198, -0.001266254810616374, -0.0011930763721466064, -0.0011198980500921607, -0.001046719728037715, -0.0009735412895679474, -0.0009003628510981798, -0.0008271844708360732, -0.0007540060905739665, -0.0006808277685195208, -0.0006076493300497532, -0.0005344710079953074, -0.0004612926277332008, -0.00038811424747109413, -0.0003149358672089875, -0.00024175748694688082, -0.0001685791212366894, -9.540075552649796e-05, -2.2222375264391303e-05, 5.0956004997715354e-05, 0.00012413435615599155, 0.0001973127364180982, 0.00027049111668020487, 0.0003436694969423115, 0.0004168478772044182, 0.0004900261992588639, 0.0005632046377286315, 0.0006363829597830772, 0.0007095613400451839, 0.0007827397203072906, 0.0008559181005693972]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 8.0, 9.0, 7.0, 10.0, 17.0, 14.0, 14.0, 20.0, 28.0, 34.0, 37.0, 35.0, 40.0, 36.0, 37.0, 50.0, 38.0, 40.0, 46.0, 39.0, 43.0, 34.0, 37.0, 31.0, 20.0, 38.0, 36.0, 23.0, 24.0, 30.0, 17.0, 16.0, 19.0, 12.0, 12.0, 9.0, 11.0, 4.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0005714893341064453, -0.0005539869889616966, -0.0005364846438169479, -0.0005189822986721992, -0.0005014799535274506, -0.0004839776083827019, -0.0004664752632379532, -0.0004489729180932045, -0.0004314705729484558, -0.0004139682278037071, -0.00039646588265895844, -0.00037896353751420975, -0.00036146119236946106, -0.00034395884722471237, -0.0003264565020799637, -0.000308954156935215, -0.0002914518117904663, -0.0002739494666457176, -0.00025644712150096893, -0.00023894477635622025, -0.00022144243121147156, -0.00020394008606672287, -0.00018643774092197418, -0.0001689353957772255, -0.0001514330506324768, -0.00013393070548772812, -0.00011642836034297943, -9.892601519823074e-05, -8.142367005348206e-05, -6.392132490873337e-05, -4.641897976398468e-05, -2.8916634619235992e-05, -1.1414289474487305e-05, 6.088055670261383e-06, 2.359040081501007e-05, 4.109274595975876e-05, 5.8595091104507446e-05, 7.609743624925613e-05, 9.359978139400482e-05, 0.00011110212653875351, 0.0001286044716835022, 0.00014610681682825089, 0.00016360916197299957, 0.00018111150711774826, 0.00019861385226249695, 0.00021611619740724564, 0.00023361854255199432, 0.000251120887696743, 0.0002686232328414917, 0.0002861255779862404, 0.0003036279231309891, 0.00032113026827573776, 0.00033863261342048645, 0.00035613495856523514, 0.0003736373037099838, 0.0003911396488547325, 0.0004086419939994812, 0.0004261443391442299, 0.0004436466842889786, 0.00046114902943372726, 0.00047865137457847595, 0.0004961537197232246, 0.0005136560648679733, 0.000531158410012722, 0.0005486607551574707]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 6.0, 17.0, 11.0, 21.0, 20.0, 16.0, 16.0, 24.0, 37.0, 36.0, 43.0, 44.0, 51.0, 54.0, 38.0, 46.0, 46.0, 50.0, 47.0, 51.0, 35.0, 37.0, 41.0, 33.0, 31.0, 22.0, 18.0, 22.0, 10.0, 13.0, 7.0, 13.0, 7.0, 7.0, 10.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.7794189453125, -7.511962890625, -7.2445068359375, -6.97705078125, -6.7095947265625, -6.442138671875, -6.1746826171875, -5.9072265625, -5.6397705078125, -5.372314453125, -5.1048583984375, -4.83740234375, -4.5699462890625, -4.302490234375, -4.0350341796875, -3.767578125, -3.5001220703125, -3.232666015625, -2.9652099609375, -2.69775390625, -2.4302978515625, -2.162841796875, -1.8953857421875, -1.6279296875, -1.3604736328125, -1.093017578125, -0.8255615234375, -0.55810546875, -0.2906494140625, -0.023193359375, 0.2442626953125, 0.51171875, 0.7791748046875, 1.046630859375, 1.3140869140625, 1.58154296875, 1.8489990234375, 2.116455078125, 2.3839111328125, 2.6513671875, 2.9188232421875, 3.186279296875, 3.4537353515625, 3.72119140625, 3.9886474609375, 4.256103515625, 4.5235595703125, 4.791015625, 5.0584716796875, 5.325927734375, 5.5933837890625, 5.86083984375, 6.1282958984375, 6.395751953125, 6.6632080078125, 6.9306640625, 7.1981201171875, 7.465576171875, 7.7330322265625, 8.00048828125, 8.2679443359375, 8.535400390625, 8.8028564453125, 9.0703125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 24.0, 21.0, 34.0, 39.0, 42.0, 64.0, 93.0, 117.0, 173.0, 277.0, 488.0, 1021.0, 3452.0, 21186.0, 239299.0, 718349.0, 53454.0, 7085.0, 1546.0, 646.0, 381.0, 208.0, 155.0, 91.0, 73.0, 49.0, 42.0, 31.0, 14.0, 18.0, 16.0, 9.0, 8.0, 12.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8671875, -14.3751220703125, -13.883056640625, -13.3909912109375, -12.89892578125, -12.4068603515625, -11.914794921875, -11.4227294921875, -10.9306640625, -10.4385986328125, -9.946533203125, -9.4544677734375, -8.96240234375, -8.4703369140625, -7.978271484375, -7.4862060546875, -6.994140625, -6.5020751953125, -6.010009765625, -5.5179443359375, -5.02587890625, -4.5338134765625, -4.041748046875, -3.5496826171875, -3.0576171875, -2.5655517578125, -2.073486328125, -1.5814208984375, -1.08935546875, -0.5972900390625, -0.105224609375, 0.3868408203125, 0.87890625, 1.3709716796875, 1.863037109375, 2.3551025390625, 2.84716796875, 3.3392333984375, 3.831298828125, 4.3233642578125, 4.8154296875, 5.3074951171875, 5.799560546875, 6.2916259765625, 6.78369140625, 7.2757568359375, 7.767822265625, 8.2598876953125, 8.751953125, 9.2440185546875, 9.736083984375, 10.2281494140625, 10.72021484375, 11.2122802734375, 11.704345703125, 12.1964111328125, 12.6884765625, 13.1805419921875, 13.672607421875, 14.1646728515625, 14.65673828125, 15.1488037109375, 15.640869140625, 16.1329345703125, 16.625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 9.0, 12.0, 14.0, 13.0, 19.0, 16.0, 27.0, 38.0, 39.0, 43.0, 41.0, 58.0, 62.0, 134.0, 1802.0, 233.0, 73.0, 58.0, 44.0, 55.0, 46.0, 37.0, 30.0, 31.0, 22.0, 19.0, 21.0, 6.0, 5.0, 9.0, 6.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -32.05126953125, -31.0400390625, -30.02880859375, -29.017578125, -28.00634765625, -26.9951171875, -25.98388671875, -24.97265625, -23.96142578125, -22.9501953125, -21.93896484375, -20.927734375, -19.91650390625, -18.9052734375, -17.89404296875, -16.8828125, -15.87158203125, -14.8603515625, -13.84912109375, -12.837890625, -11.82666015625, -10.8154296875, -9.80419921875, -8.79296875, -7.78173828125, -6.7705078125, -5.75927734375, -4.748046875, -3.73681640625, -2.7255859375, -1.71435546875, -0.703125, 0.30810546875, 1.3193359375, 2.33056640625, 3.341796875, 4.35302734375, 5.3642578125, 6.37548828125, 7.38671875, 8.39794921875, 9.4091796875, 10.42041015625, 11.431640625, 12.44287109375, 13.4541015625, 14.46533203125, 15.4765625, 16.48779296875, 17.4990234375, 18.51025390625, 19.521484375, 20.53271484375, 21.5439453125, 22.55517578125, 23.56640625, 24.57763671875, 25.5888671875, 26.60009765625, 27.611328125, 28.62255859375, 29.6337890625, 30.64501953125, 31.65625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 12.0, 5.0, 9.0, 18.0, 16.0, 25.0, 33.0, 39.0, 47.0, 63.0, 104.0, 129.0, 292.0, 760.0, 17974.0, 3123176.0, 1876.0, 462.0, 202.0, 117.0, 89.0, 58.0, 46.0, 36.0, 16.0, 21.0, 11.0, 17.0, 18.0, 6.0, 9.0, 3.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-96.5625, -93.4765625, -90.390625, -87.3046875, -84.21875, -81.1328125, -78.046875, -74.9609375, -71.875, -68.7890625, -65.703125, -62.6171875, -59.53125, -56.4453125, -53.359375, -50.2734375, -47.1875, -44.1015625, -41.015625, -37.9296875, -34.84375, -31.7578125, -28.671875, -25.5859375, -22.5, -19.4140625, -16.328125, -13.2421875, -10.15625, -7.0703125, -3.984375, -0.8984375, 2.1875, 5.2734375, 8.359375, 11.4453125, 14.53125, 17.6171875, 20.703125, 23.7890625, 26.875, 29.9609375, 33.046875, 36.1328125, 39.21875, 42.3046875, 45.390625, 48.4765625, 51.5625, 54.6484375, 57.734375, 60.8203125, 63.90625, 66.9921875, 70.078125, 73.1640625, 76.25, 79.3359375, 82.421875, 85.5078125, 88.59375, 91.6796875, 94.765625, 97.8515625, 100.9375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 10.0, 36.0, 180.0, 379.0, 298.0, 93.0, 18.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.36552429199219, -84.4797592163086, -82.59400177001953, -80.70823669433594, -78.82247161865234, -76.93670654296875, -75.05094909667969, -73.1651840209961, -71.2794189453125, -69.3936538696289, -67.50789642333984, -65.62213134765625, -63.736366271972656, -61.85060501098633, -59.96484375, -58.079078674316406, -56.193321228027344, -54.307559967041016, -52.42179489135742, -50.536033630371094, -48.6502685546875, -46.76450729370117, -44.878746032714844, -42.99298095703125, -41.107215881347656, -39.22145462036133, -37.335689544677734, -35.449928283691406, -33.56416320800781, -31.678401947021484, -29.792638778686523, -27.906875610351562, -26.021114349365234, -24.135351181030273, -22.249588012695312, -20.363826751708984, -18.478063583374023, -16.592300415039062, -14.706537246704102, -12.820775032043457, -10.935011863708496, -9.049248695373535, -7.163486480712891, -5.27772331237793, -3.391960620880127, -1.5061979293823242, 0.3795652389526367, 2.2653274536132812, 4.151090621948242, 6.036853313446045, 7.922616004943848, 9.808379173278809, 11.694141387939453, 13.579904556274414, 15.465667724609375, 17.351428985595703, 19.237194061279297, 21.122957229614258, 23.00872039794922, 24.894481658935547, 26.780244827270508, 28.66600799560547, 30.55177116394043, 32.43753433227539, 34.32329559326172]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 8.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 7.0, 11.0, 9.0, 15.0, 20.0, 18.0, 27.0, 30.0, 27.0, 14.0, 38.0, 45.0, 49.0, 43.0, 32.0, 42.0, 39.0, 51.0, 33.0, 39.0, 38.0, 42.0, 38.0, 38.0, 36.0, 28.0, 24.0, 27.0, 17.0, 18.0, 15.0, 9.0, 15.0, 9.0, 5.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-75.71621704101562, -73.21619415283203, -70.7161636352539, -68.21614074707031, -65.71611022949219, -63.216087341308594, -60.716064453125, -58.21603775024414, -55.71601104736328, -53.21598434448242, -50.71595764160156, -48.21593475341797, -45.71590805053711, -43.21588134765625, -40.715858459472656, -38.2158317565918, -35.71580505371094, -33.21577835083008, -30.71575355529785, -28.215728759765625, -25.715702056884766, -23.215675354003906, -20.71565055847168, -18.215625762939453, -15.715599060058594, -13.21557331085205, -10.715547561645508, -8.215521812438965, -5.715496063232422, -3.215470314025879, -0.7154445648193359, 1.7845802307128906, 4.284599304199219, 6.784625053405762, 9.284650802612305, 11.784676551818848, 14.28470230102539, 16.78472900390625, 19.284753799438477, 21.784778594970703, 24.284805297851562, 26.784832000732422, 29.28485679626465, 31.784881591796875, 34.284908294677734, 36.784934997558594, 39.28495788574219, 41.78498458862305, 44.285011291503906, 46.785037994384766, 49.285064697265625, 51.78508758544922, 54.28511428833008, 56.78514099121094, 59.28516387939453, 61.78519058227539, 64.28521728515625, 66.78524017333984, 69.28527069091797, 71.78529357910156, 74.28532409667969, 76.78534698486328, 79.28536987304688, 81.785400390625, 84.2854232788086]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 14.0, 7.0, 10.0, 13.0, 13.0, 20.0, 21.0, 21.0, 25.0, 29.0, 25.0, 40.0, 45.0, 46.0, 49.0, 48.0, 44.0, 47.0, 55.0, 55.0, 41.0, 37.0, 40.0, 39.0, 33.0, 25.0, 34.0, 22.0, 24.0, 13.0, 10.0, 8.0, 10.0, 10.0, 14.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4560546875, -8.169921875, -7.8837890625, -7.59765625, -7.3115234375, -7.025390625, -6.7392578125, -6.453125, -6.1669921875, -5.880859375, -5.5947265625, -5.30859375, -5.0224609375, -4.736328125, -4.4501953125, -4.1640625, -3.8779296875, -3.591796875, -3.3056640625, -3.01953125, -2.7333984375, -2.447265625, -2.1611328125, -1.875, -1.5888671875, -1.302734375, -1.0166015625, -0.73046875, -0.4443359375, -0.158203125, 0.1279296875, 0.4140625, 0.7001953125, 0.986328125, 1.2724609375, 1.55859375, 1.8447265625, 2.130859375, 2.4169921875, 2.703125, 2.9892578125, 3.275390625, 3.5615234375, 3.84765625, 4.1337890625, 4.419921875, 4.7060546875, 4.9921875, 5.2783203125, 5.564453125, 5.8505859375, 6.13671875, 6.4228515625, 6.708984375, 6.9951171875, 7.28125, 7.5673828125, 7.853515625, 8.1396484375, 8.42578125, 8.7119140625, 8.998046875, 9.2841796875, 9.5703125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 11.0, 6.0, 14.0, 18.0, 24.0, 21.0, 22.0, 47.0, 56.0, 74.0, 100.0, 145.0, 244.0, 468.0, 1003.0, 2669.0, 8728.0, 41987.0, 253071.0, 1119258.0, 1793819.0, 783814.0, 152930.0, 25913.0, 6050.0, 1892.0, 811.0, 373.0, 214.0, 135.0, 93.0, 59.0, 39.0, 48.0, 36.0, 25.0, 15.0, 10.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.53125, -10.184326171875, -9.83740234375, -9.490478515625, -9.1435546875, -8.796630859375, -8.44970703125, -8.102783203125, -7.755859375, -7.408935546875, -7.06201171875, -6.715087890625, -6.3681640625, -6.021240234375, -5.67431640625, -5.327392578125, -4.98046875, -4.633544921875, -4.28662109375, -3.939697265625, -3.5927734375, -3.245849609375, -2.89892578125, -2.552001953125, -2.205078125, -1.858154296875, -1.51123046875, -1.164306640625, -0.8173828125, -0.470458984375, -0.12353515625, 0.223388671875, 0.5703125, 0.917236328125, 1.26416015625, 1.611083984375, 1.9580078125, 2.304931640625, 2.65185546875, 2.998779296875, 3.345703125, 3.692626953125, 4.03955078125, 4.386474609375, 4.7333984375, 5.080322265625, 5.42724609375, 5.774169921875, 6.12109375, 6.468017578125, 6.81494140625, 7.161865234375, 7.5087890625, 7.855712890625, 8.20263671875, 8.549560546875, 8.896484375, 9.243408203125, 9.59033203125, 9.937255859375, 10.2841796875, 10.631103515625, 10.97802734375, 11.324951171875, 11.671875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 5.0, 11.0, 11.0, 14.0, 18.0, 26.0, 29.0, 28.0, 50.0, 75.0, 93.0, 127.0, 168.0, 220.0, 281.0, 332.0, 415.0, 394.0, 405.0, 298.0, 255.0, 197.0, 165.0, 102.0, 99.0, 80.0, 56.0, 31.0, 25.0, 19.0, 16.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.0859375, -14.63232421875, -14.1787109375, -13.72509765625, -13.271484375, -12.81787109375, -12.3642578125, -11.91064453125, -11.45703125, -11.00341796875, -10.5498046875, -10.09619140625, -9.642578125, -9.18896484375, -8.7353515625, -8.28173828125, -7.828125, -7.37451171875, -6.9208984375, -6.46728515625, -6.013671875, -5.56005859375, -5.1064453125, -4.65283203125, -4.19921875, -3.74560546875, -3.2919921875, -2.83837890625, -2.384765625, -1.93115234375, -1.4775390625, -1.02392578125, -0.5703125, -0.11669921875, 0.3369140625, 0.79052734375, 1.244140625, 1.69775390625, 2.1513671875, 2.60498046875, 3.05859375, 3.51220703125, 3.9658203125, 4.41943359375, 4.873046875, 5.32666015625, 5.7802734375, 6.23388671875, 6.6875, 7.14111328125, 7.5947265625, 8.04833984375, 8.501953125, 8.95556640625, 9.4091796875, 9.86279296875, 10.31640625, 10.77001953125, 11.2236328125, 11.67724609375, 12.130859375, 12.58447265625, 13.0380859375, 13.49169921875, 13.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 15.0, 9.0, 13.0, 21.0, 27.0, 31.0, 39.0, 58.0, 67.0, 103.0, 128.0, 132.0, 187.0, 214.0, 274.0, 385.0, 685.0, 1870.0, 27807.0, 3991746.0, 164817.0, 2935.0, 860.0, 490.0, 294.0, 224.0, 203.0, 116.0, 107.0, 93.0, 69.0, 59.0, 41.0, 32.0, 31.0, 16.0, 25.0, 13.0, 8.0, 8.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-55.6875, -53.87060546875, -52.0537109375, -50.23681640625, -48.419921875, -46.60302734375, -44.7861328125, -42.96923828125, -41.15234375, -39.33544921875, -37.5185546875, -35.70166015625, -33.884765625, -32.06787109375, -30.2509765625, -28.43408203125, -26.6171875, -24.80029296875, -22.9833984375, -21.16650390625, -19.349609375, -17.53271484375, -15.7158203125, -13.89892578125, -12.08203125, -10.26513671875, -8.4482421875, -6.63134765625, -4.814453125, -2.99755859375, -1.1806640625, 0.63623046875, 2.453125, 4.27001953125, 6.0869140625, 7.90380859375, 9.720703125, 11.53759765625, 13.3544921875, 15.17138671875, 16.98828125, 18.80517578125, 20.6220703125, 22.43896484375, 24.255859375, 26.07275390625, 27.8896484375, 29.70654296875, 31.5234375, 33.34033203125, 35.1572265625, 36.97412109375, 38.791015625, 40.60791015625, 42.4248046875, 44.24169921875, 46.05859375, 47.87548828125, 49.6923828125, 51.50927734375, 53.326171875, 55.14306640625, 56.9599609375, 58.77685546875, 60.59375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 15.0, 354.0, 589.0, 54.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.98284912109375, -131.0111083984375, -121.03938293457031, -111.0676498413086, -101.09591674804688, -91.12418365478516, -81.15245056152344, -71.18071746826172, -61.208984375, -51.23725128173828, -41.26551818847656, -31.293785095214844, -21.322052001953125, -11.350318908691406, -1.3785858154296875, 8.593147277832031, 18.56488037109375, 28.53661346435547, 38.50834655761719, 48.480079650878906, 58.451812744140625, 68.42354583740234, 78.39527893066406, 88.36701202392578, 98.3387451171875, 108.31047821044922, 118.28221130371094, 128.25393676757812, 138.22567749023438, 148.19741821289062, 158.1691436767578, 168.140869140625, 178.11264038085938, 188.08438110351562, 198.0561065673828, 208.02783203125, 217.99957275390625, 227.9713134765625, 237.9430389404297, 247.91476440429688, 257.8865051269531, 267.8582458496094, 277.8299560546875, 287.80169677734375, 297.7734375, 307.74517822265625, 317.7169189453125, 327.6886291503906, 337.6603698730469, 347.6321105957031, 357.60382080078125, 367.5755615234375, 377.54730224609375, 387.51904296875, 397.49078369140625, 407.4624938964844, 417.4342346191406, 427.4059753417969, 437.377685546875, 447.34942626953125, 457.3211669921875, 467.29290771484375, 477.2646484375, 487.2363586425781, 497.2080993652344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 10.0, 6.0, 9.0, 13.0, 21.0, 18.0, 19.0, 23.0, 32.0, 23.0, 34.0, 31.0, 40.0, 40.0, 39.0, 30.0, 29.0, 44.0, 53.0, 46.0, 48.0, 36.0, 54.0, 43.0, 31.0, 21.0, 28.0, 29.0, 32.0, 17.0, 15.0, 16.0, 19.0, 10.0, 5.0, 8.0, 8.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.103248596191406, -52.46516418457031, -50.82707595825195, -49.18899154663086, -47.550907135009766, -45.912818908691406, -44.27473449707031, -42.63665008544922, -40.998565673828125, -39.36048126220703, -37.72239303588867, -36.08430862426758, -34.446224212646484, -32.808135986328125, -31.17005157470703, -29.531967163085938, -27.893878936767578, -26.25579261779785, -24.617708206176758, -22.97962188720703, -21.341537475585938, -19.70345115661621, -18.065364837646484, -16.42728042602539, -14.789194107055664, -13.151108741760254, -11.513023376464844, -9.874937057495117, -8.236851692199707, -6.598766326904297, -4.96068000793457, -3.32259464263916, -1.68450927734375, -0.04642367362976074, 1.5916619300842285, 3.229747772216797, 4.867833137512207, 6.505918502807617, 8.144004821777344, 9.782090187072754, 11.420175552368164, 13.058260917663574, 14.696346282958984, 16.33443260192871, 17.972518920898438, 19.61060333251953, 21.248689651489258, 22.886775970458984, 24.524860382080078, 26.162946701049805, 27.8010311126709, 29.439117431640625, 31.07720184326172, 32.71528625488281, 34.35337448120117, 35.991458892822266, 37.629547119140625, 39.26763153076172, 40.90571975708008, 42.54380416870117, 44.181888580322266, 45.819976806640625, 47.45806121826172, 49.09614562988281, 50.734230041503906]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 11.0, 7.0, 9.0, 14.0, 8.0, 14.0, 18.0, 16.0, 28.0, 24.0, 30.0, 32.0, 34.0, 40.0, 29.0, 40.0, 37.0, 48.0, 47.0, 40.0, 47.0, 39.0, 43.0, 47.0, 36.0, 27.0, 29.0, 29.0, 30.0, 24.0, 25.0, 19.0, 18.0, 10.0, 14.0, 1.0, 4.0, 5.0, 8.0, 4.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8660888671875, -6.614990234375, -6.3638916015625, -6.11279296875, -5.8616943359375, -5.610595703125, -5.3594970703125, -5.1083984375, -4.8572998046875, -4.606201171875, -4.3551025390625, -4.10400390625, -3.8529052734375, -3.601806640625, -3.3507080078125, -3.099609375, -2.8485107421875, -2.597412109375, -2.3463134765625, -2.09521484375, -1.8441162109375, -1.593017578125, -1.3419189453125, -1.0908203125, -0.8397216796875, -0.588623046875, -0.3375244140625, -0.08642578125, 0.1646728515625, 0.415771484375, 0.6668701171875, 0.91796875, 1.1690673828125, 1.420166015625, 1.6712646484375, 1.92236328125, 2.1734619140625, 2.424560546875, 2.6756591796875, 2.9267578125, 3.1778564453125, 3.428955078125, 3.6800537109375, 3.93115234375, 4.1822509765625, 4.433349609375, 4.6844482421875, 4.935546875, 5.1866455078125, 5.437744140625, 5.6888427734375, 5.93994140625, 6.1910400390625, 6.442138671875, 6.6932373046875, 6.9443359375, 7.1954345703125, 7.446533203125, 7.6976318359375, 7.94873046875, 8.1998291015625, 8.450927734375, 8.7020263671875, 8.953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 14.0, 14.0, 22.0, 25.0, 40.0, 70.0, 106.0, 150.0, 215.0, 372.0, 545.0, 907.0, 1336.0, 2184.0, 3377.0, 5307.0, 8857.0, 14460.0, 23564.0, 40671.0, 71661.0, 132590.0, 249448.0, 221049.0, 116208.0, 63407.0, 36278.0, 21319.0, 12980.0, 7945.0, 4881.0, 3142.0, 1955.0, 1255.0, 771.0, 501.0, 319.0, 219.0, 128.0, 79.0, 66.0, 37.0, 35.0, 19.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.3359375, -1.2976531982421875, -1.259368896484375, -1.2210845947265625, -1.18280029296875, -1.1445159912109375, -1.106231689453125, -1.0679473876953125, -1.0296630859375, -0.9913787841796875, -0.953094482421875, -0.9148101806640625, -0.87652587890625, -0.8382415771484375, -0.799957275390625, -0.7616729736328125, -0.723388671875, -0.6851043701171875, -0.646820068359375, -0.6085357666015625, -0.57025146484375, -0.5319671630859375, -0.493682861328125, -0.4553985595703125, -0.4171142578125, -0.3788299560546875, -0.340545654296875, -0.3022613525390625, -0.26397705078125, -0.2256927490234375, -0.187408447265625, -0.1491241455078125, -0.11083984375, -0.0725555419921875, -0.034271240234375, 0.0040130615234375, 0.04229736328125, 0.0805816650390625, 0.118865966796875, 0.1571502685546875, 0.1954345703125, 0.2337188720703125, 0.272003173828125, 0.3102874755859375, 0.34857177734375, 0.3868560791015625, 0.425140380859375, 0.4634246826171875, 0.501708984375, 0.5399932861328125, 0.578277587890625, 0.6165618896484375, 0.65484619140625, 0.6931304931640625, 0.731414794921875, 0.7696990966796875, 0.8079833984375, 0.8462677001953125, 0.884552001953125, 0.9228363037109375, 0.96112060546875, 0.9994049072265625, 1.037689208984375, 1.0759735107421875, 1.1142578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 3.0, 5.0, 8.0, 5.0, 5.0, 11.0, 11.0, 7.0, 7.0, 13.0, 20.0, 20.0, 24.0, 34.0, 26.0, 27.0, 29.0, 43.0, 48.0, 40.0, 55.0, 1059.0, 49.0, 39.0, 34.0, 42.0, 38.0, 44.0, 43.0, 31.0, 32.0, 27.0, 30.0, 17.0, 14.0, 22.0, 15.0, 15.0, 4.0, 4.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.89898681640625, -4.7354736328125, -4.57196044921875, -4.408447265625, -4.24493408203125, -4.0814208984375, -3.91790771484375, -3.75439453125, -3.59088134765625, -3.4273681640625, -3.26385498046875, -3.100341796875, -2.93682861328125, -2.7733154296875, -2.60980224609375, -2.4462890625, -2.28277587890625, -2.1192626953125, -1.95574951171875, -1.792236328125, -1.62872314453125, -1.4652099609375, -1.30169677734375, -1.13818359375, -0.97467041015625, -0.8111572265625, -0.64764404296875, -0.484130859375, -0.32061767578125, -0.1571044921875, 0.00640869140625, 0.169921875, 0.33343505859375, 0.4969482421875, 0.66046142578125, 0.823974609375, 0.98748779296875, 1.1510009765625, 1.31451416015625, 1.47802734375, 1.64154052734375, 1.8050537109375, 1.96856689453125, 2.132080078125, 2.29559326171875, 2.4591064453125, 2.62261962890625, 2.7861328125, 2.94964599609375, 3.1131591796875, 3.27667236328125, 3.440185546875, 3.60369873046875, 3.7672119140625, 3.93072509765625, 4.09423828125, 4.25775146484375, 4.4212646484375, 4.58477783203125, 4.748291015625, 4.91180419921875, 5.0753173828125, 5.23883056640625, 5.40234375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 6.0, 20.0, 28.0, 32.0, 63.0, 87.0, 108.0, 212.0, 259.0, 396.0, 489.0, 724.0, 1100.0, 1564.0, 2218.0, 3329.0, 4570.0, 6717.0, 10237.0, 15527.0, 23493.0, 37484.0, 62133.0, 106060.0, 188710.0, 1284503.0, 135147.0, 78568.0, 47124.0, 29231.0, 18415.0, 12321.0, 8267.0, 5600.0, 3687.0, 2715.0, 1846.0, 1276.0, 847.0, 615.0, 422.0, 280.0, 197.0, 150.0, 109.0, 74.0, 55.0, 42.0, 27.0, 11.0, 11.0, 8.0, 2.0, 3.0, 1.0, 4.0], "bins": [-1.041015625, -1.0096817016601562, -0.9783477783203125, -0.9470138549804688, -0.915679931640625, -0.8843460083007812, -0.8530120849609375, -0.8216781616210938, -0.79034423828125, -0.7590103149414062, -0.7276763916015625, -0.6963424682617188, -0.665008544921875, -0.6336746215820312, -0.6023406982421875, -0.5710067749023438, -0.5396728515625, -0.5083389282226562, -0.4770050048828125, -0.44567108154296875, -0.414337158203125, -0.38300323486328125, -0.3516693115234375, -0.32033538818359375, -0.28900146484375, -0.25766754150390625, -0.2263336181640625, -0.19499969482421875, -0.163665771484375, -0.13233184814453125, -0.1009979248046875, -0.06966400146484375, -0.038330078125, -0.00699615478515625, 0.0243377685546875, 0.05567169189453125, 0.087005615234375, 0.11833953857421875, 0.1496734619140625, 0.18100738525390625, 0.21234130859375, 0.24367523193359375, 0.2750091552734375, 0.30634307861328125, 0.337677001953125, 0.36901092529296875, 0.4003448486328125, 0.43167877197265625, 0.4630126953125, 0.49434661865234375, 0.5256805419921875, 0.5570144653320312, 0.588348388671875, 0.6196823120117188, 0.6510162353515625, 0.6823501586914062, 0.71368408203125, 0.7450180053710938, 0.7763519287109375, 0.8076858520507812, 0.839019775390625, 0.8703536987304688, 0.9016876220703125, 0.9330215454101562, 0.96435546875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 10.0, 17.0, 10.0, 20.0, 22.0, 28.0, 29.0, 44.0, 52.0, 65.0, 77.0, 71.0, 104.0, 90.0, 84.0, 60.0, 46.0, 37.0, 27.0, 32.0, 9.0, 19.0, 6.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0012826919555664062, -0.001246526837348938, -0.0012103617191314697, -0.0011741966009140015, -0.0011380314826965332, -0.001101866364479065, -0.0010657012462615967, -0.0010295361280441284, -0.0009933710098266602, -0.0009572058916091919, -0.0009210407733917236, -0.0008848756551742554, -0.0008487105369567871, -0.0008125454187393188, -0.0007763803005218506, -0.0007402151823043823, -0.0007040500640869141, -0.0006678849458694458, -0.0006317198276519775, -0.0005955547094345093, -0.000559389591217041, -0.0005232244729995728, -0.0004870593547821045, -0.00045089423656463623, -0.00041472911834716797, -0.0003785640001296997, -0.00034239888191223145, -0.0003062337636947632, -0.0002700686454772949, -0.00023390352725982666, -0.0001977384090423584, -0.00016157329082489014, -0.00012540817260742188, -8.924305438995361e-05, -5.307793617248535e-05, -1.691281795501709e-05, 1.9252300262451172e-05, 5.5417418479919434e-05, 9.15825366973877e-05, 0.00012774765491485596, 0.00016391277313232422, 0.00020007789134979248, 0.00023624300956726074, 0.000272408127784729, 0.00030857324600219727, 0.00034473836421966553, 0.0003809034824371338, 0.00041706860065460205, 0.0004532337188720703, 0.0004893988370895386, 0.0005255639553070068, 0.0005617290735244751, 0.0005978941917419434, 0.0006340593099594116, 0.0006702244281768799, 0.0007063895463943481, 0.0007425546646118164, 0.0007787197828292847, 0.0008148849010467529, 0.0008510500192642212, 0.0008872151374816895, 0.0009233802556991577, 0.000959545373916626, 0.0009957104921340942, 0.0010318756103515625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 10.0, 15.0, 29.0, 40.0, 67.0, 72.0, 96.0, 201.0, 563.0, 4000.0, 1037987.0, 4186.0, 590.0, 220.0, 131.0, 82.0, 68.0, 38.0, 32.0, 23.0, 16.0, 23.0, 8.0, 7.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022335529327392578, -0.021492958068847656, -0.020650386810302734, -0.019807815551757812, -0.01896524429321289, -0.01812267303466797, -0.017280101776123047, -0.016437530517578125, -0.015594959259033203, -0.014752388000488281, -0.01390981674194336, -0.013067245483398438, -0.012224674224853516, -0.011382102966308594, -0.010539531707763672, -0.00969696044921875, -0.008854389190673828, -0.008011817932128906, -0.007169246673583984, -0.0063266754150390625, -0.005484104156494141, -0.004641532897949219, -0.003798961639404297, -0.002956390380859375, -0.002113819122314453, -0.0012712478637695312, -0.0004286766052246094, 0.0004138946533203125, 0.0012564659118652344, 0.0020990371704101562, 0.002941608428955078, 0.0037841796875, 0.004626750946044922, 0.005469322204589844, 0.006311893463134766, 0.0071544647216796875, 0.00799703598022461, 0.008839607238769531, 0.009682178497314453, 0.010524749755859375, 0.011367321014404297, 0.012209892272949219, 0.01305246353149414, 0.013895034790039062, 0.014737606048583984, 0.015580177307128906, 0.016422748565673828, 0.01726531982421875, 0.018107891082763672, 0.018950462341308594, 0.019793033599853516, 0.020635604858398438, 0.02147817611694336, 0.02232074737548828, 0.023163318634033203, 0.024005889892578125, 0.024848461151123047, 0.02569103240966797, 0.02653360366821289, 0.027376174926757812, 0.028218746185302734, 0.029061317443847656, 0.029903888702392578, 0.0307464599609375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 52.0, 607.0, 338.0, 17.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001381020643748343, -0.0012530566891655326, -0.0011250926181674004, -0.00099712866358459, -0.0008691646507941186, -0.0007412006380036473, -0.0006132366834208369, -0.0004852726706303656, -0.0003573086578398943, -0.0002293446596013382, -0.00010138066136278212, 2.6583322323858738e-05, 0.00015454733511433005, 0.00028251134790480137, 0.00041047530248761177, 0.0005384393152780831, 0.0006664033280685544, 0.0007943673408590257, 0.000922331353649497, 0.0010502953082323074, 0.0011782592628151178, 0.00130622333381325, 0.0014341872883960605, 0.0015621513593941927, 0.001690115313977003, 0.0018180792685598135, 0.0019460433395579457, 0.002074007410556078, 0.0022019713651388884, 0.0023299353197216988, 0.002457899274304509, 0.0025858632288873196, 0.0027138274163007736, 0.002841791370883584, 0.0029697553254663944, 0.0030977195128798485, 0.003225683467462659, 0.0033536474220454693, 0.0034816113766282797, 0.00360957533121109, 0.003737539518624544, 0.0038655034732073545, 0.003993467427790165, 0.004121431615203619, 0.004249395336955786, 0.00437735952436924, 0.0045053232461214066, 0.004633287433534861, 0.004761251620948315, 0.004889215808361769, 0.0050171795301139355, 0.0051451437175273895, 0.005273107439279556, 0.00540107162669301, 0.005529035814106464, 0.005656999535858631, 0.005784963257610798, 0.005912927445024252, 0.006040891166776419, 0.006168855354189873, 0.0062968190759420395, 0.0064247832633554935, 0.006552747450768948, 0.006680711172521114, 0.006808675359934568]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 4.0, 9.0, 14.0, 12.0, 16.0, 17.0, 16.0, 18.0, 21.0, 24.0, 31.0, 23.0, 31.0, 39.0, 46.0, 43.0, 46.0, 36.0, 32.0, 41.0, 27.0, 46.0, 34.0, 44.0, 24.0, 24.0, 26.0, 31.0, 21.0, 29.0, 24.0, 26.0, 22.0, 13.0, 14.0, 10.0, 14.0, 9.0, 10.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00046628713607788086, -0.0004523731768131256, -0.00043845921754837036, -0.0004245452582836151, -0.00041063129901885986, -0.0003967173397541046, -0.00038280338048934937, -0.0003688894212245941, -0.00035497546195983887, -0.0003410615026950836, -0.00032714754343032837, -0.0003132335841655731, -0.00029931962490081787, -0.0002854056656360626, -0.0002714917063713074, -0.0002575777471065521, -0.00024366378784179688, -0.00022974982857704163, -0.00021583586931228638, -0.00020192191004753113, -0.00018800795078277588, -0.00017409399151802063, -0.00016018003225326538, -0.00014626607298851013, -0.00013235211372375488, -0.00011843815445899963, -0.00010452419519424438, -9.061023592948914e-05, -7.669627666473389e-05, -6.278231739997864e-05, -4.886835813522339e-05, -3.495439887046814e-05, -2.104043960571289e-05, -7.126480340957642e-06, 6.787478923797607e-06, 2.0701438188552856e-05, 3.4615397453308105e-05, 4.8529356718063354e-05, 6.24433159828186e-05, 7.635727524757385e-05, 9.02712345123291e-05, 0.00010418519377708435, 0.0001180991530418396, 0.00013201311230659485, 0.0001459270715713501, 0.00015984103083610535, 0.0001737549901008606, 0.00018766894936561584, 0.0002015829086303711, 0.00021549686789512634, 0.0002294108271598816, 0.00024332478642463684, 0.0002572387456893921, 0.00027115270495414734, 0.0002850666642189026, 0.00029898062348365784, 0.0003128945827484131, 0.00032680854201316833, 0.0003407225012779236, 0.00035463646054267883, 0.0003685504198074341, 0.00038246437907218933, 0.0003963783383369446, 0.00041029229760169983, 0.0004242062568664551]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 11.0, 7.0, 9.0, 14.0, 8.0, 14.0, 18.0, 16.0, 28.0, 24.0, 30.0, 32.0, 34.0, 40.0, 29.0, 40.0, 37.0, 48.0, 47.0, 40.0, 47.0, 39.0, 43.0, 47.0, 36.0, 27.0, 29.0, 29.0, 30.0, 24.0, 25.0, 19.0, 18.0, 10.0, 14.0, 1.0, 4.0, 5.0, 8.0, 4.0, 4.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8660888671875, -6.614990234375, -6.3638916015625, -6.11279296875, -5.8616943359375, -5.610595703125, -5.3594970703125, -5.1083984375, -4.8572998046875, -4.606201171875, -4.3551025390625, -4.10400390625, -3.8529052734375, -3.601806640625, -3.3507080078125, -3.099609375, -2.8485107421875, -2.597412109375, -2.3463134765625, -2.09521484375, -1.8441162109375, -1.593017578125, -1.3419189453125, -1.0908203125, -0.8397216796875, -0.588623046875, -0.3375244140625, -0.08642578125, 0.1646728515625, 0.415771484375, 0.6668701171875, 0.91796875, 1.1690673828125, 1.420166015625, 1.6712646484375, 1.92236328125, 2.1734619140625, 2.424560546875, 2.6756591796875, 2.9267578125, 3.1778564453125, 3.428955078125, 3.6800537109375, 3.93115234375, 4.1822509765625, 4.433349609375, 4.6844482421875, 4.935546875, 5.1866455078125, 5.437744140625, 5.6888427734375, 5.93994140625, 6.1910400390625, 6.442138671875, 6.6932373046875, 6.9443359375, 7.1954345703125, 7.446533203125, 7.6976318359375, 7.94873046875, 8.1998291015625, 8.450927734375, 8.7020263671875, 8.953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 7.0, 10.0, 9.0, 9.0, 14.0, 21.0, 22.0, 32.0, 49.0, 73.0, 101.0, 177.0, 333.0, 628.0, 1394.0, 3053.0, 7280.0, 17286.0, 41849.0, 109465.0, 304572.0, 346281.0, 130857.0, 49535.0, 20155.0, 8518.0, 3670.0, 1520.0, 700.0, 352.0, 196.0, 120.0, 79.0, 46.0, 32.0, 21.0, 27.0, 11.0, 12.0, 10.0, 8.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.3203125, -6.10302734375, -5.8857421875, -5.66845703125, -5.451171875, -5.23388671875, -5.0166015625, -4.79931640625, -4.58203125, -4.36474609375, -4.1474609375, -3.93017578125, -3.712890625, -3.49560546875, -3.2783203125, -3.06103515625, -2.84375, -2.62646484375, -2.4091796875, -2.19189453125, -1.974609375, -1.75732421875, -1.5400390625, -1.32275390625, -1.10546875, -0.88818359375, -0.6708984375, -0.45361328125, -0.236328125, -0.01904296875, 0.1982421875, 0.41552734375, 0.6328125, 0.85009765625, 1.0673828125, 1.28466796875, 1.501953125, 1.71923828125, 1.9365234375, 2.15380859375, 2.37109375, 2.58837890625, 2.8056640625, 3.02294921875, 3.240234375, 3.45751953125, 3.6748046875, 3.89208984375, 4.109375, 4.32666015625, 4.5439453125, 4.76123046875, 4.978515625, 5.19580078125, 5.4130859375, 5.63037109375, 5.84765625, 6.06494140625, 6.2822265625, 6.49951171875, 6.716796875, 6.93408203125, 7.1513671875, 7.36865234375, 7.5859375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 4.0, 10.0, 12.0, 7.0, 11.0, 20.0, 10.0, 13.0, 24.0, 32.0, 32.0, 40.0, 41.0, 50.0, 51.0, 68.0, 84.0, 329.0, 1609.0, 146.0, 70.0, 56.0, 40.0, 41.0, 29.0, 34.0, 32.0, 25.0, 22.0, 17.0, 18.0, 12.0, 15.0, 13.0, 7.0, 5.0, 5.0, 1.0, 5.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.171875, -25.27734375, -24.3828125, -23.48828125, -22.59375, -21.69921875, -20.8046875, -19.91015625, -19.015625, -18.12109375, -17.2265625, -16.33203125, -15.4375, -14.54296875, -13.6484375, -12.75390625, -11.859375, -10.96484375, -10.0703125, -9.17578125, -8.28125, -7.38671875, -6.4921875, -5.59765625, -4.703125, -3.80859375, -2.9140625, -2.01953125, -1.125, -0.23046875, 0.6640625, 1.55859375, 2.453125, 3.34765625, 4.2421875, 5.13671875, 6.03125, 6.92578125, 7.8203125, 8.71484375, 9.609375, 10.50390625, 11.3984375, 12.29296875, 13.1875, 14.08203125, 14.9765625, 15.87109375, 16.765625, 17.66015625, 18.5546875, 19.44921875, 20.34375, 21.23828125, 22.1328125, 23.02734375, 23.921875, 24.81640625, 25.7109375, 26.60546875, 27.5, 28.39453125, 29.2890625, 30.18359375, 31.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 11.0, 15.0, 16.0, 20.0, 15.0, 34.0, 34.0, 46.0, 65.0, 84.0, 105.0, 142.0, 199.0, 349.0, 585.0, 1842.0, 111921.0, 3011639.0, 15939.0, 1129.0, 472.0, 273.0, 189.0, 126.0, 108.0, 63.0, 65.0, 57.0, 38.0, 13.0, 23.0, 17.0, 13.0, 10.0, 11.0, 4.0, 9.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-51.28125, -49.8291015625, -48.376953125, -46.9248046875, -45.47265625, -44.0205078125, -42.568359375, -41.1162109375, -39.6640625, -38.2119140625, -36.759765625, -35.3076171875, -33.85546875, -32.4033203125, -30.951171875, -29.4990234375, -28.046875, -26.5947265625, -25.142578125, -23.6904296875, -22.23828125, -20.7861328125, -19.333984375, -17.8818359375, -16.4296875, -14.9775390625, -13.525390625, -12.0732421875, -10.62109375, -9.1689453125, -7.716796875, -6.2646484375, -4.8125, -3.3603515625, -1.908203125, -0.4560546875, 0.99609375, 2.4482421875, 3.900390625, 5.3525390625, 6.8046875, 8.2568359375, 9.708984375, 11.1611328125, 12.61328125, 14.0654296875, 15.517578125, 16.9697265625, 18.421875, 19.8740234375, 21.326171875, 22.7783203125, 24.23046875, 25.6826171875, 27.134765625, 28.5869140625, 30.0390625, 31.4912109375, 32.943359375, 34.3955078125, 35.84765625, 37.2998046875, 38.751953125, 40.2041015625, 41.65625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 26.0, 109.0, 324.0, 340.0, 176.0, 34.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.59844970703125, -63.17793655395508, -60.757423400878906, -58.336910247802734, -55.91639709472656, -53.495887756347656, -51.075374603271484, -48.65486145019531, -46.23434829711914, -43.81383514404297, -41.3933219909668, -38.972808837890625, -36.55229949951172, -34.13178253173828, -31.711273193359375, -29.290760040283203, -26.87024688720703, -24.44973373413086, -22.029220581054688, -19.60870933532715, -17.188196182250977, -14.767683029174805, -12.34717082977295, -9.926658630371094, -7.506145477294922, -5.085632801055908, -2.6651201248168945, -0.24460744857788086, 2.175905227661133, 4.596418380737305, 7.01693058013916, 9.437442779541016, 11.857955932617188, 14.27846908569336, 16.69898223876953, 19.11949348449707, 21.540006637573242, 23.960519790649414, 26.381031036376953, 28.801544189453125, 31.222057342529297, 33.64257049560547, 36.06308364868164, 38.48359680175781, 40.90410614013672, 43.324623107910156, 45.74513244628906, 48.165645599365234, 50.586158752441406, 53.00667190551758, 55.42718505859375, 57.84769821166992, 60.268211364746094, 62.688720703125, 65.10923767089844, 67.52974700927734, 69.95025634765625, 72.37076568603516, 74.7912826538086, 77.2117919921875, 79.63230895996094, 82.05281829833984, 84.47333526611328, 86.89384460449219, 89.31436157226562]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 6.0, 12.0, 16.0, 12.0, 11.0, 12.0, 19.0, 18.0, 23.0, 17.0, 31.0, 34.0, 34.0, 35.0, 32.0, 43.0, 53.0, 33.0, 35.0, 38.0, 49.0, 49.0, 31.0, 34.0, 35.0, 27.0, 26.0, 28.0, 24.0, 25.0, 21.0, 27.0, 12.0, 12.0, 10.0, 8.0, 10.0, 9.0, 7.0, 8.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.788787841796875, -57.810386657714844, -55.83198547363281, -53.85358428955078, -51.875179290771484, -49.89677810668945, -47.91837692260742, -45.93997573852539, -43.961570739746094, -41.98316955566406, -40.00476837158203, -38.0263671875, -36.0479621887207, -34.06956100463867, -32.09115982055664, -30.11275863647461, -28.134357452392578, -26.155956268310547, -24.177553176879883, -22.19915199279785, -20.220748901367188, -18.242347717285156, -16.263946533203125, -14.285544395446777, -12.30714225769043, -10.328740119934082, -8.350337982177734, -6.371936798095703, -4.3935346603393555, -2.415132522583008, -0.43673133850097656, 1.541670799255371, 3.5200729370117188, 5.498475074768066, 7.476876735687256, 9.455278396606445, 11.433680534362793, 13.41208267211914, 15.390483856201172, 17.368885040283203, 19.347288131713867, 21.3256893157959, 23.304092407226562, 25.282493591308594, 27.260894775390625, 29.23929786682129, 31.21769905090332, 33.196102142333984, 35.174503326416016, 37.15290451049805, 39.13130569458008, 41.109710693359375, 43.088111877441406, 45.06651306152344, 47.04491424560547, 49.0233154296875, 51.00171661376953, 52.98011779785156, 54.958518981933594, 56.936920166015625, 58.91532516479492, 60.89372634887695, 62.872127532958984, 64.85053253173828, 66.82893371582031]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 10.0, 11.0, 13.0, 7.0, 11.0, 9.0, 14.0, 24.0, 16.0, 17.0, 22.0, 27.0, 38.0, 40.0, 28.0, 32.0, 31.0, 45.0, 41.0, 43.0, 55.0, 29.0, 47.0, 32.0, 42.0, 33.0, 29.0, 27.0, 27.0, 26.0, 26.0, 24.0, 24.0, 19.0, 11.0, 18.0, 7.0, 10.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.46484375, -7.22210693359375, -6.9793701171875, -6.73663330078125, -6.493896484375, -6.25115966796875, -6.0084228515625, -5.76568603515625, -5.52294921875, -5.28021240234375, -5.0374755859375, -4.79473876953125, -4.552001953125, -4.30926513671875, -4.0665283203125, -3.82379150390625, -3.5810546875, -3.33831787109375, -3.0955810546875, -2.85284423828125, -2.610107421875, -2.36737060546875, -2.1246337890625, -1.88189697265625, -1.63916015625, -1.39642333984375, -1.1536865234375, -0.91094970703125, -0.668212890625, -0.42547607421875, -0.1827392578125, 0.05999755859375, 0.302734375, 0.54547119140625, 0.7882080078125, 1.03094482421875, 1.273681640625, 1.51641845703125, 1.7591552734375, 2.00189208984375, 2.24462890625, 2.48736572265625, 2.7301025390625, 2.97283935546875, 3.215576171875, 3.45831298828125, 3.7010498046875, 3.94378662109375, 4.1865234375, 4.42926025390625, 4.6719970703125, 4.91473388671875, 5.157470703125, 5.40020751953125, 5.6429443359375, 5.88568115234375, 6.12841796875, 6.37115478515625, 6.6138916015625, 6.85662841796875, 7.099365234375, 7.34210205078125, 7.5848388671875, 7.82757568359375, 8.0703125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 8.0, 10.0, 9.0, 8.0, 10.0, 13.0, 22.0, 23.0, 32.0, 44.0, 52.0, 51.0, 74.0, 78.0, 129.0, 242.0, 713.0, 5437.0, 182657.0, 3435673.0, 555938.0, 11017.0, 1104.0, 309.0, 148.0, 98.0, 73.0, 49.0, 41.0, 30.0, 36.0, 29.0, 22.0, 18.0, 16.0, 13.0, 13.0, 2.0, 4.0, 9.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.78125, -24.9111328125, -24.041015625, -23.1708984375, -22.30078125, -21.4306640625, -20.560546875, -19.6904296875, -18.8203125, -17.9501953125, -17.080078125, -16.2099609375, -15.33984375, -14.4697265625, -13.599609375, -12.7294921875, -11.859375, -10.9892578125, -10.119140625, -9.2490234375, -8.37890625, -7.5087890625, -6.638671875, -5.7685546875, -4.8984375, -4.0283203125, -3.158203125, -2.2880859375, -1.41796875, -0.5478515625, 0.322265625, 1.1923828125, 2.0625, 2.9326171875, 3.802734375, 4.6728515625, 5.54296875, 6.4130859375, 7.283203125, 8.1533203125, 9.0234375, 9.8935546875, 10.763671875, 11.6337890625, 12.50390625, 13.3740234375, 14.244140625, 15.1142578125, 15.984375, 16.8544921875, 17.724609375, 18.5947265625, 19.46484375, 20.3349609375, 21.205078125, 22.0751953125, 22.9453125, 23.8154296875, 24.685546875, 25.5556640625, 26.42578125, 27.2958984375, 28.166015625, 29.0361328125, 29.90625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 1.0, 7.0, 14.0, 13.0, 18.0, 25.0, 30.0, 53.0, 66.0, 74.0, 141.0, 167.0, 240.0, 310.0, 450.0, 467.0, 474.0, 385.0, 302.0, 219.0, 176.0, 123.0, 83.0, 75.0, 45.0, 31.0, 29.0, 17.0, 12.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -14.1453857421875, -13.673583984375, -13.2017822265625, -12.72998046875, -12.2581787109375, -11.786376953125, -11.3145751953125, -10.8427734375, -10.3709716796875, -9.899169921875, -9.4273681640625, -8.95556640625, -8.4837646484375, -8.011962890625, -7.5401611328125, -7.068359375, -6.5965576171875, -6.124755859375, -5.6529541015625, -5.18115234375, -4.7093505859375, -4.237548828125, -3.7657470703125, -3.2939453125, -2.8221435546875, -2.350341796875, -1.8785400390625, -1.40673828125, -0.9349365234375, -0.463134765625, 0.0086669921875, 0.48046875, 0.9522705078125, 1.424072265625, 1.8958740234375, 2.36767578125, 2.8394775390625, 3.311279296875, 3.7830810546875, 4.2548828125, 4.7266845703125, 5.198486328125, 5.6702880859375, 6.14208984375, 6.6138916015625, 7.085693359375, 7.5574951171875, 8.029296875, 8.5010986328125, 8.972900390625, 9.4447021484375, 9.91650390625, 10.3883056640625, 10.860107421875, 11.3319091796875, 11.8037109375, 12.2755126953125, 12.747314453125, 13.2191162109375, 13.69091796875, 14.1627197265625, 14.634521484375, 15.1063232421875, 15.578125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 11.0, 9.0, 9.0, 14.0, 17.0, 16.0, 40.0, 35.0, 52.0, 66.0, 92.0, 116.0, 159.0, 248.0, 311.0, 639.0, 3006.0, 1601941.0, 2581869.0, 3675.0, 677.0, 364.0, 217.0, 177.0, 119.0, 94.0, 70.0, 56.0, 45.0, 32.0, 28.0, 19.0, 17.0, 8.0, 6.0, 7.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0], "bins": [-98.375, -95.91748046875, -93.4599609375, -91.00244140625, -88.544921875, -86.08740234375, -83.6298828125, -81.17236328125, -78.71484375, -76.25732421875, -73.7998046875, -71.34228515625, -68.884765625, -66.42724609375, -63.9697265625, -61.51220703125, -59.0546875, -56.59716796875, -54.1396484375, -51.68212890625, -49.224609375, -46.76708984375, -44.3095703125, -41.85205078125, -39.39453125, -36.93701171875, -34.4794921875, -32.02197265625, -29.564453125, -27.10693359375, -24.6494140625, -22.19189453125, -19.734375, -17.27685546875, -14.8193359375, -12.36181640625, -9.904296875, -7.44677734375, -4.9892578125, -2.53173828125, -0.07421875, 2.38330078125, 4.8408203125, 7.29833984375, 9.755859375, 12.21337890625, 14.6708984375, 17.12841796875, 19.5859375, 22.04345703125, 24.5009765625, 26.95849609375, 29.416015625, 31.87353515625, 34.3310546875, 36.78857421875, 39.24609375, 41.70361328125, 44.1611328125, 46.61865234375, 49.076171875, 51.53369140625, 53.9912109375, 56.44873046875, 58.90625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 40.0, 104.0, 222.0, 273.0, 206.0, 97.0, 48.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.93165588378906, -39.5295524597168, -36.12744903564453, -32.725341796875, -29.323240280151367, -25.9211368560791, -22.519031524658203, -19.116928100585938, -15.714824676513672, -12.312721252441406, -8.910616874694824, -5.508512496948242, -2.1064090728759766, 1.295694351196289, 4.6977996826171875, 8.099903106689453, 11.502006530761719, 14.904109954833984, 18.30621337890625, 21.70831871032715, 25.110422134399414, 28.51252555847168, 31.914630889892578, 35.316734313964844, 38.71883773803711, 42.120941162109375, 45.52304458618164, 48.925148010253906, 52.32725524902344, 55.72935485839844, 59.13146209716797, 62.533565521240234, 65.9356689453125, 69.33777618408203, 72.73987579345703, 76.14198303222656, 79.54408264160156, 82.9461898803711, 86.34829711914062, 89.75039672851562, 93.15249633789062, 96.55460357666016, 99.95670318603516, 103.35881042480469, 106.76091003417969, 110.16301727294922, 113.56512451171875, 116.96722412109375, 120.36933135986328, 123.77143859863281, 127.17353820800781, 130.5756378173828, 133.97775268554688, 137.37985229492188, 140.78195190429688, 144.18405151367188, 147.58616638183594, 150.98826599121094, 154.390380859375, 157.79248046875, 161.194580078125, 164.5966796875, 167.99879455566406, 171.40089416503906, 174.80299377441406]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 1.0, 4.0, 6.0, 10.0, 4.0, 14.0, 19.0, 21.0, 28.0, 27.0, 39.0, 33.0, 38.0, 40.0, 34.0, 38.0, 41.0, 56.0, 48.0, 38.0, 50.0, 52.0, 48.0, 41.0, 37.0, 27.0, 30.0, 26.0, 35.0, 14.0, 17.0, 16.0, 15.0, 13.0, 11.0, 6.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-61.08990478515625, -59.3248291015625, -57.55975341796875, -55.794673919677734, -54.029598236083984, -52.264522552490234, -50.49944305419922, -48.73436737060547, -46.96929168701172, -45.20421600341797, -43.43914031982422, -41.6740608215332, -39.90898513793945, -38.1439094543457, -36.37882995605469, -34.61375427246094, -32.84867858886719, -31.083602905273438, -29.318525314331055, -27.553447723388672, -25.788372039794922, -24.023296356201172, -22.25821876525879, -20.493141174316406, -18.728065490722656, -16.962989807128906, -15.197912216186523, -13.432835578918457, -11.66775894165039, -9.902682304382324, -8.137605667114258, -6.372529029846191, -4.607452392578125, -2.8423757553100586, -1.0772991180419922, 0.6877775192260742, 2.4528541564941406, 4.217930793762207, 5.983007431030273, 7.74808406829834, 9.513160705566406, 11.278237342834473, 13.043313980102539, 14.808390617370605, 16.573467254638672, 18.338542938232422, 20.103620529174805, 21.868698120117188, 23.633773803710938, 25.398849487304688, 27.16392707824707, 28.929004669189453, 30.694080352783203, 32.45915603637695, 34.22423553466797, 35.98931121826172, 37.75438690185547, 39.51946258544922, 41.28453826904297, 43.049617767333984, 44.814693450927734, 46.579769134521484, 48.3448486328125, 50.10992431640625, 51.875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 11.0, 11.0, 12.0, 20.0, 18.0, 24.0, 19.0, 23.0, 25.0, 37.0, 31.0, 37.0, 46.0, 25.0, 46.0, 41.0, 51.0, 44.0, 31.0, 48.0, 47.0, 38.0, 26.0, 27.0, 33.0, 38.0, 19.0, 24.0, 20.0, 19.0, 16.0, 17.0, 16.0, 10.0, 9.0, 0.0, 7.0, 6.0, 7.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.12835693359375, -6.8778076171875, -6.62725830078125, -6.376708984375, -6.12615966796875, -5.8756103515625, -5.62506103515625, -5.37451171875, -5.12396240234375, -4.8734130859375, -4.62286376953125, -4.372314453125, -4.12176513671875, -3.8712158203125, -3.62066650390625, -3.3701171875, -3.11956787109375, -2.8690185546875, -2.61846923828125, -2.367919921875, -2.11737060546875, -1.8668212890625, -1.61627197265625, -1.36572265625, -1.11517333984375, -0.8646240234375, -0.61407470703125, -0.363525390625, -0.11297607421875, 0.1375732421875, 0.38812255859375, 0.638671875, 0.88922119140625, 1.1397705078125, 1.39031982421875, 1.640869140625, 1.89141845703125, 2.1419677734375, 2.39251708984375, 2.64306640625, 2.89361572265625, 3.1441650390625, 3.39471435546875, 3.645263671875, 3.89581298828125, 4.1463623046875, 4.39691162109375, 4.6474609375, 4.89801025390625, 5.1485595703125, 5.39910888671875, 5.649658203125, 5.90020751953125, 6.1507568359375, 6.40130615234375, 6.65185546875, 6.90240478515625, 7.1529541015625, 7.40350341796875, 7.654052734375, 7.90460205078125, 8.1551513671875, 8.40570068359375, 8.65625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 20.0, 18.0, 32.0, 53.0, 90.0, 154.0, 226.0, 347.0, 474.0, 720.0, 1136.0, 1723.0, 2558.0, 3864.0, 5706.0, 8766.0, 13333.0, 20703.0, 32873.0, 53354.0, 89602.0, 157873.0, 248847.0, 162942.0, 92391.0, 54832.0, 33978.0, 21295.0, 13804.0, 9071.0, 5965.0, 3924.0, 2621.0, 1797.0, 1180.0, 791.0, 527.0, 316.0, 211.0, 148.0, 101.0, 68.0, 42.0, 29.0, 8.0, 12.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0274658203125, -0.991455078125, -0.9554443359375, -0.91943359375, -0.8834228515625, -0.847412109375, -0.8114013671875, -0.775390625, -0.7393798828125, -0.703369140625, -0.6673583984375, -0.63134765625, -0.5953369140625, -0.559326171875, -0.5233154296875, -0.4873046875, -0.4512939453125, -0.415283203125, -0.3792724609375, -0.34326171875, -0.3072509765625, -0.271240234375, -0.2352294921875, -0.19921875, -0.1632080078125, -0.127197265625, -0.0911865234375, -0.05517578125, -0.0191650390625, 0.016845703125, 0.0528564453125, 0.0888671875, 0.1248779296875, 0.160888671875, 0.1968994140625, 0.23291015625, 0.2689208984375, 0.304931640625, 0.3409423828125, 0.376953125, 0.4129638671875, 0.448974609375, 0.4849853515625, 0.52099609375, 0.5570068359375, 0.593017578125, 0.6290283203125, 0.6650390625, 0.7010498046875, 0.737060546875, 0.7730712890625, 0.80908203125, 0.8450927734375, 0.881103515625, 0.9171142578125, 0.953125, 0.9891357421875, 1.025146484375, 1.0611572265625, 1.09716796875, 1.1331787109375, 1.169189453125, 1.2052001953125, 1.2412109375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 8.0, 2.0, 8.0, 8.0, 13.0, 19.0, 23.0, 16.0, 18.0, 20.0, 11.0, 24.0, 35.0, 29.0, 24.0, 28.0, 22.0, 40.0, 37.0, 29.0, 31.0, 1062.0, 31.0, 39.0, 30.0, 23.0, 28.0, 39.0, 33.0, 31.0, 36.0, 24.0, 21.0, 27.0, 20.0, 24.0, 20.0, 11.0, 16.0, 6.0, 7.0, 5.0, 11.0, 8.0, 4.0, 5.0, 7.0, 1.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0], "bins": [-4.24609375, -4.11328125, -3.98046875, -3.84765625, -3.71484375, -3.58203125, -3.44921875, -3.31640625, -3.18359375, -3.05078125, -2.91796875, -2.78515625, -2.65234375, -2.51953125, -2.38671875, -2.25390625, -2.12109375, -1.98828125, -1.85546875, -1.72265625, -1.58984375, -1.45703125, -1.32421875, -1.19140625, -1.05859375, -0.92578125, -0.79296875, -0.66015625, -0.52734375, -0.39453125, -0.26171875, -0.12890625, 0.00390625, 0.13671875, 0.26953125, 0.40234375, 0.53515625, 0.66796875, 0.80078125, 0.93359375, 1.06640625, 1.19921875, 1.33203125, 1.46484375, 1.59765625, 1.73046875, 1.86328125, 1.99609375, 2.12890625, 2.26171875, 2.39453125, 2.52734375, 2.66015625, 2.79296875, 2.92578125, 3.05859375, 3.19140625, 3.32421875, 3.45703125, 3.58984375, 3.72265625, 3.85546875, 3.98828125, 4.12109375, 4.25390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 6.0, 14.0, 22.0, 25.0, 36.0, 55.0, 69.0, 90.0, 122.0, 165.0, 257.0, 358.0, 446.0, 633.0, 927.0, 1282.0, 1756.0, 2482.0, 3572.0, 4936.0, 7093.0, 9871.0, 13976.0, 20787.0, 30082.0, 45195.0, 68498.0, 105054.0, 168149.0, 1244024.0, 122510.0, 79024.0, 52363.0, 34735.0, 23582.0, 16330.0, 11154.0, 7927.0, 5497.0, 3935.0, 2893.0, 2008.0, 1481.0, 1069.0, 763.0, 527.0, 374.0, 290.0, 213.0, 141.0, 120.0, 64.0, 63.0, 35.0, 22.0, 17.0, 3.0, 4.0, 11.0, 3.0, 2.0, 1.0], "bins": [-0.81298828125, -0.7869110107421875, -0.760833740234375, -0.7347564697265625, -0.70867919921875, -0.6826019287109375, -0.656524658203125, -0.6304473876953125, -0.6043701171875, -0.5782928466796875, -0.552215576171875, -0.5261383056640625, -0.50006103515625, -0.4739837646484375, -0.447906494140625, -0.4218292236328125, -0.395751953125, -0.3696746826171875, -0.343597412109375, -0.3175201416015625, -0.29144287109375, -0.2653656005859375, -0.239288330078125, -0.2132110595703125, -0.1871337890625, -0.1610565185546875, -0.134979248046875, -0.1089019775390625, -0.08282470703125, -0.0567474365234375, -0.030670166015625, -0.0045928955078125, 0.021484375, 0.0475616455078125, 0.073638916015625, 0.0997161865234375, 0.12579345703125, 0.1518707275390625, 0.177947998046875, 0.2040252685546875, 0.2301025390625, 0.2561798095703125, 0.282257080078125, 0.3083343505859375, 0.33441162109375, 0.3604888916015625, 0.386566162109375, 0.4126434326171875, 0.438720703125, 0.4647979736328125, 0.490875244140625, 0.5169525146484375, 0.54302978515625, 0.5691070556640625, 0.595184326171875, 0.6212615966796875, 0.6473388671875, 0.6734161376953125, 0.699493408203125, 0.7255706787109375, 0.75164794921875, 0.7777252197265625, 0.803802490234375, 0.8298797607421875, 0.85595703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 15.0, 13.0, 18.0, 29.0, 43.0, 34.0, 47.0, 51.0, 69.0, 75.0, 81.0, 84.0, 65.0, 65.0, 61.0, 37.0, 36.0, 33.0, 29.0, 21.0, 15.0, 16.0, 11.0, 5.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012693405151367188, -0.001221880316734314, -0.0011744201183319092, -0.0011269599199295044, -0.0010794997215270996, -0.0010320395231246948, -0.00098457932472229, -0.0009371191263198853, -0.0008896589279174805, -0.0008421987295150757, -0.0007947385311126709, -0.0007472783327102661, -0.0006998181343078613, -0.0006523579359054565, -0.0006048977375030518, -0.000557437539100647, -0.0005099773406982422, -0.0004625171422958374, -0.0004150569438934326, -0.00036759674549102783, -0.00032013654708862305, -0.00027267634868621826, -0.00022521615028381348, -0.0001777559518814087, -0.0001302957534790039, -8.283555507659912e-05, -3.5375356674194336e-05, 1.208484172821045e-05, 5.9545040130615234e-05, 0.00010700523853302002, 0.0001544654369354248, 0.0002019256353378296, 0.0002493858337402344, 0.00029684603214263916, 0.00034430623054504395, 0.00039176642894744873, 0.0004392266273498535, 0.0004866868257522583, 0.0005341470241546631, 0.0005816072225570679, 0.0006290674209594727, 0.0006765276193618774, 0.0007239878177642822, 0.000771448016166687, 0.0008189082145690918, 0.0008663684129714966, 0.0009138286113739014, 0.0009612888097763062, 0.001008749008178711, 0.0010562092065811157, 0.0011036694049835205, 0.0011511296033859253, 0.00119858980178833, 0.0012460500001907349, 0.0012935101985931396, 0.0013409703969955444, 0.0013884305953979492, 0.001435890793800354, 0.0014833509922027588, 0.0015308111906051636, 0.0015782713890075684, 0.0016257315874099731, 0.001673191785812378, 0.0017206519842147827, 0.0017681121826171875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 9.0, 5.0, 8.0, 14.0, 20.0, 22.0, 48.0, 50.0, 63.0, 100.0, 128.0, 255.0, 661.0, 10827.0, 1033899.0, 1442.0, 410.0, 181.0, 116.0, 83.0, 57.0, 38.0, 22.0, 15.0, 20.0, 13.0, 9.0, 7.0, 4.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036285400390625, -0.035195350646972656, -0.03410530090332031, -0.03301525115966797, -0.031925201416015625, -0.03083515167236328, -0.029745101928710938, -0.028655052185058594, -0.02756500244140625, -0.026474952697753906, -0.025384902954101562, -0.02429485321044922, -0.023204803466796875, -0.02211475372314453, -0.021024703979492188, -0.019934654235839844, -0.0188446044921875, -0.017754554748535156, -0.016664505004882812, -0.015574455261230469, -0.014484405517578125, -0.013394355773925781, -0.012304306030273438, -0.011214256286621094, -0.01012420654296875, -0.009034156799316406, -0.007944107055664062, -0.006854057312011719, -0.005764007568359375, -0.004673957824707031, -0.0035839080810546875, -0.0024938583374023438, -0.00140380859375, -0.00031375885009765625, 0.0007762908935546875, 0.0018663406372070312, 0.002956390380859375, 0.004046440124511719, 0.0051364898681640625, 0.006226539611816406, 0.00731658935546875, 0.008406639099121094, 0.009496688842773438, 0.010586738586425781, 0.011676788330078125, 0.012766838073730469, 0.013856887817382812, 0.014946937561035156, 0.0160369873046875, 0.017127037048339844, 0.018217086791992188, 0.01930713653564453, 0.020397186279296875, 0.02148723602294922, 0.022577285766601562, 0.023667335510253906, 0.02475738525390625, 0.025847434997558594, 0.026937484741210938, 0.02802753448486328, 0.029117584228515625, 0.03020763397216797, 0.03129768371582031, 0.032387733459472656, 0.033477783203125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 71.0, 266.0, 411.0, 198.0, 49.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003533209441229701, -0.0034657451324164867, -0.0033982808236032724, -0.003330816514790058, -0.003263352205976844, -0.0031958878971636295, -0.0031284235883504152, -0.003060959279537201, -0.0029934949707239866, -0.0029260306619107723, -0.002858566353097558, -0.0027911020442843437, -0.0027236377354711294, -0.002656173426657915, -0.002588709117844701, -0.0025212448090314865, -0.002453780500218272, -0.002386316191405058, -0.0023188518825918436, -0.0022513875737786293, -0.002183923264965415, -0.0021164589561522007, -0.0020489946473389864, -0.001981530338525772, -0.0019140660297125578, -0.0018466017208993435, -0.0017791374120861292, -0.0017116731032729149, -0.0016442087944597006, -0.0015767444856464863, -0.001509280176833272, -0.0014418158680200577, -0.0013743514427915215, -0.0013068871339783072, -0.001239422825165093, -0.0011719585163518786, -0.0011044942075386643, -0.00103702989872545, -0.0009695655899122357, -0.0009021012810990214, -0.0008346369722858071, -0.0007671726634725928, -0.0006997083546593785, -0.0006322440458461642, -0.0005647797370329499, -0.0004973154282197356, -0.0004298511194065213, -0.000362386810593307, -0.0002949225017800927, -0.00022745819296687841, -0.0001599938841536641, -9.252957534044981e-05, -2.5065266527235508e-05, 4.2399042285978794e-05, 0.0001098633510991931, 0.0001773276599124074, 0.0002447919687256217, 0.000312256277538836, 0.0003797205863520503, 0.0004471848951652646, 0.0005146492039784789, 0.0005821135127916932, 0.0006495778216049075, 0.0007170421304181218, 0.0007845064392313361]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 10.0, 8.0, 12.0, 17.0, 8.0, 19.0, 20.0, 23.0, 35.0, 32.0, 31.0, 31.0, 25.0, 31.0, 31.0, 34.0, 44.0, 30.0, 40.0, 37.0, 36.0, 39.0, 37.0, 40.0, 34.0, 32.0, 36.0, 19.0, 18.0, 27.0, 24.0, 18.0, 20.0, 9.0, 13.0, 17.0, 9.0, 8.0, 11.0, 5.0, 6.0, 5.0, 3.0, 2.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006362199783325195, -0.0006170328706502914, -0.0005978457629680634, -0.0005786586552858353, -0.0005594715476036072, -0.0005402844399213791, -0.000521097332239151, -0.0005019102245569229, -0.0004827231168746948, -0.00046353600919246674, -0.00044434890151023865, -0.00042516179382801056, -0.00040597468614578247, -0.0003867875784635544, -0.0003676004707813263, -0.0003484133630990982, -0.0003292262554168701, -0.00031003914773464203, -0.00029085204005241394, -0.00027166493237018585, -0.00025247782468795776, -0.00023329071700572968, -0.0002141036093235016, -0.0001949165016412735, -0.0001757293939590454, -0.00015654228627681732, -0.00013735517859458923, -0.00011816807091236115, -9.898096323013306e-05, -7.979385554790497e-05, -6.060674786567688e-05, -4.141964018344879e-05, -2.2232532501220703e-05, -3.0454248189926147e-06, 1.6141682863235474e-05, 3.532879054546356e-05, 5.451589822769165e-05, 7.370300590991974e-05, 9.289011359214783e-05, 0.00011207722127437592, 0.000131264328956604, 0.0001504514366388321, 0.00016963854432106018, 0.00018882565200328827, 0.00020801275968551636, 0.00022719986736774445, 0.00024638697504997253, 0.0002655740827322006, 0.0002847611904144287, 0.0003039482980966568, 0.0003231354057788849, 0.000342322513461113, 0.00036150962114334106, 0.00038069672882556915, 0.00039988383650779724, 0.00041907094419002533, 0.0004382580518722534, 0.0004574451595544815, 0.0004766322672367096, 0.0004958193749189377, 0.0005150064826011658, 0.0005341935902833939, 0.000553380697965622, 0.00057256780564785, 0.0005917549133300781]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 11.0, 11.0, 12.0, 20.0, 18.0, 24.0, 19.0, 23.0, 25.0, 37.0, 31.0, 37.0, 46.0, 25.0, 46.0, 41.0, 51.0, 44.0, 31.0, 48.0, 47.0, 38.0, 26.0, 27.0, 33.0, 38.0, 19.0, 24.0, 20.0, 19.0, 16.0, 17.0, 16.0, 10.0, 9.0, 0.0, 7.0, 6.0, 7.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.12835693359375, -6.8778076171875, -6.62725830078125, -6.376708984375, -6.12615966796875, -5.8756103515625, -5.62506103515625, -5.37451171875, -5.12396240234375, -4.8734130859375, -4.62286376953125, -4.372314453125, -4.12176513671875, -3.8712158203125, -3.62066650390625, -3.3701171875, -3.11956787109375, -2.8690185546875, -2.61846923828125, -2.367919921875, -2.11737060546875, -1.8668212890625, -1.61627197265625, -1.36572265625, -1.11517333984375, -0.8646240234375, -0.61407470703125, -0.363525390625, -0.11297607421875, 0.1375732421875, 0.38812255859375, 0.638671875, 0.88922119140625, 1.1397705078125, 1.39031982421875, 1.640869140625, 1.89141845703125, 2.1419677734375, 2.39251708984375, 2.64306640625, 2.89361572265625, 3.1441650390625, 3.39471435546875, 3.645263671875, 3.89581298828125, 4.1463623046875, 4.39691162109375, 4.6474609375, 4.89801025390625, 5.1485595703125, 5.39910888671875, 5.649658203125, 5.90020751953125, 6.1507568359375, 6.40130615234375, 6.65185546875, 6.90240478515625, 7.1529541015625, 7.40350341796875, 7.654052734375, 7.90460205078125, 8.1551513671875, 8.40570068359375, 8.65625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 8.0, 6.0, 12.0, 12.0, 22.0, 26.0, 25.0, 38.0, 40.0, 51.0, 77.0, 127.0, 142.0, 208.0, 325.0, 595.0, 1955.0, 10546.0, 88083.0, 700287.0, 217075.0, 23139.0, 3531.0, 906.0, 399.0, 247.0, 191.0, 121.0, 77.0, 74.0, 46.0, 36.0, 26.0, 28.0, 18.0, 10.0, 12.0, 3.0, 9.0, 4.0, 7.0, 4.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5390625, -14.0494384765625, -13.559814453125, -13.0701904296875, -12.58056640625, -12.0909423828125, -11.601318359375, -11.1116943359375, -10.6220703125, -10.1324462890625, -9.642822265625, -9.1531982421875, -8.66357421875, -8.1739501953125, -7.684326171875, -7.1947021484375, -6.705078125, -6.2154541015625, -5.725830078125, -5.2362060546875, -4.74658203125, -4.2569580078125, -3.767333984375, -3.2777099609375, -2.7880859375, -2.2984619140625, -1.808837890625, -1.3192138671875, -0.82958984375, -0.3399658203125, 0.149658203125, 0.6392822265625, 1.12890625, 1.6185302734375, 2.108154296875, 2.5977783203125, 3.08740234375, 3.5770263671875, 4.066650390625, 4.5562744140625, 5.0458984375, 5.5355224609375, 6.025146484375, 6.5147705078125, 7.00439453125, 7.4940185546875, 7.983642578125, 8.4732666015625, 8.962890625, 9.4525146484375, 9.942138671875, 10.4317626953125, 10.92138671875, 11.4110107421875, 11.900634765625, 12.3902587890625, 12.8798828125, 13.3695068359375, 13.859130859375, 14.3487548828125, 14.83837890625, 15.3280029296875, 15.817626953125, 16.3072509765625, 16.796875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 9.0, 6.0, 17.0, 11.0, 19.0, 14.0, 17.0, 14.0, 25.0, 32.0, 28.0, 34.0, 38.0, 40.0, 45.0, 69.0, 147.0, 433.0, 1434.0, 121.0, 69.0, 38.0, 46.0, 32.0, 42.0, 24.0, 37.0, 30.0, 21.0, 12.0, 17.0, 22.0, 19.0, 12.0, 10.0, 8.0, 10.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-25.90625, -25.166748046875, -24.42724609375, -23.687744140625, -22.9482421875, -22.208740234375, -21.46923828125, -20.729736328125, -19.990234375, -19.250732421875, -18.51123046875, -17.771728515625, -17.0322265625, -16.292724609375, -15.55322265625, -14.813720703125, -14.07421875, -13.334716796875, -12.59521484375, -11.855712890625, -11.1162109375, -10.376708984375, -9.63720703125, -8.897705078125, -8.158203125, -7.418701171875, -6.67919921875, -5.939697265625, -5.2001953125, -4.460693359375, -3.72119140625, -2.981689453125, -2.2421875, -1.502685546875, -0.76318359375, -0.023681640625, 0.7158203125, 1.455322265625, 2.19482421875, 2.934326171875, 3.673828125, 4.413330078125, 5.15283203125, 5.892333984375, 6.6318359375, 7.371337890625, 8.11083984375, 8.850341796875, 9.58984375, 10.329345703125, 11.06884765625, 11.808349609375, 12.5478515625, 13.287353515625, 14.02685546875, 14.766357421875, 15.505859375, 16.245361328125, 16.98486328125, 17.724365234375, 18.4638671875, 19.203369140625, 19.94287109375, 20.682373046875, 21.421875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 6.0, 8.0, 7.0, 10.0, 12.0, 13.0, 28.0, 25.0, 25.0, 28.0, 53.0, 77.0, 74.0, 112.0, 161.0, 296.0, 589.0, 2485.0, 337060.0, 2798192.0, 4605.0, 838.0, 312.0, 179.0, 122.0, 94.0, 55.0, 54.0, 35.0, 23.0, 26.0, 17.0, 16.0, 11.0, 11.0, 12.0, 6.0, 6.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.59375, -57.73828125, -55.8828125, -54.02734375, -52.171875, -50.31640625, -48.4609375, -46.60546875, -44.75, -42.89453125, -41.0390625, -39.18359375, -37.328125, -35.47265625, -33.6171875, -31.76171875, -29.90625, -28.05078125, -26.1953125, -24.33984375, -22.484375, -20.62890625, -18.7734375, -16.91796875, -15.0625, -13.20703125, -11.3515625, -9.49609375, -7.640625, -5.78515625, -3.9296875, -2.07421875, -0.21875, 1.63671875, 3.4921875, 5.34765625, 7.203125, 9.05859375, 10.9140625, 12.76953125, 14.625, 16.48046875, 18.3359375, 20.19140625, 22.046875, 23.90234375, 25.7578125, 27.61328125, 29.46875, 31.32421875, 33.1796875, 35.03515625, 36.890625, 38.74609375, 40.6015625, 42.45703125, 44.3125, 46.16796875, 48.0234375, 49.87890625, 51.734375, 53.58984375, 55.4453125, 57.30078125, 59.15625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 11.0, 319.0, 629.0, 55.0], "bins": [-329.222412109375, -323.92584228515625, -318.6292724609375, -313.3326721191406, -308.0361022949219, -302.7395324707031, -297.44293212890625, -292.1463623046875, -286.84979248046875, -281.55322265625, -276.25665283203125, -270.9600524902344, -265.6634826660156, -260.3669128417969, -255.07032775878906, -249.77374267578125, -244.4771728515625, -239.18060302734375, -233.88401794433594, -228.58743286132812, -223.29086303710938, -217.99429321289062, -212.6977081298828, -207.401123046875, -202.10455322265625, -196.8079833984375, -191.5113983154297, -186.21481323242188, -180.91824340820312, -175.62167358398438, -170.32508850097656, -165.02850341796875, -159.73193359375, -154.43536376953125, -149.13877868652344, -143.84219360351562, -138.54562377929688, -133.24905395507812, -127.95246887207031, -122.65589141845703, -117.35930633544922, -112.06272888183594, -106.76615142822266, -101.46957397460938, -96.1729965209961, -90.87641906738281, -85.57984161376953, -80.28326416015625, -74.98668670654297, -69.69010925292969, -64.3935317993164, -59.096954345703125, -53.800376892089844, -48.50379943847656, -43.20722198486328, -37.91064453125, -32.61406707763672, -27.317489624023438, -22.020912170410156, -16.724334716796875, -11.427757263183594, -6.1311798095703125, -0.8346023559570312, 4.46197509765625, 9.758552551269531]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 4.0, 9.0, 13.0, 12.0, 18.0, 18.0, 23.0, 21.0, 32.0, 34.0, 33.0, 40.0, 29.0, 39.0, 43.0, 38.0, 47.0, 50.0, 37.0, 52.0, 40.0, 36.0, 40.0, 34.0, 39.0, 35.0, 35.0, 23.0, 18.0, 11.0, 14.0, 14.0, 12.0, 10.0, 11.0, 6.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-76.95718383789062, -74.86672973632812, -72.77627563476562, -70.68582916259766, -68.59537506103516, -66.50492095947266, -64.41447448730469, -62.32402038574219, -60.23356628417969, -58.14311218261719, -56.05266189575195, -53.96221160888672, -51.87175750732422, -49.78130340576172, -47.690853118896484, -45.60040283203125, -43.50994873046875, -41.41949462890625, -39.329044342041016, -37.23859405517578, -35.14813995361328, -33.05768585205078, -30.967235565185547, -28.87678337097168, -26.786331176757812, -24.695878982543945, -22.605426788330078, -20.51497459411621, -18.424522399902344, -16.334070205688477, -14.24361801147461, -12.153165817260742, -10.062721252441406, -7.972269058227539, -5.881816864013672, -3.7913646697998047, -1.7009124755859375, 0.3895397186279297, 2.479991912841797, 4.570444107055664, 6.660896301269531, 8.751348495483398, 10.841800689697266, 12.932252883911133, 15.022705078125, 17.113157272338867, 19.203609466552734, 21.2940616607666, 23.38451385498047, 25.474966049194336, 27.565418243408203, 29.65587043762207, 31.746322631835938, 33.83677673339844, 35.92722702026367, 38.017677307128906, 40.108131408691406, 42.198585510253906, 44.28903579711914, 46.379486083984375, 48.469940185546875, 50.560394287109375, 52.65084457397461, 54.741294860839844, 56.831748962402344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 9.0, 7.0, 20.0, 14.0, 18.0, 17.0, 15.0, 24.0, 31.0, 27.0, 33.0, 28.0, 43.0, 34.0, 38.0, 36.0, 52.0, 42.0, 41.0, 41.0, 43.0, 36.0, 49.0, 35.0, 30.0, 30.0, 23.0, 21.0, 27.0, 21.0, 18.0, 10.0, 20.0, 17.0, 15.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.92578125, -7.66363525390625, -7.4014892578125, -7.13934326171875, -6.877197265625, -6.61505126953125, -6.3529052734375, -6.09075927734375, -5.82861328125, -5.56646728515625, -5.3043212890625, -5.04217529296875, -4.780029296875, -4.51788330078125, -4.2557373046875, -3.99359130859375, -3.7314453125, -3.46929931640625, -3.2071533203125, -2.94500732421875, -2.682861328125, -2.42071533203125, -2.1585693359375, -1.89642333984375, -1.63427734375, -1.37213134765625, -1.1099853515625, -0.84783935546875, -0.585693359375, -0.32354736328125, -0.0614013671875, 0.20074462890625, 0.462890625, 0.72503662109375, 0.9871826171875, 1.24932861328125, 1.511474609375, 1.77362060546875, 2.0357666015625, 2.29791259765625, 2.56005859375, 2.82220458984375, 3.0843505859375, 3.34649658203125, 3.608642578125, 3.87078857421875, 4.1329345703125, 4.39508056640625, 4.6572265625, 4.91937255859375, 5.1815185546875, 5.44366455078125, 5.705810546875, 5.96795654296875, 6.2301025390625, 6.49224853515625, 6.75439453125, 7.01654052734375, 7.2786865234375, 7.54083251953125, 7.802978515625, 8.06512451171875, 8.3272705078125, 8.58941650390625, 8.8515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 12.0, 8.0, 10.0, 18.0, 15.0, 20.0, 37.0, 24.0, 33.0, 51.0, 62.0, 124.0, 185.0, 393.0, 1141.0, 6392.0, 135238.0, 2961873.0, 1058491.0, 26033.0, 2677.0, 667.0, 253.0, 145.0, 94.0, 53.0, 52.0, 32.0, 27.0, 26.0, 21.0, 12.0, 15.0, 10.0, 13.0, 5.0, 3.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.731689453125, -23.90087890625, -23.070068359375, -22.2392578125, -21.408447265625, -20.57763671875, -19.746826171875, -18.916015625, -18.085205078125, -17.25439453125, -16.423583984375, -15.5927734375, -14.761962890625, -13.93115234375, -13.100341796875, -12.26953125, -11.438720703125, -10.60791015625, -9.777099609375, -8.9462890625, -8.115478515625, -7.28466796875, -6.453857421875, -5.623046875, -4.792236328125, -3.96142578125, -3.130615234375, -2.2998046875, -1.468994140625, -0.63818359375, 0.192626953125, 1.0234375, 1.854248046875, 2.68505859375, 3.515869140625, 4.3466796875, 5.177490234375, 6.00830078125, 6.839111328125, 7.669921875, 8.500732421875, 9.33154296875, 10.162353515625, 10.9931640625, 11.823974609375, 12.65478515625, 13.485595703125, 14.31640625, 15.147216796875, 15.97802734375, 16.808837890625, 17.6396484375, 18.470458984375, 19.30126953125, 20.132080078125, 20.962890625, 21.793701171875, 22.62451171875, 23.455322265625, 24.2861328125, 25.116943359375, 25.94775390625, 26.778564453125, 27.609375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 6.0, 6.0, 15.0, 17.0, 18.0, 34.0, 56.0, 54.0, 103.0, 143.0, 189.0, 247.0, 363.0, 484.0, 543.0, 493.0, 397.0, 286.0, 205.0, 125.0, 86.0, 61.0, 37.0, 31.0, 30.0, 9.0, 16.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.96875, -18.4505615234375, -17.932373046875, -17.4141845703125, -16.89599609375, -16.3778076171875, -15.859619140625, -15.3414306640625, -14.8232421875, -14.3050537109375, -13.786865234375, -13.2686767578125, -12.75048828125, -12.2322998046875, -11.714111328125, -11.1959228515625, -10.677734375, -10.1595458984375, -9.641357421875, -9.1231689453125, -8.60498046875, -8.0867919921875, -7.568603515625, -7.0504150390625, -6.5322265625, -6.0140380859375, -5.495849609375, -4.9776611328125, -4.45947265625, -3.9412841796875, -3.423095703125, -2.9049072265625, -2.38671875, -1.8685302734375, -1.350341796875, -0.8321533203125, -0.31396484375, 0.2042236328125, 0.722412109375, 1.2406005859375, 1.7587890625, 2.2769775390625, 2.795166015625, 3.3133544921875, 3.83154296875, 4.3497314453125, 4.867919921875, 5.3861083984375, 5.904296875, 6.4224853515625, 6.940673828125, 7.4588623046875, 7.97705078125, 8.4952392578125, 9.013427734375, 9.5316162109375, 10.0498046875, 10.5679931640625, 11.086181640625, 11.6043701171875, 12.12255859375, 12.6407470703125, 13.158935546875, 13.6771240234375, 14.1953125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 7.0, 8.0, 10.0, 13.0, 15.0, 21.0, 32.0, 41.0, 43.0, 58.0, 96.0, 101.0, 127.0, 171.0, 252.0, 446.0, 1125.0, 9040.0, 2200031.0, 1971478.0, 8545.0, 1152.0, 476.0, 241.0, 187.0, 147.0, 77.0, 76.0, 60.0, 44.0, 35.0, 29.0, 22.0, 15.0, 13.0, 13.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-58.28125, -56.45947265625, -54.6376953125, -52.81591796875, -50.994140625, -49.17236328125, -47.3505859375, -45.52880859375, -43.70703125, -41.88525390625, -40.0634765625, -38.24169921875, -36.419921875, -34.59814453125, -32.7763671875, -30.95458984375, -29.1328125, -27.31103515625, -25.4892578125, -23.66748046875, -21.845703125, -20.02392578125, -18.2021484375, -16.38037109375, -14.55859375, -12.73681640625, -10.9150390625, -9.09326171875, -7.271484375, -5.44970703125, -3.6279296875, -1.80615234375, 0.015625, 1.83740234375, 3.6591796875, 5.48095703125, 7.302734375, 9.12451171875, 10.9462890625, 12.76806640625, 14.58984375, 16.41162109375, 18.2333984375, 20.05517578125, 21.876953125, 23.69873046875, 25.5205078125, 27.34228515625, 29.1640625, 30.98583984375, 32.8076171875, 34.62939453125, 36.451171875, 38.27294921875, 40.0947265625, 41.91650390625, 43.73828125, 45.56005859375, 47.3818359375, 49.20361328125, 51.025390625, 52.84716796875, 54.6689453125, 56.49072265625, 58.3125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 36.0, 210.0, 422.0, 262.0, 69.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.28794860839844, -241.8827362060547, -236.47752380371094, -231.0723114013672, -225.66709899902344, -220.26190185546875, -214.856689453125, -209.45147705078125, -204.0462646484375, -198.64105224609375, -193.23583984375, -187.83062744140625, -182.4254150390625, -177.02020263671875, -171.614990234375, -166.2097930908203, -160.8045654296875, -155.39935302734375, -149.994140625, -144.58892822265625, -139.1837158203125, -133.77850341796875, -128.373291015625, -122.96809387207031, -117.56288146972656, -112.15766906738281, -106.75245666503906, -101.34724426269531, -95.9420394897461, -90.53682708740234, -85.1316146850586, -79.72640991210938, -74.32119750976562, -68.91598510742188, -63.51077651977539, -58.10556411743164, -52.700355529785156, -47.295143127441406, -41.889930725097656, -36.48472213745117, -31.079509735107422, -25.674299240112305, -20.269088745117188, -14.863876342773438, -9.45866584777832, -4.053455352783203, 1.3517570495605469, 6.756965637207031, 12.162178039550781, 17.5673885345459, 22.972599029541016, 28.377811431884766, 33.78302001953125, 39.188232421875, 44.59344482421875, 49.998653411865234, 55.403865814208984, 60.809078216552734, 66.21428680419922, 71.61949920654297, 77.02471160888672, 82.42991638183594, 87.83512878417969, 93.24034118652344, 98.64555358886719]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 1.0, 3.0, 6.0, 11.0, 10.0, 8.0, 16.0, 12.0, 24.0, 23.0, 23.0, 28.0, 28.0, 23.0, 26.0, 33.0, 33.0, 34.0, 40.0, 46.0, 43.0, 44.0, 33.0, 42.0, 46.0, 38.0, 40.0, 45.0, 35.0, 29.0, 20.0, 22.0, 17.0, 15.0, 20.0, 20.0, 11.0, 11.0, 11.0, 9.0, 5.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.21568298339844, -50.677772521972656, -49.13985824584961, -47.60194778442383, -46.06403732299805, -44.526123046875, -42.98821258544922, -41.45030212402344, -39.912391662597656, -38.374481201171875, -36.83656692504883, -35.29865646362305, -33.760746002197266, -32.22283172607422, -30.684921264648438, -29.147010803222656, -27.60909652709961, -26.071184158325195, -24.533273696899414, -22.995361328125, -21.45745086669922, -19.919538497924805, -18.38162612915039, -16.84371566772461, -15.305803298950195, -13.767891883850098, -12.22998046875, -10.692068099975586, -9.154156684875488, -7.616245269775391, -6.078332901000977, -4.540421485900879, -3.0025100708007812, -1.4645984172821045, 0.07331323623657227, 1.6112251281738281, 3.149136543273926, 4.687047958374023, 6.2249603271484375, 7.762871742248535, 9.300783157348633, 10.83869457244873, 12.376605987548828, 13.914518356323242, 15.45242977142334, 16.990341186523438, 18.52825355529785, 20.066165924072266, 21.604076385498047, 23.14198875427246, 24.679899215698242, 26.217811584472656, 27.755722045898438, 29.29363441467285, 30.831546783447266, 32.36945724487305, 33.907371520996094, 35.445281982421875, 36.98319625854492, 38.5211067199707, 40.059017181396484, 41.59693145751953, 43.13484191894531, 44.672752380371094, 46.210662841796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 12.0, 13.0, 9.0, 8.0, 10.0, 10.0, 23.0, 29.0, 16.0, 32.0, 23.0, 28.0, 39.0, 36.0, 43.0, 37.0, 35.0, 36.0, 53.0, 38.0, 36.0, 51.0, 33.0, 36.0, 27.0, 27.0, 25.0, 36.0, 31.0, 20.0, 15.0, 13.0, 13.0, 19.0, 11.0, 10.0, 10.0, 9.0, 12.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0], "bins": [-8.4453125, -8.19732666015625, -7.9493408203125, -7.70135498046875, -7.453369140625, -7.20538330078125, -6.9573974609375, -6.70941162109375, -6.46142578125, -6.21343994140625, -5.9654541015625, -5.71746826171875, -5.469482421875, -5.22149658203125, -4.9735107421875, -4.72552490234375, -4.4775390625, -4.22955322265625, -3.9815673828125, -3.73358154296875, -3.485595703125, -3.23760986328125, -2.9896240234375, -2.74163818359375, -2.49365234375, -2.24566650390625, -1.9976806640625, -1.74969482421875, -1.501708984375, -1.25372314453125, -1.0057373046875, -0.75775146484375, -0.509765625, -0.26177978515625, -0.0137939453125, 0.23419189453125, 0.482177734375, 0.73016357421875, 0.9781494140625, 1.22613525390625, 1.47412109375, 1.72210693359375, 1.9700927734375, 2.21807861328125, 2.466064453125, 2.71405029296875, 2.9620361328125, 3.21002197265625, 3.4580078125, 3.70599365234375, 3.9539794921875, 4.20196533203125, 4.449951171875, 4.69793701171875, 4.9459228515625, 5.19390869140625, 5.44189453125, 5.68988037109375, 5.9378662109375, 6.18585205078125, 6.433837890625, 6.68182373046875, 6.9298095703125, 7.17779541015625, 7.42578125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 12.0, 15.0, 11.0, 28.0, 43.0, 70.0, 113.0, 161.0, 285.0, 457.0, 794.0, 1324.0, 2192.0, 3677.0, 6009.0, 10528.0, 17705.0, 31529.0, 57760.0, 113189.0, 237055.0, 279462.0, 133407.0, 67486.0, 36115.0, 20174.0, 11672.0, 6889.0, 3990.0, 2505.0, 1529.0, 945.0, 550.0, 342.0, 199.0, 115.0, 69.0, 49.0, 28.0, 23.0, 15.0, 7.0, 7.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.328399658203125, -1.28277587890625, -1.237152099609375, -1.1915283203125, -1.145904541015625, -1.10028076171875, -1.054656982421875, -1.009033203125, -0.963409423828125, -0.91778564453125, -0.872161865234375, -0.8265380859375, -0.780914306640625, -0.73529052734375, -0.689666748046875, -0.64404296875, -0.598419189453125, -0.55279541015625, -0.507171630859375, -0.4615478515625, -0.415924072265625, -0.37030029296875, -0.324676513671875, -0.279052734375, -0.233428955078125, -0.18780517578125, -0.142181396484375, -0.0965576171875, -0.050933837890625, -0.00531005859375, 0.040313720703125, 0.0859375, 0.131561279296875, 0.17718505859375, 0.222808837890625, 0.2684326171875, 0.314056396484375, 0.35968017578125, 0.405303955078125, 0.450927734375, 0.496551513671875, 0.54217529296875, 0.587799072265625, 0.6334228515625, 0.679046630859375, 0.72467041015625, 0.770294189453125, 0.81591796875, 0.861541748046875, 0.90716552734375, 0.952789306640625, 0.9984130859375, 1.044036865234375, 1.08966064453125, 1.135284423828125, 1.180908203125, 1.226531982421875, 1.27215576171875, 1.317779541015625, 1.3634033203125, 1.409027099609375, 1.45465087890625, 1.500274658203125, 1.5458984375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 11.0, 8.0, 10.0, 12.0, 15.0, 23.0, 30.0, 13.0, 21.0, 28.0, 29.0, 34.0, 32.0, 43.0, 40.0, 29.0, 31.0, 27.0, 1070.0, 27.0, 43.0, 33.0, 39.0, 41.0, 31.0, 32.0, 30.0, 36.0, 20.0, 18.0, 19.0, 20.0, 19.0, 12.0, 13.0, 7.0, 12.0, 12.0, 7.0, 7.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.58984375, -4.4393310546875, -4.288818359375, -4.1383056640625, -3.98779296875, -3.8372802734375, -3.686767578125, -3.5362548828125, -3.3857421875, -3.2352294921875, -3.084716796875, -2.9342041015625, -2.78369140625, -2.6331787109375, -2.482666015625, -2.3321533203125, -2.181640625, -2.0311279296875, -1.880615234375, -1.7301025390625, -1.57958984375, -1.4290771484375, -1.278564453125, -1.1280517578125, -0.9775390625, -0.8270263671875, -0.676513671875, -0.5260009765625, -0.37548828125, -0.2249755859375, -0.074462890625, 0.0760498046875, 0.2265625, 0.3770751953125, 0.527587890625, 0.6781005859375, 0.82861328125, 0.9791259765625, 1.129638671875, 1.2801513671875, 1.4306640625, 1.5811767578125, 1.731689453125, 1.8822021484375, 2.03271484375, 2.1832275390625, 2.333740234375, 2.4842529296875, 2.634765625, 2.7852783203125, 2.935791015625, 3.0863037109375, 3.23681640625, 3.3873291015625, 3.537841796875, 3.6883544921875, 3.8388671875, 3.9893798828125, 4.139892578125, 4.2904052734375, 4.44091796875, 4.5914306640625, 4.741943359375, 4.8924560546875, 5.04296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 21.0, 24.0, 32.0, 59.0, 62.0, 97.0, 126.0, 224.0, 270.0, 418.0, 568.0, 839.0, 1149.0, 1653.0, 2410.0, 3250.0, 4716.0, 6773.0, 9606.0, 13924.0, 20519.0, 31256.0, 47828.0, 75548.0, 120967.0, 1242653.0, 188273.0, 113865.0, 71248.0, 45350.0, 29852.0, 19245.0, 13269.0, 9201.0, 6514.0, 4466.0, 3248.0, 2188.0, 1591.0, 1127.0, 769.0, 567.0, 395.0, 290.0, 208.0, 155.0, 100.0, 64.0, 51.0, 31.0, 21.0, 10.0, 10.0, 9.0, 6.0, 2.0, 3.0], "bins": [-0.9697265625, -0.9402847290039062, -0.9108428955078125, -0.8814010620117188, -0.851959228515625, -0.8225173950195312, -0.7930755615234375, -0.7636337280273438, -0.73419189453125, -0.7047500610351562, -0.6753082275390625, -0.6458663940429688, -0.616424560546875, -0.5869827270507812, -0.5575408935546875, -0.5280990600585938, -0.4986572265625, -0.46921539306640625, -0.4397735595703125, -0.41033172607421875, -0.380889892578125, -0.35144805908203125, -0.3220062255859375, -0.29256439208984375, -0.26312255859375, -0.23368072509765625, -0.2042388916015625, -0.17479705810546875, -0.145355224609375, -0.11591339111328125, -0.0864715576171875, -0.05702972412109375, -0.027587890625, 0.00185394287109375, 0.0312957763671875, 0.06073760986328125, 0.090179443359375, 0.11962127685546875, 0.1490631103515625, 0.17850494384765625, 0.20794677734375, 0.23738861083984375, 0.2668304443359375, 0.29627227783203125, 0.325714111328125, 0.35515594482421875, 0.3845977783203125, 0.41403961181640625, 0.4434814453125, 0.47292327880859375, 0.5023651123046875, 0.5318069458007812, 0.561248779296875, 0.5906906127929688, 0.6201324462890625, 0.6495742797851562, 0.67901611328125, 0.7084579467773438, 0.7378997802734375, 0.7673416137695312, 0.796783447265625, 0.8262252807617188, 0.8556671142578125, 0.8851089477539062, 0.91455078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 10.0, 13.0, 13.0, 18.0, 35.0, 47.0, 56.0, 106.0, 125.0, 144.0, 136.0, 96.0, 54.0, 49.0, 39.0, 19.0, 9.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017824172973632812, -0.0017197579145431519, -0.0016570985317230225, -0.001594439148902893, -0.0015317797660827637, -0.0014691203832626343, -0.0014064610004425049, -0.0013438016176223755, -0.001281142234802246, -0.0012184828519821167, -0.0011558234691619873, -0.001093164086341858, -0.0010305047035217285, -0.0009678453207015991, -0.0009051859378814697, -0.0008425265550613403, -0.0007798671722412109, -0.0007172077894210815, -0.0006545484066009521, -0.0005918890237808228, -0.0005292296409606934, -0.00046657025814056396, -0.00040391087532043457, -0.0003412514925003052, -0.0002785921096801758, -0.0002159327268600464, -0.000153273344039917, -9.06139612197876e-05, -2.7954578399658203e-05, 3.470480442047119e-05, 9.736418724060059e-05, 0.00016002357006072998, 0.00022268295288085938, 0.00028534233570098877, 0.00034800171852111816, 0.00041066110134124756, 0.00047332048416137695, 0.0005359798669815063, 0.0005986392498016357, 0.0006612986326217651, 0.0007239580154418945, 0.0007866173982620239, 0.0008492767810821533, 0.0009119361639022827, 0.0009745955467224121, 0.0010372549295425415, 0.001099914312362671, 0.0011625736951828003, 0.0012252330780029297, 0.001287892460823059, 0.0013505518436431885, 0.0014132112264633179, 0.0014758706092834473, 0.0015385299921035767, 0.001601189374923706, 0.0016638487577438354, 0.0017265081405639648, 0.0017891675233840942, 0.0018518269062042236, 0.001914486289024353, 0.0019771456718444824, 0.002039805054664612, 0.002102464437484741, 0.0021651238203048706, 0.002227783203125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 14.0, 21.0, 47.0, 81.0, 100.0, 175.0, 458.0, 2439.0, 1042431.0, 1828.0, 435.0, 180.0, 108.0, 76.0, 43.0, 25.0, 15.0, 17.0, 9.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047210693359375, -0.045879364013671875, -0.04454803466796875, -0.043216705322265625, -0.0418853759765625, -0.040554046630859375, -0.03922271728515625, -0.037891387939453125, -0.03656005859375, -0.035228729248046875, -0.03389739990234375, -0.032566070556640625, -0.0312347412109375, -0.029903411865234375, -0.02857208251953125, -0.027240753173828125, -0.025909423828125, -0.024578094482421875, -0.02324676513671875, -0.021915435791015625, -0.0205841064453125, -0.019252777099609375, -0.01792144775390625, -0.016590118408203125, -0.0152587890625, -0.013927459716796875, -0.01259613037109375, -0.011264801025390625, -0.0099334716796875, -0.008602142333984375, -0.00727081298828125, -0.005939483642578125, -0.004608154296875, -0.003276824951171875, -0.00194549560546875, -0.000614166259765625, 0.0007171630859375, 0.002048492431640625, 0.00337982177734375, 0.004711151123046875, 0.00604248046875, 0.007373809814453125, 0.00870513916015625, 0.010036468505859375, 0.0113677978515625, 0.012699127197265625, 0.01403045654296875, 0.015361785888671875, 0.016693115234375, 0.018024444580078125, 0.01935577392578125, 0.020687103271484375, 0.0220184326171875, 0.023349761962890625, 0.02468109130859375, 0.026012420654296875, 0.02734375, 0.028675079345703125, 0.03000640869140625, 0.031337738037109375, 0.0326690673828125, 0.034000396728515625, 0.03533172607421875, 0.036663055419921875, 0.037994384765625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 15.0, 81.0, 291.0, 426.0, 173.0, 20.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007463187794201076, -0.0006656402838416398, -0.000584961730055511, -0.0005042832344770432, -0.0004236047388985753, -0.00034292624332010746, -0.00026224771863780916, -0.00018156919395551085, -0.00010089069837704301, -2.0212188246659935e-05, 6.046632188372314e-05, 0.00014114483201410621, 0.0002218233421444893, 0.00030250183772295713, 0.00038318036240525544, 0.00046385888708755374, 0.0005445373826660216, 0.0006252158782444894, 0.0007058944320306182, 0.000786572927609086, 0.0008672514231875539, 0.0009479299187660217, 0.0010286084143444896, 0.0011092869099229574, 0.001189965521916747, 0.001270644017495215, 0.0013513225130736828, 0.0014320010086521506, 0.0015126795042306185, 0.0015933581162244081, 0.001674036611802876, 0.0017547151073813438, 0.0018353937193751335, 0.0019160722149536014, 0.001996750710532069, 0.002077429322525859, 0.002158107701689005, 0.0022387863136827946, 0.0023194646928459406, 0.0024001433048397303, 0.0024808216840028763, 0.002561500295996666, 0.002642178675159812, 0.0027228572871536016, 0.0028035356663167477, 0.0028842142783105373, 0.0029648926574736834, 0.003045571269467473, 0.0031262498814612627, 0.0032069284934550524, 0.0032876068726181984, 0.003368285484611988, 0.003448963863775134, 0.0035296424757689238, 0.0036103208549320698, 0.0036909994669258595, 0.003771678078919649, 0.003852356690913439, 0.0039330353029072285, 0.004013713449239731, 0.0040943920612335205, 0.00417507067322731, 0.0042557492852211, 0.0043364278972148895, 0.004417106043547392]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 18.0, 16.0, 10.0, 13.0, 21.0, 21.0, 20.0, 27.0, 37.0, 32.0, 34.0, 33.0, 44.0, 48.0, 38.0, 40.0, 34.0, 39.0, 40.0, 52.0, 46.0, 49.0, 36.0, 20.0, 30.0, 23.0, 28.0, 22.0, 11.0, 15.0, 18.0, 13.0, 12.0, 11.0, 7.0, 6.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0006743669509887695, -0.0006543491035699844, -0.0006343312561511993, -0.0006143134087324142, -0.0005942955613136292, -0.0005742777138948441, -0.000554259866476059, -0.0005342420190572739, -0.0005142241716384888, -0.0004942063242197037, -0.0004741884768009186, -0.0004541706293821335, -0.0004341527819633484, -0.0004141349345445633, -0.0003941170871257782, -0.0003740992397069931, -0.000354081392288208, -0.0003340635448694229, -0.0003140456974506378, -0.0002940278500318527, -0.0002740100026130676, -0.00025399215519428253, -0.00023397430777549744, -0.00021395646035671234, -0.00019393861293792725, -0.00017392076551914215, -0.00015390291810035706, -0.00013388507068157196, -0.00011386722326278687, -9.384937584400177e-05, -7.383152842521667e-05, -5.381368100643158e-05, -3.3795833587646484e-05, -1.377798616886139e-05, 6.239861249923706e-06, 2.62577086687088e-05, 4.6275556087493896e-05, 6.629340350627899e-05, 8.631125092506409e-05, 0.00010632909834384918, 0.00012634694576263428, 0.00014636479318141937, 0.00016638264060020447, 0.00018640048801898956, 0.00020641833543777466, 0.00022643618285655975, 0.00024645403027534485, 0.00026647187769412994, 0.00028648972511291504, 0.00030650757253170013, 0.00032652541995048523, 0.0003465432673692703, 0.0003665611147880554, 0.0003865789622068405, 0.0004065968096256256, 0.0004266146570444107, 0.0004466325044631958, 0.0004666503518819809, 0.000486668199300766, 0.0005066860467195511, 0.0005267038941383362, 0.0005467217415571213, 0.0005667395889759064, 0.0005867574363946915, 0.0006067752838134766]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 12.0, 13.0, 9.0, 8.0, 10.0, 10.0, 23.0, 29.0, 16.0, 32.0, 23.0, 28.0, 39.0, 36.0, 43.0, 37.0, 35.0, 36.0, 53.0, 38.0, 36.0, 51.0, 33.0, 36.0, 27.0, 27.0, 25.0, 36.0, 31.0, 20.0, 15.0, 13.0, 13.0, 19.0, 11.0, 10.0, 10.0, 9.0, 12.0, 4.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0], "bins": [-8.4453125, -8.19732666015625, -7.9493408203125, -7.70135498046875, -7.453369140625, -7.20538330078125, -6.9573974609375, -6.70941162109375, -6.46142578125, -6.21343994140625, -5.9654541015625, -5.71746826171875, -5.469482421875, -5.22149658203125, -4.9735107421875, -4.72552490234375, -4.4775390625, -4.22955322265625, -3.9815673828125, -3.73358154296875, -3.485595703125, -3.23760986328125, -2.9896240234375, -2.74163818359375, -2.49365234375, -2.24566650390625, -1.9976806640625, -1.74969482421875, -1.501708984375, -1.25372314453125, -1.0057373046875, -0.75775146484375, -0.509765625, -0.26177978515625, -0.0137939453125, 0.23419189453125, 0.482177734375, 0.73016357421875, 0.9781494140625, 1.22613525390625, 1.47412109375, 1.72210693359375, 1.9700927734375, 2.21807861328125, 2.466064453125, 2.71405029296875, 2.9620361328125, 3.21002197265625, 3.4580078125, 3.70599365234375, 3.9539794921875, 4.20196533203125, 4.449951171875, 4.69793701171875, 4.9459228515625, 5.19390869140625, 5.44189453125, 5.68988037109375, 5.9378662109375, 6.18585205078125, 6.433837890625, 6.68182373046875, 6.9298095703125, 7.17779541015625, 7.42578125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 10.0, 13.0, 22.0, 27.0, 29.0, 24.0, 32.0, 50.0, 65.0, 100.0, 115.0, 173.0, 221.0, 254.0, 363.0, 496.0, 705.0, 1463.0, 5140.0, 29306.0, 418790.0, 547810.0, 33147.0, 5872.0, 1527.0, 731.0, 504.0, 363.0, 255.0, 246.0, 184.0, 123.0, 91.0, 57.0, 45.0, 39.0, 30.0, 28.0, 19.0, 17.0, 16.0, 11.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0], "bins": [-21.3125, -20.686279296875, -20.06005859375, -19.433837890625, -18.8076171875, -18.181396484375, -17.55517578125, -16.928955078125, -16.302734375, -15.676513671875, -15.05029296875, -14.424072265625, -13.7978515625, -13.171630859375, -12.54541015625, -11.919189453125, -11.29296875, -10.666748046875, -10.04052734375, -9.414306640625, -8.7880859375, -8.161865234375, -7.53564453125, -6.909423828125, -6.283203125, -5.656982421875, -5.03076171875, -4.404541015625, -3.7783203125, -3.152099609375, -2.52587890625, -1.899658203125, -1.2734375, -0.647216796875, -0.02099609375, 0.605224609375, 1.2314453125, 1.857666015625, 2.48388671875, 3.110107421875, 3.736328125, 4.362548828125, 4.98876953125, 5.614990234375, 6.2412109375, 6.867431640625, 7.49365234375, 8.119873046875, 8.74609375, 9.372314453125, 9.99853515625, 10.624755859375, 11.2509765625, 11.877197265625, 12.50341796875, 13.129638671875, 13.755859375, 14.382080078125, 15.00830078125, 15.634521484375, 16.2607421875, 16.886962890625, 17.51318359375, 18.139404296875, 18.765625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 4.0, 4.0, 2.0, 11.0, 9.0, 18.0, 19.0, 8.0, 18.0, 28.0, 31.0, 23.0, 37.0, 29.0, 42.0, 47.0, 42.0, 60.0, 66.0, 229.0, 1687.0, 138.0, 67.0, 45.0, 50.0, 41.0, 49.0, 34.0, 30.0, 25.0, 37.0, 33.0, 13.0, 22.0, 16.0, 6.0, 6.0, 7.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.171875, -24.34326171875, -23.5146484375, -22.68603515625, -21.857421875, -21.02880859375, -20.2001953125, -19.37158203125, -18.54296875, -17.71435546875, -16.8857421875, -16.05712890625, -15.228515625, -14.39990234375, -13.5712890625, -12.74267578125, -11.9140625, -11.08544921875, -10.2568359375, -9.42822265625, -8.599609375, -7.77099609375, -6.9423828125, -6.11376953125, -5.28515625, -4.45654296875, -3.6279296875, -2.79931640625, -1.970703125, -1.14208984375, -0.3134765625, 0.51513671875, 1.34375, 2.17236328125, 3.0009765625, 3.82958984375, 4.658203125, 5.48681640625, 6.3154296875, 7.14404296875, 7.97265625, 8.80126953125, 9.6298828125, 10.45849609375, 11.287109375, 12.11572265625, 12.9443359375, 13.77294921875, 14.6015625, 15.43017578125, 16.2587890625, 17.08740234375, 17.916015625, 18.74462890625, 19.5732421875, 20.40185546875, 21.23046875, 22.05908203125, 22.8876953125, 23.71630859375, 24.544921875, 25.37353515625, 26.2021484375, 27.03076171875, 27.859375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 6.0, 10.0, 12.0, 19.0, 19.0, 19.0, 32.0, 46.0, 43.0, 38.0, 74.0, 93.0, 145.0, 199.0, 409.0, 1329.0, 53121.0, 3082833.0, 5545.0, 761.0, 287.0, 170.0, 100.0, 72.0, 46.0, 50.0, 34.0, 30.0, 29.0, 17.0, 18.0, 19.0, 14.0, 13.0, 10.0, 4.0, 4.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-78.625, -76.3310546875, -74.037109375, -71.7431640625, -69.44921875, -67.1552734375, -64.861328125, -62.5673828125, -60.2734375, -57.9794921875, -55.685546875, -53.3916015625, -51.09765625, -48.8037109375, -46.509765625, -44.2158203125, -41.921875, -39.6279296875, -37.333984375, -35.0400390625, -32.74609375, -30.4521484375, -28.158203125, -25.8642578125, -23.5703125, -21.2763671875, -18.982421875, -16.6884765625, -14.39453125, -12.1005859375, -9.806640625, -7.5126953125, -5.21875, -2.9248046875, -0.630859375, 1.6630859375, 3.95703125, 6.2509765625, 8.544921875, 10.8388671875, 13.1328125, 15.4267578125, 17.720703125, 20.0146484375, 22.30859375, 24.6025390625, 26.896484375, 29.1904296875, 31.484375, 33.7783203125, 36.072265625, 38.3662109375, 40.66015625, 42.9541015625, 45.248046875, 47.5419921875, 49.8359375, 52.1298828125, 54.423828125, 56.7177734375, 59.01171875, 61.3056640625, 63.599609375, 65.8935546875, 68.1875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 154.0, 841.0, 20.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.86680603027344, -111.4527359008789, -105.03866577148438, -98.62460327148438, -92.21052551269531, -85.79646301269531, -79.38239288330078, -72.96832275390625, -66.55425262451172, -60.14018249511719, -53.726112365722656, -47.31204605102539, -40.89797592163086, -34.48390579223633, -28.069839477539062, -21.65576934814453, -15.24169921875, -8.827630043029785, -2.4135608673095703, 4.000507354736328, 10.41457748413086, 16.82864761352539, 23.242713928222656, 29.656784057617188, 36.07085418701172, 42.48492431640625, 48.89899444580078, 55.31306076049805, 61.72713088989258, 68.14120483398438, 74.55526733398438, 80.9693374633789, 87.38339233398438, 93.7974624633789, 100.21153259277344, 106.62559509277344, 113.0396728515625, 119.4537353515625, 125.86780548095703, 132.28187561035156, 138.69595336914062, 145.11001586914062, 151.5240936279297, 157.9381561279297, 164.35223388671875, 170.76629638671875, 177.18035888671875, 183.5944366455078, 190.0084991455078, 196.4225616455078, 202.83663940429688, 209.25070190429688, 215.66477966308594, 222.07884216308594, 228.492919921875, 234.906982421875, 241.321044921875, 247.735107421875, 254.14918518066406, 260.5632629394531, 266.9773254394531, 273.3913879394531, 279.8054504394531, 286.21954345703125, 292.63360595703125]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 4.0, 8.0, 15.0, 14.0, 17.0, 16.0, 16.0, 20.0, 22.0, 32.0, 30.0, 28.0, 48.0, 43.0, 39.0, 36.0, 45.0, 31.0, 46.0, 53.0, 37.0, 40.0, 33.0, 31.0, 33.0, 27.0, 32.0, 24.0, 21.0, 26.0, 23.0, 16.0, 15.0, 13.0, 10.0, 8.0, 7.0, 5.0, 7.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.56169128417969, -63.66786575317383, -61.77404022216797, -59.880210876464844, -57.986385345458984, -56.092559814453125, -54.198734283447266, -52.304908752441406, -50.41107940673828, -48.51725387573242, -46.62342834472656, -44.72959899902344, -42.83577346801758, -40.94194793701172, -39.04812240600586, -37.154296875, -35.260467529296875, -33.366641998291016, -31.472814559936523, -29.578989028930664, -27.685161590576172, -25.791336059570312, -23.897510528564453, -22.00368309020996, -20.109859466552734, -18.216033935546875, -16.322206497192383, -14.428380966186523, -12.534553527832031, -10.640727996826172, -8.746901512145996, -6.85307502746582, -4.959247589111328, -3.0654211044311523, -1.1715948581695557, 0.722231388092041, 2.616057872772217, 4.509883880615234, 6.40371036529541, 8.297536849975586, 10.191363334655762, 12.085189819335938, 13.979016304016113, 15.872842788696289, 17.76666831970215, 19.66049575805664, 21.5543212890625, 23.44814682006836, 25.34197425842285, 27.23579978942871, 29.129627227783203, 31.023452758789062, 32.91727828979492, 34.81110382080078, 36.704933166503906, 38.598758697509766, 40.492584228515625, 42.386409759521484, 44.280235290527344, 46.17406463623047, 48.06789016723633, 49.96171569824219, 51.85554122924805, 53.749366760253906, 55.64319610595703]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 8.0, 7.0, 3.0, 10.0, 5.0, 10.0, 19.0, 9.0, 19.0, 30.0, 25.0, 21.0, 24.0, 25.0, 32.0, 35.0, 33.0, 33.0, 32.0, 42.0, 36.0, 40.0, 45.0, 47.0, 48.0, 38.0, 36.0, 35.0, 39.0, 25.0, 20.0, 24.0, 20.0, 14.0, 9.0, 19.0, 20.0, 9.0, 11.0, 16.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0], "bins": [-8.9296875, -8.67315673828125, -8.4166259765625, -8.16009521484375, -7.903564453125, -7.64703369140625, -7.3905029296875, -7.13397216796875, -6.87744140625, -6.62091064453125, -6.3643798828125, -6.10784912109375, -5.851318359375, -5.59478759765625, -5.3382568359375, -5.08172607421875, -4.8251953125, -4.56866455078125, -4.3121337890625, -4.05560302734375, -3.799072265625, -3.54254150390625, -3.2860107421875, -3.02947998046875, -2.77294921875, -2.51641845703125, -2.2598876953125, -2.00335693359375, -1.746826171875, -1.49029541015625, -1.2337646484375, -0.97723388671875, -0.720703125, -0.46417236328125, -0.2076416015625, 0.04888916015625, 0.305419921875, 0.56195068359375, 0.8184814453125, 1.07501220703125, 1.33154296875, 1.58807373046875, 1.8446044921875, 2.10113525390625, 2.357666015625, 2.61419677734375, 2.8707275390625, 3.12725830078125, 3.3837890625, 3.64031982421875, 3.8968505859375, 4.15338134765625, 4.409912109375, 4.66644287109375, 4.9229736328125, 5.17950439453125, 5.43603515625, 5.69256591796875, 5.9490966796875, 6.20562744140625, 6.462158203125, 6.71868896484375, 6.9752197265625, 7.23175048828125, 7.48828125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 11.0, 11.0, 11.0, 26.0, 19.0, 36.0, 41.0, 47.0, 60.0, 79.0, 95.0, 112.0, 156.0, 215.0, 272.0, 429.0, 873.0, 2057.0, 8013.0, 55034.0, 684392.0, 2617241.0, 752111.0, 59495.0, 8590.0, 2245.0, 907.0, 440.0, 306.0, 202.0, 137.0, 123.0, 87.0, 76.0, 58.0, 53.0, 37.0, 33.0, 29.0, 25.0, 16.0, 18.0, 13.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-18.078125, -17.522216796875, -16.96630859375, -16.410400390625, -15.8544921875, -15.298583984375, -14.74267578125, -14.186767578125, -13.630859375, -13.074951171875, -12.51904296875, -11.963134765625, -11.4072265625, -10.851318359375, -10.29541015625, -9.739501953125, -9.18359375, -8.627685546875, -8.07177734375, -7.515869140625, -6.9599609375, -6.404052734375, -5.84814453125, -5.292236328125, -4.736328125, -4.180419921875, -3.62451171875, -3.068603515625, -2.5126953125, -1.956787109375, -1.40087890625, -0.844970703125, -0.2890625, 0.266845703125, 0.82275390625, 1.378662109375, 1.9345703125, 2.490478515625, 3.04638671875, 3.602294921875, 4.158203125, 4.714111328125, 5.27001953125, 5.825927734375, 6.3818359375, 6.937744140625, 7.49365234375, 8.049560546875, 8.60546875, 9.161376953125, 9.71728515625, 10.273193359375, 10.8291015625, 11.385009765625, 11.94091796875, 12.496826171875, 13.052734375, 13.608642578125, 14.16455078125, 14.720458984375, 15.2763671875, 15.832275390625, 16.38818359375, 16.944091796875, 17.5]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 17.0, 15.0, 23.0, 42.0, 76.0, 111.0, 160.0, 224.0, 401.0, 530.0, 617.0, 534.0, 416.0, 285.0, 176.0, 148.0, 90.0, 48.0, 40.0, 28.0, 19.0, 12.0, 16.0, 11.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.36572265625, -14.8095703125, -14.25341796875, -13.697265625, -13.14111328125, -12.5849609375, -12.02880859375, -11.47265625, -10.91650390625, -10.3603515625, -9.80419921875, -9.248046875, -8.69189453125, -8.1357421875, -7.57958984375, -7.0234375, -6.46728515625, -5.9111328125, -5.35498046875, -4.798828125, -4.24267578125, -3.6865234375, -3.13037109375, -2.57421875, -2.01806640625, -1.4619140625, -0.90576171875, -0.349609375, 0.20654296875, 0.7626953125, 1.31884765625, 1.875, 2.43115234375, 2.9873046875, 3.54345703125, 4.099609375, 4.65576171875, 5.2119140625, 5.76806640625, 6.32421875, 6.88037109375, 7.4365234375, 7.99267578125, 8.548828125, 9.10498046875, 9.6611328125, 10.21728515625, 10.7734375, 11.32958984375, 11.8857421875, 12.44189453125, 12.998046875, 13.55419921875, 14.1103515625, 14.66650390625, 15.22265625, 15.77880859375, 16.3349609375, 16.89111328125, 17.447265625, 18.00341796875, 18.5595703125, 19.11572265625, 19.671875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 8.0, 6.0, 14.0, 13.0, 20.0, 29.0, 48.0, 63.0, 113.0, 128.0, 196.0, 288.0, 609.0, 2294.0, 70836.0, 4079427.0, 36998.0, 1947.0, 520.0, 258.0, 159.0, 98.0, 72.0, 49.0, 26.0, 23.0, 19.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.6875, -81.4521484375, -79.216796875, -76.9814453125, -74.74609375, -72.5107421875, -70.275390625, -68.0400390625, -65.8046875, -63.5693359375, -61.333984375, -59.0986328125, -56.86328125, -54.6279296875, -52.392578125, -50.1572265625, -47.921875, -45.6865234375, -43.451171875, -41.2158203125, -38.98046875, -36.7451171875, -34.509765625, -32.2744140625, -30.0390625, -27.8037109375, -25.568359375, -23.3330078125, -21.09765625, -18.8623046875, -16.626953125, -14.3916015625, -12.15625, -9.9208984375, -7.685546875, -5.4501953125, -3.21484375, -0.9794921875, 1.255859375, 3.4912109375, 5.7265625, 7.9619140625, 10.197265625, 12.4326171875, 14.66796875, 16.9033203125, 19.138671875, 21.3740234375, 23.609375, 25.8447265625, 28.080078125, 30.3154296875, 32.55078125, 34.7861328125, 37.021484375, 39.2568359375, 41.4921875, 43.7275390625, 45.962890625, 48.1982421875, 50.43359375, 52.6689453125, 54.904296875, 57.1396484375, 59.375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 576.0, 434.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-286.5056457519531, -269.5603942871094, -252.6151580810547, -235.66990661621094, -218.72467041015625, -201.7794189453125, -184.83416748046875, -167.888916015625, -150.9436798095703, -133.99842834472656, -117.05319213867188, -100.10794067382812, -83.1626968383789, -66.21745300292969, -49.27220153808594, -32.32695770263672, -15.3817138671875, 1.5635318756103516, 18.508777618408203, 35.45402526855469, 52.399269104003906, 69.34451293945312, 86.28976440429688, 103.2350082397461, 120.18025207519531, 137.12550354003906, 154.07073974609375, 171.0159912109375, 187.96124267578125, 204.90647888183594, 221.8517303466797, 238.79696655273438, 255.7421875, 272.68743896484375, 289.6326904296875, 306.57794189453125, 323.5231628417969, 340.4684143066406, 357.4136657714844, 374.3589172363281, 391.30413818359375, 408.2493896484375, 425.19464111328125, 442.139892578125, 459.0851135253906, 476.0303649902344, 492.9756164550781, 509.9208679199219, 526.8660888671875, 543.8113403320312, 560.756591796875, 577.7018432617188, 594.6470947265625, 611.59228515625, 628.53759765625, 645.4827880859375, 662.4281005859375, 679.3733520507812, 696.318603515625, 713.2638549804688, 730.2091064453125, 747.154296875, 764.099609375, 781.0447998046875, 797.9900512695312]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 8.0, 9.0, 11.0, 8.0, 12.0, 14.0, 19.0, 21.0, 28.0, 21.0, 34.0, 27.0, 30.0, 40.0, 25.0, 39.0, 45.0, 34.0, 39.0, 44.0, 47.0, 33.0, 34.0, 40.0, 45.0, 37.0, 30.0, 29.0, 17.0, 31.0, 26.0, 19.0, 18.0, 14.0, 17.0, 9.0, 9.0, 9.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.100006103515625, -42.65949249267578, -41.21897888183594, -39.778465270996094, -38.33795166015625, -36.897438049316406, -35.45692443847656, -34.01641082763672, -32.575897216796875, -31.13538360595703, -29.694869995117188, -28.254356384277344, -26.8138427734375, -25.373329162597656, -23.932817459106445, -22.4923038482666, -21.05179214477539, -19.611278533935547, -18.170764923095703, -16.73025131225586, -15.289738655090332, -13.849225044250488, -12.408712387084961, -10.968198776245117, -9.527685165405273, -8.08717155456543, -6.646658420562744, -5.206145286560059, -3.765631675720215, -2.325118064880371, -0.8846054077148438, 0.555908203125, 1.9964218139648438, 3.4369351863861084, 4.877448558807373, 6.317961692810059, 7.758475303649902, 9.198988914489746, 10.639501571655273, 12.080015182495117, 13.520528793334961, 14.961042404174805, 16.40155601501465, 17.84206771850586, 19.282581329345703, 20.723094940185547, 22.16360855102539, 23.604122161865234, 25.044635772705078, 26.485149383544922, 27.925662994384766, 29.36617660522461, 30.806690216064453, 32.2472038269043, 33.687713623046875, 35.12822723388672, 36.56874084472656, 38.009254455566406, 39.44976806640625, 40.890281677246094, 42.33079528808594, 43.77130889892578, 45.211822509765625, 46.65233612060547, 48.09284973144531]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 7.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 29.0, 25.0, 22.0, 27.0, 21.0, 31.0, 34.0, 30.0, 44.0, 36.0, 43.0, 40.0, 38.0, 52.0, 45.0, 28.0, 31.0, 33.0, 34.0, 37.0, 25.0, 21.0, 27.0, 27.0, 20.0, 18.0, 13.0, 22.0, 11.0, 14.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.140625, -8.87286376953125, -8.6051025390625, -8.33734130859375, -8.069580078125, -7.80181884765625, -7.5340576171875, -7.26629638671875, -6.99853515625, -6.73077392578125, -6.4630126953125, -6.19525146484375, -5.927490234375, -5.65972900390625, -5.3919677734375, -5.12420654296875, -4.8564453125, -4.58868408203125, -4.3209228515625, -4.05316162109375, -3.785400390625, -3.51763916015625, -3.2498779296875, -2.98211669921875, -2.71435546875, -2.44659423828125, -2.1788330078125, -1.91107177734375, -1.643310546875, -1.37554931640625, -1.1077880859375, -0.84002685546875, -0.572265625, -0.30450439453125, -0.0367431640625, 0.23101806640625, 0.498779296875, 0.76654052734375, 1.0343017578125, 1.30206298828125, 1.56982421875, 1.83758544921875, 2.1053466796875, 2.37310791015625, 2.640869140625, 2.90863037109375, 3.1763916015625, 3.44415283203125, 3.7119140625, 3.97967529296875, 4.2474365234375, 4.51519775390625, 4.782958984375, 5.05072021484375, 5.3184814453125, 5.58624267578125, 5.85400390625, 6.12176513671875, 6.3895263671875, 6.65728759765625, 6.925048828125, 7.19281005859375, 7.4605712890625, 7.72833251953125, 7.99609375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 14.0, 25.0, 27.0, 60.0, 63.0, 106.0, 187.0, 247.0, 410.0, 584.0, 842.0, 1332.0, 1939.0, 2943.0, 4412.0, 6547.0, 10009.0, 15489.0, 23968.0, 36990.0, 60034.0, 100488.0, 177163.0, 239744.0, 142199.0, 82301.0, 50067.0, 31524.0, 20123.0, 13081.0, 8687.0, 5711.0, 3787.0, 2475.0, 1689.0, 1090.0, 723.0, 484.0, 335.0, 227.0, 157.0, 87.0, 56.0, 44.0, 21.0, 23.0, 12.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.2275390625, -1.1906890869140625, -1.153839111328125, -1.1169891357421875, -1.08013916015625, -1.0432891845703125, -1.006439208984375, -0.9695892333984375, -0.9327392578125, -0.8958892822265625, -0.859039306640625, -0.8221893310546875, -0.78533935546875, -0.7484893798828125, -0.711639404296875, -0.6747894287109375, -0.637939453125, -0.6010894775390625, -0.564239501953125, -0.5273895263671875, -0.49053955078125, -0.4536895751953125, -0.416839599609375, -0.3799896240234375, -0.3431396484375, -0.3062896728515625, -0.269439697265625, -0.2325897216796875, -0.19573974609375, -0.1588897705078125, -0.122039794921875, -0.0851898193359375, -0.04833984375, -0.0114898681640625, 0.025360107421875, 0.0622100830078125, 0.09906005859375, 0.1359100341796875, 0.172760009765625, 0.2096099853515625, 0.2464599609375, 0.2833099365234375, 0.320159912109375, 0.3570098876953125, 0.39385986328125, 0.4307098388671875, 0.467559814453125, 0.5044097900390625, 0.541259765625, 0.5781097412109375, 0.614959716796875, 0.6518096923828125, 0.68865966796875, 0.7255096435546875, 0.762359619140625, 0.7992095947265625, 0.8360595703125, 0.8729095458984375, 0.909759521484375, 0.9466094970703125, 0.98345947265625, 1.0203094482421875, 1.057159423828125, 1.0940093994140625, 1.130859375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 2.0, 7.0, 10.0, 9.0, 8.0, 15.0, 17.0, 31.0, 27.0, 19.0, 24.0, 29.0, 33.0, 33.0, 34.0, 36.0, 41.0, 59.0, 46.0, 1067.0, 44.0, 46.0, 29.0, 38.0, 37.0, 29.0, 28.0, 35.0, 20.0, 24.0, 23.0, 23.0, 10.0, 19.0, 23.0, 15.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0], "bins": [-7.0234375, -6.83453369140625, -6.6456298828125, -6.45672607421875, -6.267822265625, -6.07891845703125, -5.8900146484375, -5.70111083984375, -5.51220703125, -5.32330322265625, -5.1343994140625, -4.94549560546875, -4.756591796875, -4.56768798828125, -4.3787841796875, -4.18988037109375, -4.0009765625, -3.81207275390625, -3.6231689453125, -3.43426513671875, -3.245361328125, -3.05645751953125, -2.8675537109375, -2.67864990234375, -2.48974609375, -2.30084228515625, -2.1119384765625, -1.92303466796875, -1.734130859375, -1.54522705078125, -1.3563232421875, -1.16741943359375, -0.978515625, -0.78961181640625, -0.6007080078125, -0.41180419921875, -0.222900390625, -0.03399658203125, 0.1549072265625, 0.34381103515625, 0.53271484375, 0.72161865234375, 0.9105224609375, 1.09942626953125, 1.288330078125, 1.47723388671875, 1.6661376953125, 1.85504150390625, 2.0439453125, 2.23284912109375, 2.4217529296875, 2.61065673828125, 2.799560546875, 2.98846435546875, 3.1773681640625, 3.36627197265625, 3.55517578125, 3.74407958984375, 3.9329833984375, 4.12188720703125, 4.310791015625, 4.49969482421875, 4.6885986328125, 4.87750244140625, 5.06640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 18.0, 15.0, 41.0, 57.0, 74.0, 110.0, 172.0, 231.0, 346.0, 542.0, 791.0, 1104.0, 1651.0, 2700.0, 4069.0, 6151.0, 9554.0, 14788.0, 23502.0, 38342.0, 66098.0, 115621.0, 224515.0, 1286260.0, 121842.0, 69081.0, 40469.0, 24602.0, 15469.0, 9942.0, 6511.0, 4252.0, 2781.0, 1852.0, 1183.0, 815.0, 528.0, 340.0, 234.0, 143.0, 106.0, 68.0, 50.0, 35.0, 23.0, 11.0, 9.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.23828125, -1.198394775390625, -1.15850830078125, -1.118621826171875, -1.0787353515625, -1.038848876953125, -0.99896240234375, -0.959075927734375, -0.919189453125, -0.879302978515625, -0.83941650390625, -0.799530029296875, -0.7596435546875, -0.719757080078125, -0.67987060546875, -0.639984130859375, -0.60009765625, -0.560211181640625, -0.52032470703125, -0.480438232421875, -0.4405517578125, -0.400665283203125, -0.36077880859375, -0.320892333984375, -0.281005859375, -0.241119384765625, -0.20123291015625, -0.161346435546875, -0.1214599609375, -0.081573486328125, -0.04168701171875, -0.001800537109375, 0.0380859375, 0.077972412109375, 0.11785888671875, 0.157745361328125, 0.1976318359375, 0.237518310546875, 0.27740478515625, 0.317291259765625, 0.357177734375, 0.397064208984375, 0.43695068359375, 0.476837158203125, 0.5167236328125, 0.556610107421875, 0.59649658203125, 0.636383056640625, 0.67626953125, 0.716156005859375, 0.75604248046875, 0.795928955078125, 0.8358154296875, 0.875701904296875, 0.91558837890625, 0.955474853515625, 0.995361328125, 1.035247802734375, 1.07513427734375, 1.115020751953125, 1.1549072265625, 1.194793701171875, 1.23468017578125, 1.274566650390625, 1.314453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 8.0, 7.0, 11.0, 15.0, 16.0, 17.0, 21.0, 28.0, 30.0, 24.0, 42.0, 36.0, 33.0, 58.0, 38.0, 58.0, 49.0, 47.0, 43.0, 60.0, 41.0, 50.0, 40.0, 28.0, 31.0, 27.0, 20.0, 17.0, 12.0, 15.0, 25.0, 7.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0011310577392578125, -0.0010954439640045166, -0.0010598301887512207, -0.0010242164134979248, -0.000988602638244629, -0.000952988862991333, -0.0009173750877380371, -0.0008817613124847412, -0.0008461475372314453, -0.0008105337619781494, -0.0007749199867248535, -0.0007393062114715576, -0.0007036924362182617, -0.0006680786609649658, -0.0006324648857116699, -0.000596851110458374, -0.0005612373352050781, -0.0005256235599517822, -0.0004900097846984863, -0.00045439600944519043, -0.00041878223419189453, -0.00038316845893859863, -0.00034755468368530273, -0.00031194090843200684, -0.00027632713317871094, -0.00024071335792541504, -0.00020509958267211914, -0.00016948580741882324, -0.00013387203216552734, -9.825825691223145e-05, -6.264448165893555e-05, -2.703070640563965e-05, 8.58306884765625e-06, 4.419684410095215e-05, 7.981061935424805e-05, 0.00011542439460754395, 0.00015103816986083984, 0.00018665194511413574, 0.00022226572036743164, 0.00025787949562072754, 0.00029349327087402344, 0.00032910704612731934, 0.00036472082138061523, 0.00040033459663391113, 0.00043594837188720703, 0.00047156214714050293, 0.0005071759223937988, 0.0005427896976470947, 0.0005784034729003906, 0.0006140172481536865, 0.0006496310234069824, 0.0006852447986602783, 0.0007208585739135742, 0.0007564723491668701, 0.000792086124420166, 0.0008276998996734619, 0.0008633136749267578, 0.0008989274501800537, 0.0009345412254333496, 0.0009701550006866455, 0.0010057687759399414, 0.0010413825511932373, 0.0010769963264465332, 0.001112610101699829, 0.001148223876953125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 6.0, 5.0, 6.0, 9.0, 15.0, 23.0, 24.0, 29.0, 34.0, 42.0, 52.0, 69.0, 95.0, 163.0, 230.0, 396.0, 808.0, 11864.0, 1027184.0, 5615.0, 754.0, 351.0, 202.0, 125.0, 123.0, 64.0, 64.0, 41.0, 29.0, 18.0, 19.0, 20.0, 15.0, 10.0, 8.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.02825927734375, -0.02741408348083496, -0.026568889617919922, -0.025723695755004883, -0.024878501892089844, -0.024033308029174805, -0.023188114166259766, -0.022342920303344727, -0.021497726440429688, -0.02065253257751465, -0.01980733871459961, -0.01896214485168457, -0.01811695098876953, -0.017271757125854492, -0.016426563262939453, -0.015581369400024414, -0.014736175537109375, -0.013890981674194336, -0.013045787811279297, -0.012200593948364258, -0.011355400085449219, -0.01051020622253418, -0.00966501235961914, -0.008819818496704102, -0.007974624633789062, -0.0071294307708740234, -0.006284236907958984, -0.005439043045043945, -0.004593849182128906, -0.003748655319213867, -0.002903461456298828, -0.002058267593383789, -0.00121307373046875, -0.00036787986755371094, 0.0004773139953613281, 0.0013225078582763672, 0.0021677017211914062, 0.0030128955841064453, 0.0038580894470214844, 0.0047032833099365234, 0.0055484771728515625, 0.0063936710357666016, 0.007238864898681641, 0.00808405876159668, 0.008929252624511719, 0.009774446487426758, 0.010619640350341797, 0.011464834213256836, 0.012310028076171875, 0.013155221939086914, 0.014000415802001953, 0.014845609664916992, 0.01569080352783203, 0.01653599739074707, 0.01738119125366211, 0.01822638511657715, 0.019071578979492188, 0.019916772842407227, 0.020761966705322266, 0.021607160568237305, 0.022452354431152344, 0.023297548294067383, 0.024142742156982422, 0.02498793601989746, 0.0258331298828125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 83.0, 825.0, 105.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002308284630998969, -0.0021083722822368145, -0.0019084600498899817, -0.0017085477011278272, -0.0015086354687809944, -0.0013087231200188398, -0.0011088107712566853, -0.0009088985389098525, -0.0007089861901476979, -0.0005090738995932043, -0.00030916157993488014, -0.00010924926027655602, 9.066303027793765e-05, 0.0002905753208324313, 0.0004904876695945859, 0.0006903999019414186, 0.0008903122507035732, 0.0010902245994657278, 0.0012901368318125606, 0.0014900491805747151, 0.0016899614129215479, 0.0018898737616837025, 0.002089786110445857, 0.0022896984592080116, 0.0024896105751395226, 0.002689522923901677, 0.0028894352726638317, 0.0030893473885953426, 0.003289259737357497, 0.003489172086119652, 0.0036890844348818064, 0.003888996783643961, 0.004088908899575472, 0.004288821015506983, 0.004488733597099781, 0.004688645713031292, 0.00488855829462409, 0.005088470410555601, 0.005288382992148399, 0.00548829510807991, 0.005688207224011421, 0.005888119339942932, 0.00608803192153573, 0.006287944037467241, 0.0064878566190600395, 0.0066877687349915504, 0.006887680850923061, 0.00708759343251586, 0.007287506014108658, 0.007487418130040169, 0.007687330711632967, 0.007887243293225765, 0.008087155409157276, 0.008287067525088787, 0.008486979641020298, 0.008686891756951809, 0.00888680387288332, 0.00908671598881483, 0.009286628104746342, 0.009486541152000427, 0.009686453267931938, 0.009886365383863449, 0.01008627749979496, 0.010286189615726471, 0.010486102662980556]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 7.0, 8.0, 9.0, 5.0, 9.0, 12.0, 18.0, 13.0, 16.0, 24.0, 25.0, 25.0, 32.0, 20.0, 36.0, 28.0, 32.0, 35.0, 37.0, 37.0, 35.0, 29.0, 41.0, 30.0, 46.0, 43.0, 43.0, 25.0, 38.0, 26.0, 20.0, 23.0, 29.0, 17.0, 22.0, 23.0, 13.0, 10.0, 14.0, 9.0, 8.0, 5.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0006107091903686523, -0.0005917353555560112, -0.0005727615207433701, -0.0005537876859307289, -0.0005348138511180878, -0.0005158400163054466, -0.0004968661814928055, -0.00047789234668016434, -0.0004589185118675232, -0.00043994467705488205, -0.0004209708422422409, -0.00040199700742959976, -0.0003830231726169586, -0.0003640493378043175, -0.00034507550299167633, -0.0003261016681790352, -0.00030712783336639404, -0.0002881539985537529, -0.00026918016374111176, -0.0002502063289284706, -0.00023123249411582947, -0.00021225865930318832, -0.00019328482449054718, -0.00017431098967790604, -0.0001553371548652649, -0.00013636332005262375, -0.0001173894852399826, -9.841565042734146e-05, -7.944181561470032e-05, -6.0467980802059174e-05, -4.149414598941803e-05, -2.2520311176776886e-05, -3.546476364135742e-06, 1.54273584485054e-05, 3.4401193261146545e-05, 5.337502807378769e-05, 7.234886288642883e-05, 9.132269769906998e-05, 0.00011029653251171112, 0.00012927036732435226, 0.0001482442021369934, 0.00016721803694963455, 0.0001861918717622757, 0.00020516570657491684, 0.00022413954138755798, 0.00024311337620019913, 0.00026208721101284027, 0.0002810610458254814, 0.00030003488063812256, 0.0003190087154507637, 0.00033798255026340485, 0.000356956385076046, 0.00037593021988868713, 0.0003949040547013283, 0.0004138778895139694, 0.00043285172432661057, 0.0004518255591392517, 0.00047079939395189285, 0.000489773228764534, 0.0005087470635771751, 0.0005277208983898163, 0.0005466947332024574, 0.0005656685680150986, 0.0005846424028277397, 0.0006036162376403809]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 7.0, 7.0, 8.0, 9.0, 15.0, 11.0, 17.0, 29.0, 25.0, 22.0, 27.0, 21.0, 31.0, 34.0, 30.0, 44.0, 36.0, 43.0, 40.0, 38.0, 52.0, 45.0, 28.0, 31.0, 33.0, 34.0, 37.0, 25.0, 21.0, 27.0, 27.0, 20.0, 18.0, 13.0, 22.0, 11.0, 14.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-9.140625, -8.87286376953125, -8.6051025390625, -8.33734130859375, -8.069580078125, -7.80181884765625, -7.5340576171875, -7.26629638671875, -6.99853515625, -6.73077392578125, -6.4630126953125, -6.19525146484375, -5.927490234375, -5.65972900390625, -5.3919677734375, -5.12420654296875, -4.8564453125, -4.58868408203125, -4.3209228515625, -4.05316162109375, -3.785400390625, -3.51763916015625, -3.2498779296875, -2.98211669921875, -2.71435546875, -2.44659423828125, -2.1788330078125, -1.91107177734375, -1.643310546875, -1.37554931640625, -1.1077880859375, -0.84002685546875, -0.572265625, -0.30450439453125, -0.0367431640625, 0.23101806640625, 0.498779296875, 0.76654052734375, 1.0343017578125, 1.30206298828125, 1.56982421875, 1.83758544921875, 2.1053466796875, 2.37310791015625, 2.640869140625, 2.90863037109375, 3.1763916015625, 3.44415283203125, 3.7119140625, 3.97967529296875, 4.2474365234375, 4.51519775390625, 4.782958984375, 5.05072021484375, 5.3184814453125, 5.58624267578125, 5.85400390625, 6.12176513671875, 6.3895263671875, 6.65728759765625, 6.925048828125, 7.19281005859375, 7.4605712890625, 7.72833251953125, 7.99609375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 7.0, 6.0, 19.0, 20.0, 15.0, 31.0, 32.0, 48.0, 64.0, 95.0, 103.0, 148.0, 205.0, 359.0, 603.0, 1062.0, 2353.0, 5357.0, 12599.0, 33849.0, 103893.0, 403023.0, 345033.0, 89283.0, 29598.0, 11374.0, 4600.0, 2110.0, 1035.0, 527.0, 309.0, 193.0, 137.0, 90.0, 90.0, 69.0, 55.0, 31.0, 28.0, 22.0, 21.0, 15.0, 12.0, 9.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.5, -11.1611328125, -10.822265625, -10.4833984375, -10.14453125, -9.8056640625, -9.466796875, -9.1279296875, -8.7890625, -8.4501953125, -8.111328125, -7.7724609375, -7.43359375, -7.0947265625, -6.755859375, -6.4169921875, -6.078125, -5.7392578125, -5.400390625, -5.0615234375, -4.72265625, -4.3837890625, -4.044921875, -3.7060546875, -3.3671875, -3.0283203125, -2.689453125, -2.3505859375, -2.01171875, -1.6728515625, -1.333984375, -0.9951171875, -0.65625, -0.3173828125, 0.021484375, 0.3603515625, 0.69921875, 1.0380859375, 1.376953125, 1.7158203125, 2.0546875, 2.3935546875, 2.732421875, 3.0712890625, 3.41015625, 3.7490234375, 4.087890625, 4.4267578125, 4.765625, 5.1044921875, 5.443359375, 5.7822265625, 6.12109375, 6.4599609375, 6.798828125, 7.1376953125, 7.4765625, 7.8154296875, 8.154296875, 8.4931640625, 8.83203125, 9.1708984375, 9.509765625, 9.8486328125, 10.1875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 0.0, 4.0, 6.0, 6.0, 4.0, 5.0, 13.0, 10.0, 16.0, 12.0, 24.0, 16.0, 12.0, 33.0, 29.0, 36.0, 34.0, 52.0, 45.0, 63.0, 83.0, 144.0, 1559.0, 291.0, 120.0, 80.0, 44.0, 38.0, 44.0, 36.0, 32.0, 22.0, 30.0, 25.0, 12.0, 18.0, 14.0, 12.0, 6.0, 5.0, 7.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.872802734375, -28.04248046875, -27.212158203125, -26.3818359375, -25.551513671875, -24.72119140625, -23.890869140625, -23.060546875, -22.230224609375, -21.39990234375, -20.569580078125, -19.7392578125, -18.908935546875, -18.07861328125, -17.248291015625, -16.41796875, -15.587646484375, -14.75732421875, -13.927001953125, -13.0966796875, -12.266357421875, -11.43603515625, -10.605712890625, -9.775390625, -8.945068359375, -8.11474609375, -7.284423828125, -6.4541015625, -5.623779296875, -4.79345703125, -3.963134765625, -3.1328125, -2.302490234375, -1.47216796875, -0.641845703125, 0.1884765625, 1.018798828125, 1.84912109375, 2.679443359375, 3.509765625, 4.340087890625, 5.17041015625, 6.000732421875, 6.8310546875, 7.661376953125, 8.49169921875, 9.322021484375, 10.15234375, 10.982666015625, 11.81298828125, 12.643310546875, 13.4736328125, 14.303955078125, 15.13427734375, 15.964599609375, 16.794921875, 17.625244140625, 18.45556640625, 19.285888671875, 20.1162109375, 20.946533203125, 21.77685546875, 22.607177734375, 23.4375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 13.0, 12.0, 14.0, 27.0, 40.0, 44.0, 73.0, 106.0, 161.0, 218.0, 371.0, 704.0, 3637.0, 162702.0, 2944948.0, 29609.0, 1582.0, 497.0, 286.0, 195.0, 135.0, 95.0, 65.0, 36.0, 37.0, 16.0, 23.0, 7.0, 7.0, 8.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.3125, -43.865234375, -42.41796875, -40.970703125, -39.5234375, -38.076171875, -36.62890625, -35.181640625, -33.734375, -32.287109375, -30.83984375, -29.392578125, -27.9453125, -26.498046875, -25.05078125, -23.603515625, -22.15625, -20.708984375, -19.26171875, -17.814453125, -16.3671875, -14.919921875, -13.47265625, -12.025390625, -10.578125, -9.130859375, -7.68359375, -6.236328125, -4.7890625, -3.341796875, -1.89453125, -0.447265625, 1.0, 2.447265625, 3.89453125, 5.341796875, 6.7890625, 8.236328125, 9.68359375, 11.130859375, 12.578125, 14.025390625, 15.47265625, 16.919921875, 18.3671875, 19.814453125, 21.26171875, 22.708984375, 24.15625, 25.603515625, 27.05078125, 28.498046875, 29.9453125, 31.392578125, 32.83984375, 34.287109375, 35.734375, 37.181640625, 38.62890625, 40.076171875, 41.5234375, 42.970703125, 44.41796875, 45.865234375, 47.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 42.0, 681.0, 289.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.56501770019531, -38.866973876953125, -32.16893005371094, -25.470890045166016, -18.772846221923828, -12.07480239868164, -5.376762390136719, 1.3212814331054688, 8.019325256347656, 14.717368125915527, 21.4154109954834, 28.113452911376953, 34.81149673461914, 41.50954055786133, 48.20758056640625, 54.90562438964844, 61.603668212890625, 68.30171203613281, 74.999755859375, 81.69779968261719, 88.39584350585938, 95.09388732910156, 101.79192352294922, 108.4899673461914, 115.1880111694336, 121.88605499267578, 128.58409118652344, 135.28213500976562, 141.9801788330078, 148.67822265625, 155.3762664794922, 162.07431030273438, 168.77236938476562, 175.4704132080078, 182.16845703125, 188.8665008544922, 195.56454467773438, 202.26258850097656, 208.96063232421875, 215.65866088867188, 222.35671997070312, 229.0547637939453, 235.7528076171875, 242.4508514404297, 249.14889526367188, 255.84693908691406, 262.54498291015625, 269.2430114746094, 275.9410400390625, 282.6390686035156, 289.3371276855469, 296.03515625, 302.73321533203125, 309.4312438964844, 316.1293029785156, 322.82733154296875, 329.525390625, 336.2234191894531, 342.9214782714844, 349.6195068359375, 356.31756591796875, 363.0155944824219, 369.7136535644531, 376.41168212890625, 383.1097412109375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 1.0, 3.0, 6.0, 5.0, 13.0, 14.0, 12.0, 15.0, 11.0, 13.0, 16.0, 33.0, 25.0, 37.0, 39.0, 47.0, 44.0, 54.0, 44.0, 40.0, 54.0, 45.0, 60.0, 54.0, 29.0, 39.0, 43.0, 43.0, 32.0, 25.0, 12.0, 12.0, 15.0, 17.0, 9.0, 15.0, 9.0, 8.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.05754089355469, -69.03910827636719, -67.02067565917969, -65.00224304199219, -62.98381423950195, -60.96538162231445, -58.94695281982422, -56.92852020263672, -54.91008758544922, -52.89165496826172, -50.87322235107422, -48.854793548583984, -46.836360931396484, -44.817928314208984, -42.79949951171875, -40.78106689453125, -38.76263427734375, -36.74420166015625, -34.72576904296875, -32.707340240478516, -30.688907623291016, -28.670475006103516, -26.65204429626465, -24.63361358642578, -22.61518096923828, -20.59674835205078, -18.578317642211914, -16.559886932373047, -14.541454315185547, -12.523022651672363, -10.50459098815918, -8.486159324645996, -6.4677276611328125, -4.449295997619629, -2.4308643341064453, -0.4124326705932617, 1.6059989929199219, 3.6244306564331055, 5.642862319946289, 7.661293983459473, 9.679725646972656, 11.69815731048584, 13.716588973999023, 15.735020637512207, 17.75345230102539, 19.77188491821289, 21.790315628051758, 23.808746337890625, 25.827178955078125, 27.845611572265625, 29.864042282104492, 31.88247299194336, 33.90090560913086, 35.91933822631836, 37.937767028808594, 39.956199645996094, 41.974632263183594, 43.993064880371094, 46.011497497558594, 48.02992630004883, 50.04835891723633, 52.06679153442383, 54.08522033691406, 56.10365295410156, 58.12208557128906]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 14.0, 13.0, 16.0, 20.0, 20.0, 24.0, 22.0, 21.0, 33.0, 40.0, 33.0, 31.0, 55.0, 45.0, 48.0, 34.0, 51.0, 36.0, 40.0, 31.0, 36.0, 40.0, 26.0, 24.0, 22.0, 34.0, 34.0, 20.0, 27.0, 17.0, 18.0, 12.0, 15.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.890625, -9.5947265625, -9.298828125, -9.0029296875, -8.70703125, -8.4111328125, -8.115234375, -7.8193359375, -7.5234375, -7.2275390625, -6.931640625, -6.6357421875, -6.33984375, -6.0439453125, -5.748046875, -5.4521484375, -5.15625, -4.8603515625, -4.564453125, -4.2685546875, -3.97265625, -3.6767578125, -3.380859375, -3.0849609375, -2.7890625, -2.4931640625, -2.197265625, -1.9013671875, -1.60546875, -1.3095703125, -1.013671875, -0.7177734375, -0.421875, -0.1259765625, 0.169921875, 0.4658203125, 0.76171875, 1.0576171875, 1.353515625, 1.6494140625, 1.9453125, 2.2412109375, 2.537109375, 2.8330078125, 3.12890625, 3.4248046875, 3.720703125, 4.0166015625, 4.3125, 4.6083984375, 4.904296875, 5.2001953125, 5.49609375, 5.7919921875, 6.087890625, 6.3837890625, 6.6796875, 6.9755859375, 7.271484375, 7.5673828125, 7.86328125, 8.1591796875, 8.455078125, 8.7509765625, 9.046875]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 5.0, 10.0, 6.0, 16.0, 14.0, 16.0, 26.0, 14.0, 33.0, 31.0, 49.0, 76.0, 112.0, 259.0, 684.0, 4031.0, 87364.0, 2829103.0, 1246305.0, 23060.0, 2005.0, 485.0, 172.0, 89.0, 71.0, 43.0, 32.0, 25.0, 15.0, 22.0, 15.0, 17.0, 6.0, 5.0, 12.0, 12.0, 8.0, 6.0, 10.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.724365234375, -27.79248046875, -26.860595703125, -25.9287109375, -24.996826171875, -24.06494140625, -23.133056640625, -22.201171875, -21.269287109375, -20.33740234375, -19.405517578125, -18.4736328125, -17.541748046875, -16.60986328125, -15.677978515625, -14.74609375, -13.814208984375, -12.88232421875, -11.950439453125, -11.0185546875, -10.086669921875, -9.15478515625, -8.222900390625, -7.291015625, -6.359130859375, -5.42724609375, -4.495361328125, -3.5634765625, -2.631591796875, -1.69970703125, -0.767822265625, 0.1640625, 1.095947265625, 2.02783203125, 2.959716796875, 3.8916015625, 4.823486328125, 5.75537109375, 6.687255859375, 7.619140625, 8.551025390625, 9.48291015625, 10.414794921875, 11.3466796875, 12.278564453125, 13.21044921875, 14.142333984375, 15.07421875, 16.006103515625, 16.93798828125, 17.869873046875, 18.8017578125, 19.733642578125, 20.66552734375, 21.597412109375, 22.529296875, 23.461181640625, 24.39306640625, 25.324951171875, 26.2568359375, 27.188720703125, 28.12060546875, 29.052490234375, 29.984375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 10.0, 5.0, 8.0, 14.0, 21.0, 19.0, 44.0, 58.0, 61.0, 101.0, 124.0, 212.0, 310.0, 400.0, 498.0, 514.0, 441.0, 344.0, 249.0, 183.0, 143.0, 76.0, 71.0, 37.0, 23.0, 24.0, 20.0, 17.0, 10.0, 6.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.609375, -16.185302734375, -15.76123046875, -15.337158203125, -14.9130859375, -14.489013671875, -14.06494140625, -13.640869140625, -13.216796875, -12.792724609375, -12.36865234375, -11.944580078125, -11.5205078125, -11.096435546875, -10.67236328125, -10.248291015625, -9.82421875, -9.400146484375, -8.97607421875, -8.552001953125, -8.1279296875, -7.703857421875, -7.27978515625, -6.855712890625, -6.431640625, -6.007568359375, -5.58349609375, -5.159423828125, -4.7353515625, -4.311279296875, -3.88720703125, -3.463134765625, -3.0390625, -2.614990234375, -2.19091796875, -1.766845703125, -1.3427734375, -0.918701171875, -0.49462890625, -0.070556640625, 0.353515625, 0.777587890625, 1.20166015625, 1.625732421875, 2.0498046875, 2.473876953125, 2.89794921875, 3.322021484375, 3.74609375, 4.170166015625, 4.59423828125, 5.018310546875, 5.4423828125, 5.866455078125, 6.29052734375, 6.714599609375, 7.138671875, 7.562744140625, 7.98681640625, 8.410888671875, 8.8349609375, 9.259033203125, 9.68310546875, 10.107177734375, 10.53125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 11.0, 6.0, 11.0, 11.0, 19.0, 37.0, 53.0, 70.0, 139.0, 196.0, 420.0, 1200.0, 5603.0, 70760.0, 3135176.0, 948953.0, 27116.0, 2964.0, 745.0, 324.0, 173.0, 112.0, 56.0, 31.0, 28.0, 16.0, 7.0, 9.0, 11.0, 2.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.59375, -37.48583984375, -36.3779296875, -35.27001953125, -34.162109375, -33.05419921875, -31.9462890625, -30.83837890625, -29.73046875, -28.62255859375, -27.5146484375, -26.40673828125, -25.298828125, -24.19091796875, -23.0830078125, -21.97509765625, -20.8671875, -19.75927734375, -18.6513671875, -17.54345703125, -16.435546875, -15.32763671875, -14.2197265625, -13.11181640625, -12.00390625, -10.89599609375, -9.7880859375, -8.68017578125, -7.572265625, -6.46435546875, -5.3564453125, -4.24853515625, -3.140625, -2.03271484375, -0.9248046875, 0.18310546875, 1.291015625, 2.39892578125, 3.5068359375, 4.61474609375, 5.72265625, 6.83056640625, 7.9384765625, 9.04638671875, 10.154296875, 11.26220703125, 12.3701171875, 13.47802734375, 14.5859375, 15.69384765625, 16.8017578125, 17.90966796875, 19.017578125, 20.12548828125, 21.2333984375, 22.34130859375, 23.44921875, 24.55712890625, 25.6650390625, 26.77294921875, 27.880859375, 28.98876953125, 30.0966796875, 31.20458984375, 32.3125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 227.0, 744.0, 37.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-696.3347778320312, -684.169921875, -672.0050659179688, -659.8402709960938, -647.6754150390625, -635.5105590820312, -623.345703125, -611.1808471679688, -599.0159912109375, -586.8511352539062, -574.686279296875, -562.521484375, -550.3566284179688, -538.1917724609375, -526.0269165039062, -513.862060546875, -501.697265625, -489.53240966796875, -477.3675842285156, -465.2027282714844, -453.03790283203125, -440.873046875, -428.70819091796875, -416.5433349609375, -404.3785095214844, -392.2136535644531, -380.048828125, -367.88397216796875, -355.7191162109375, -343.5542907714844, -331.3894348144531, -319.224609375, -307.0597229003906, -294.8948669433594, -282.73004150390625, -270.565185546875, -258.40032958984375, -246.23550415039062, -234.07064819335938, -221.9058074951172, -209.740966796875, -197.5761260986328, -185.41128540039062, -173.24642944335938, -161.0815887451172, -148.916748046875, -136.75189208984375, -124.58705139160156, -112.4222183227539, -100.25736999511719, -88.092529296875, -75.92768859863281, -63.762840270996094, -51.59799575805664, -39.43315124511719, -27.26830291748047, -15.103462219238281, -2.938617706298828, 9.226226806640625, 21.391071319580078, 33.55591583251953, 45.720760345458984, 57.88560485839844, 70.05045318603516, 82.21529388427734]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 1.0, 10.0, 9.0, 11.0, 10.0, 20.0, 13.0, 19.0, 29.0, 24.0, 30.0, 17.0, 20.0, 24.0, 31.0, 34.0, 44.0, 41.0, 33.0, 34.0, 37.0, 44.0, 37.0, 27.0, 35.0, 35.0, 25.0, 22.0, 30.0, 24.0, 28.0, 26.0, 20.0, 18.0, 20.0, 16.0, 19.0, 14.0, 7.0, 9.0, 10.0, 12.0, 6.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-46.863319396972656, -45.53775405883789, -44.212188720703125, -42.886619567871094, -41.56105422973633, -40.23548889160156, -38.9099235534668, -37.58435821533203, -36.2587890625, -34.933223724365234, -33.60765838623047, -32.28208923339844, -30.956523895263672, -29.630958557128906, -28.30539321899414, -26.979825973510742, -25.654260635375977, -24.32869529724121, -23.003128051757812, -21.677562713623047, -20.35199546813965, -19.026430130004883, -17.700862884521484, -16.37529754638672, -15.049731254577637, -13.724164962768555, -12.398598670959473, -11.07303237915039, -9.747467041015625, -8.421899795532227, -7.096334457397461, -5.770768165588379, -4.445201873779297, -3.119635581970215, -1.794069528579712, -0.468503475189209, 0.857062816619873, 2.182629108428955, 3.508194923400879, 4.833761215209961, 6.159327507019043, 7.484893798828125, 8.810460090637207, 10.136026382446289, 11.461591720581055, 12.787158966064453, 14.112724304199219, 15.4382905960083, 16.763856887817383, 18.08942222595215, 19.414989471435547, 20.740554809570312, 22.06612205505371, 23.391687393188477, 24.717254638671875, 26.04281997680664, 27.368385314941406, 28.693950653076172, 30.01951789855957, 31.345083236694336, 32.670650482177734, 33.9962158203125, 35.321781158447266, 36.64734649658203, 37.97291564941406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 6.0, 8.0, 8.0, 11.0, 13.0, 15.0, 21.0, 10.0, 30.0, 23.0, 20.0, 33.0, 36.0, 52.0, 43.0, 28.0, 39.0, 43.0, 44.0, 56.0, 45.0, 39.0, 28.0, 49.0, 32.0, 32.0, 35.0, 33.0, 31.0, 20.0, 27.0, 24.0, 16.0, 14.0, 8.0, 5.0, 4.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.65380859375, -8.3388671875, -8.02392578125, -7.708984375, -7.39404296875, -7.0791015625, -6.76416015625, -6.44921875, -6.13427734375, -5.8193359375, -5.50439453125, -5.189453125, -4.87451171875, -4.5595703125, -4.24462890625, -3.9296875, -3.61474609375, -3.2998046875, -2.98486328125, -2.669921875, -2.35498046875, -2.0400390625, -1.72509765625, -1.41015625, -1.09521484375, -0.7802734375, -0.46533203125, -0.150390625, 0.16455078125, 0.4794921875, 0.79443359375, 1.109375, 1.42431640625, 1.7392578125, 2.05419921875, 2.369140625, 2.68408203125, 2.9990234375, 3.31396484375, 3.62890625, 3.94384765625, 4.2587890625, 4.57373046875, 4.888671875, 5.20361328125, 5.5185546875, 5.83349609375, 6.1484375, 6.46337890625, 6.7783203125, 7.09326171875, 7.408203125, 7.72314453125, 8.0380859375, 8.35302734375, 8.66796875, 8.98291015625, 9.2978515625, 9.61279296875, 9.927734375, 10.24267578125, 10.5576171875, 10.87255859375, 11.1875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 18.0, 28.0, 47.0, 72.0, 108.0, 194.0, 288.0, 548.0, 903.0, 1523.0, 2516.0, 4187.0, 7288.0, 12065.0, 20838.0, 35623.0, 63270.0, 115329.0, 229149.0, 258577.0, 130010.0, 70473.0, 39592.0, 22966.0, 13525.0, 7861.0, 4724.0, 2765.0, 1630.0, 920.0, 579.0, 377.0, 213.0, 137.0, 76.0, 45.0, 26.0, 15.0, 11.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.412109375, -1.3635711669921875, -1.315032958984375, -1.2664947509765625, -1.21795654296875, -1.1694183349609375, -1.120880126953125, -1.0723419189453125, -1.0238037109375, -0.9752655029296875, -0.926727294921875, -0.8781890869140625, -0.82965087890625, -0.7811126708984375, -0.732574462890625, -0.6840362548828125, -0.635498046875, -0.5869598388671875, -0.538421630859375, -0.4898834228515625, -0.44134521484375, -0.3928070068359375, -0.344268798828125, -0.2957305908203125, -0.2471923828125, -0.1986541748046875, -0.150115966796875, -0.1015777587890625, -0.05303955078125, -0.0045013427734375, 0.044036865234375, 0.0925750732421875, 0.14111328125, 0.1896514892578125, 0.238189697265625, 0.2867279052734375, 0.33526611328125, 0.3838043212890625, 0.432342529296875, 0.4808807373046875, 0.5294189453125, 0.5779571533203125, 0.626495361328125, 0.6750335693359375, 0.72357177734375, 0.7721099853515625, 0.820648193359375, 0.8691864013671875, 0.917724609375, 0.9662628173828125, 1.014801025390625, 1.0633392333984375, 1.11187744140625, 1.1604156494140625, 1.208953857421875, 1.2574920654296875, 1.3060302734375, 1.3545684814453125, 1.403106689453125, 1.4516448974609375, 1.50018310546875, 1.5487213134765625, 1.597259521484375, 1.6457977294921875, 1.6943359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 11.0, 16.0, 10.0, 18.0, 10.0, 22.0, 18.0, 22.0, 21.0, 22.0, 27.0, 48.0, 40.0, 42.0, 44.0, 28.0, 47.0, 1062.0, 47.0, 44.0, 28.0, 30.0, 32.0, 32.0, 30.0, 27.0, 27.0, 27.0, 26.0, 19.0, 14.0, 13.0, 21.0, 15.0, 14.0, 12.0, 10.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.3125, -5.132568359375, -4.95263671875, -4.772705078125, -4.5927734375, -4.412841796875, -4.23291015625, -4.052978515625, -3.873046875, -3.693115234375, -3.51318359375, -3.333251953125, -3.1533203125, -2.973388671875, -2.79345703125, -2.613525390625, -2.43359375, -2.253662109375, -2.07373046875, -1.893798828125, -1.7138671875, -1.533935546875, -1.35400390625, -1.174072265625, -0.994140625, -0.814208984375, -0.63427734375, -0.454345703125, -0.2744140625, -0.094482421875, 0.08544921875, 0.265380859375, 0.4453125, 0.625244140625, 0.80517578125, 0.985107421875, 1.1650390625, 1.344970703125, 1.52490234375, 1.704833984375, 1.884765625, 2.064697265625, 2.24462890625, 2.424560546875, 2.6044921875, 2.784423828125, 2.96435546875, 3.144287109375, 3.32421875, 3.504150390625, 3.68408203125, 3.864013671875, 4.0439453125, 4.223876953125, 4.40380859375, 4.583740234375, 4.763671875, 4.943603515625, 5.12353515625, 5.303466796875, 5.4833984375, 5.663330078125, 5.84326171875, 6.023193359375, 6.203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 13.0, 14.0, 23.0, 40.0, 43.0, 83.0, 94.0, 137.0, 199.0, 299.0, 392.0, 618.0, 808.0, 1224.0, 1793.0, 2437.0, 3505.0, 5132.0, 7553.0, 10931.0, 16546.0, 24647.0, 38864.0, 62843.0, 103005.0, 174822.0, 1276958.0, 136090.0, 81617.0, 50302.0, 31558.0, 20443.0, 13815.0, 9368.0, 6368.0, 4363.0, 3081.0, 2109.0, 1495.0, 1100.0, 706.0, 517.0, 361.0, 243.0, 160.0, 130.0, 77.0, 61.0, 49.0, 22.0, 20.0, 15.0, 12.0, 5.0, 5.0, 2.0, 8.0], "bins": [-1.2001953125, -1.16412353515625, -1.1280517578125, -1.09197998046875, -1.055908203125, -1.01983642578125, -0.9837646484375, -0.94769287109375, -0.91162109375, -0.87554931640625, -0.8394775390625, -0.80340576171875, -0.767333984375, -0.73126220703125, -0.6951904296875, -0.65911865234375, -0.623046875, -0.58697509765625, -0.5509033203125, -0.51483154296875, -0.478759765625, -0.44268798828125, -0.4066162109375, -0.37054443359375, -0.33447265625, -0.29840087890625, -0.2623291015625, -0.22625732421875, -0.190185546875, -0.15411376953125, -0.1180419921875, -0.08197021484375, -0.0458984375, -0.00982666015625, 0.0262451171875, 0.06231689453125, 0.098388671875, 0.13446044921875, 0.1705322265625, 0.20660400390625, 0.24267578125, 0.27874755859375, 0.3148193359375, 0.35089111328125, 0.386962890625, 0.42303466796875, 0.4591064453125, 0.49517822265625, 0.53125, 0.56732177734375, 0.6033935546875, 0.63946533203125, 0.675537109375, 0.71160888671875, 0.7476806640625, 0.78375244140625, 0.81982421875, 0.85589599609375, 0.8919677734375, 0.92803955078125, 0.964111328125, 1.00018310546875, 1.0362548828125, 1.07232666015625, 1.1083984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 12.0, 19.0, 14.0, 23.0, 21.0, 33.0, 42.0, 44.0, 40.0, 57.0, 69.0, 66.0, 68.0, 59.0, 67.0, 58.0, 61.0, 39.0, 34.0, 31.0, 20.0, 14.0, 12.0, 7.0, 7.0, 10.0, 9.0, 7.0, 1.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0015668869018554688, -0.0015215426683425903, -0.001476198434829712, -0.0014308542013168335, -0.001385509967803955, -0.0013401657342910767, -0.0012948215007781982, -0.0012494772672653198, -0.0012041330337524414, -0.001158788800239563, -0.0011134445667266846, -0.0010681003332138062, -0.0010227560997009277, -0.0009774118661880493, -0.0009320676326751709, -0.0008867233991622925, -0.0008413791656494141, -0.0007960349321365356, -0.0007506906986236572, -0.0007053464651107788, -0.0006600022315979004, -0.000614657998085022, -0.0005693137645721436, -0.0005239695310592651, -0.0004786252975463867, -0.0004332810640335083, -0.0003879368305206299, -0.00034259259700775146, -0.00029724836349487305, -0.00025190412998199463, -0.0002065598964691162, -0.0001612156629562378, -0.00011587142944335938, -7.052719593048096e-05, -2.518296241760254e-05, 2.016127109527588e-05, 6.55055046081543e-05, 0.00011084973812103271, 0.00015619397163391113, 0.00020153820514678955, 0.00024688243865966797, 0.0002922266721725464, 0.0003375709056854248, 0.0003829151391983032, 0.00042825937271118164, 0.00047360360622406006, 0.0005189478397369385, 0.0005642920732498169, 0.0006096363067626953, 0.0006549805402755737, 0.0007003247737884521, 0.0007456690073013306, 0.000791013240814209, 0.0008363574743270874, 0.0008817017078399658, 0.0009270459413528442, 0.0009723901748657227, 0.001017734408378601, 0.0010630786418914795, 0.001108422875404358, 0.0011537671089172363, 0.0011991113424301147, 0.0012444555759429932, 0.0012897998094558716, 0.00133514404296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 8.0, 7.0, 7.0, 11.0, 13.0, 16.0, 22.0, 18.0, 16.0, 34.0, 54.0, 70.0, 124.0, 176.0, 307.0, 695.0, 24000.0, 1020271.0, 1485.0, 457.0, 231.0, 162.0, 97.0, 68.0, 38.0, 43.0, 31.0, 20.0, 11.0, 14.0, 15.0, 6.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029632568359375, -0.02850341796875, -0.027374267578125, -0.0262451171875, -0.025115966796875, -0.02398681640625, -0.022857666015625, -0.021728515625, -0.020599365234375, -0.01947021484375, -0.018341064453125, -0.0172119140625, -0.016082763671875, -0.01495361328125, -0.013824462890625, -0.0126953125, -0.011566162109375, -0.01043701171875, -0.009307861328125, -0.0081787109375, -0.007049560546875, -0.00592041015625, -0.004791259765625, -0.003662109375, -0.002532958984375, -0.00140380859375, -0.000274658203125, 0.0008544921875, 0.001983642578125, 0.00311279296875, 0.004241943359375, 0.00537109375, 0.006500244140625, 0.00762939453125, 0.008758544921875, 0.0098876953125, 0.011016845703125, 0.01214599609375, 0.013275146484375, 0.014404296875, 0.015533447265625, 0.01666259765625, 0.017791748046875, 0.0189208984375, 0.020050048828125, 0.02117919921875, 0.022308349609375, 0.0234375, 0.024566650390625, 0.02569580078125, 0.026824951171875, 0.0279541015625, 0.029083251953125, 0.03021240234375, 0.031341552734375, 0.032470703125, 0.033599853515625, 0.03472900390625, 0.035858154296875, 0.0369873046875, 0.038116455078125, 0.03924560546875, 0.040374755859375, 0.04150390625, 0.042633056640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 48.0, 196.0, 401.0, 278.0, 76.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022249564062803984, -0.0021471113432198763, -0.0020692660473287106, -0.0019914209842681885, -0.0019135759212076664, -0.0018357307417318225, -0.0017578855622559786, -0.0016800404991954565, -0.0016021953197196126, -0.0015243501402437687, -0.0014465050771832466, -0.0013686598977074027, -0.0012908147182315588, -0.0012129696551710367, -0.0011351244756951928, -0.001057279296219349, -0.0009794342331588268, -0.0009015891118906438, -0.0008237439906224608, -0.0007458988111466169, -0.0006680536898784339, -0.000590208568610251, -0.000512363389134407, -0.00043451826786622405, -0.00035667314659804106, -0.00027882802532985806, -0.00020098287495784461, -0.0001231377391377464, -4.529260331764817e-05, 3.255251795053482e-05, 0.00011039766832254827, 0.00018824281869456172, 0.00026608817279338837, 0.00034393329406157136, 0.0004217784444335848, 0.0004996235948055983, 0.0005774687160737813, 0.0006553138373419642, 0.0007331590168178082, 0.0008110041380859911, 0.0008888492593541741, 0.0009666943806223571, 0.0010445395018905401, 0.001122384681366384, 0.001200229860842228, 0.00127807492390275, 0.001355920103378594, 0.0014337652828544378, 0.00151161034591496, 0.0015894555253908038, 0.001667300588451326, 0.0017451457679271698, 0.0018229908309876919, 0.0019008360104635358, 0.0019786811899393797, 0.0020565262529999018, 0.0021343715488910675, 0.0022122166119515896, 0.0022900619078427553, 0.0023679069709032774, 0.0024457520339637995, 0.002523597329854965, 0.0026014423929154873, 0.0026792874559760094, 0.0027571325190365314]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 9.0, 10.0, 13.0, 15.0, 14.0, 10.0, 21.0, 27.0, 9.0, 35.0, 33.0, 34.0, 35.0, 41.0, 41.0, 37.0, 32.0, 38.0, 45.0, 40.0, 50.0, 44.0, 43.0, 46.0, 25.0, 27.0, 23.0, 34.0, 21.0, 31.0, 17.0, 25.0, 12.0, 8.0, 7.0, 8.0, 6.0, 10.0, 8.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000652313232421875, -0.000629751943051815, -0.0006071906536817551, -0.0005846293643116951, -0.0005620680749416351, -0.0005395067855715752, -0.0005169454962015152, -0.0004943842068314552, -0.00047182291746139526, -0.0004492616280913353, -0.00042670033872127533, -0.00040413904935121536, -0.0003815777599811554, -0.00035901647061109543, -0.00033645518124103546, -0.0003138938918709755, -0.00029133260250091553, -0.00026877131313085556, -0.0002462100237607956, -0.00022364873439073563, -0.00020108744502067566, -0.0001785261556506157, -0.00015596486628055573, -0.00013340357691049576, -0.00011084228754043579, -8.828099817037582e-05, -6.571970880031586e-05, -4.315841943025589e-05, -2.0597130060195923e-05, 1.964159309864044e-06, 2.452544867992401e-05, 4.708673804998398e-05, 6.964802742004395e-05, 9.220931679010391e-05, 0.00011477060616016388, 0.00013733189553022385, 0.0001598931849002838, 0.00018245447427034378, 0.00020501576364040375, 0.00022757705301046371, 0.0002501383423805237, 0.00027269963175058365, 0.0002952609211206436, 0.0003178222104907036, 0.00034038349986076355, 0.0003629447892308235, 0.0003855060786008835, 0.00040806736797094345, 0.0004306286573410034, 0.0004531899467110634, 0.00047575123608112335, 0.0004983125254511833, 0.0005208738148212433, 0.0005434351041913033, 0.0005659963935613632, 0.0005885576829314232, 0.0006111189723014832, 0.0006336802616715431, 0.0006562415510416031, 0.0006788028404116631, 0.000701364129781723, 0.000723925419151783, 0.000746486708521843, 0.0007690479978919029, 0.0007916092872619629]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 6.0, 8.0, 8.0, 11.0, 13.0, 15.0, 20.0, 11.0, 30.0, 23.0, 20.0, 33.0, 36.0, 52.0, 43.0, 28.0, 39.0, 43.0, 44.0, 56.0, 45.0, 39.0, 28.0, 49.0, 32.0, 32.0, 35.0, 33.0, 31.0, 20.0, 27.0, 24.0, 16.0, 14.0, 8.0, 5.0, 4.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.65380859375, -8.3388671875, -8.02392578125, -7.708984375, -7.39404296875, -7.0791015625, -6.76416015625, -6.44921875, -6.13427734375, -5.8193359375, -5.50439453125, -5.189453125, -4.87451171875, -4.5595703125, -4.24462890625, -3.9296875, -3.61474609375, -3.2998046875, -2.98486328125, -2.669921875, -2.35498046875, -2.0400390625, -1.72509765625, -1.41015625, -1.09521484375, -0.7802734375, -0.46533203125, -0.150390625, 0.16455078125, 0.4794921875, 0.79443359375, 1.109375, 1.42431640625, 1.7392578125, 2.05419921875, 2.369140625, 2.68408203125, 2.9990234375, 3.31396484375, 3.62890625, 3.94384765625, 4.2587890625, 4.57373046875, 4.888671875, 5.20361328125, 5.5185546875, 5.83349609375, 6.1484375, 6.46337890625, 6.7783203125, 7.09326171875, 7.408203125, 7.72314453125, 8.0380859375, 8.35302734375, 8.66796875, 8.98291015625, 9.2978515625, 9.61279296875, 9.927734375, 10.24267578125, 10.5576171875, 10.87255859375, 11.1875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 6.0, 14.0, 9.0, 14.0, 25.0, 33.0, 44.0, 54.0, 93.0, 126.0, 190.0, 190.0, 355.0, 521.0, 820.0, 1434.0, 3289.0, 7758.0, 21749.0, 70421.0, 271409.0, 466388.0, 140333.0, 39863.0, 12971.0, 5088.0, 2222.0, 1119.0, 630.0, 385.0, 301.0, 185.0, 152.0, 94.0, 75.0, 59.0, 38.0, 21.0, 27.0, 16.0, 16.0, 6.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.65625, -12.286865234375, -11.91748046875, -11.548095703125, -11.1787109375, -10.809326171875, -10.43994140625, -10.070556640625, -9.701171875, -9.331787109375, -8.96240234375, -8.593017578125, -8.2236328125, -7.854248046875, -7.48486328125, -7.115478515625, -6.74609375, -6.376708984375, -6.00732421875, -5.637939453125, -5.2685546875, -4.899169921875, -4.52978515625, -4.160400390625, -3.791015625, -3.421630859375, -3.05224609375, -2.682861328125, -2.3134765625, -1.944091796875, -1.57470703125, -1.205322265625, -0.8359375, -0.466552734375, -0.09716796875, 0.272216796875, 0.6416015625, 1.010986328125, 1.38037109375, 1.749755859375, 2.119140625, 2.488525390625, 2.85791015625, 3.227294921875, 3.5966796875, 3.966064453125, 4.33544921875, 4.704833984375, 5.07421875, 5.443603515625, 5.81298828125, 6.182373046875, 6.5517578125, 6.921142578125, 7.29052734375, 7.659912109375, 8.029296875, 8.398681640625, 8.76806640625, 9.137451171875, 9.5068359375, 9.876220703125, 10.24560546875, 10.614990234375, 10.984375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 14.0, 18.0, 18.0, 18.0, 20.0, 22.0, 35.0, 41.0, 42.0, 51.0, 52.0, 61.0, 95.0, 240.0, 1509.0, 259.0, 104.0, 66.0, 44.0, 42.0, 29.0, 47.0, 31.0, 30.0, 26.0, 16.0, 32.0, 15.0, 13.0, 11.0, 8.0, 5.0, 1.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.171875, -28.302490234375, -27.43310546875, -26.563720703125, -25.6943359375, -24.824951171875, -23.95556640625, -23.086181640625, -22.216796875, -21.347412109375, -20.47802734375, -19.608642578125, -18.7392578125, -17.869873046875, -17.00048828125, -16.131103515625, -15.26171875, -14.392333984375, -13.52294921875, -12.653564453125, -11.7841796875, -10.914794921875, -10.04541015625, -9.176025390625, -8.306640625, -7.437255859375, -6.56787109375, -5.698486328125, -4.8291015625, -3.959716796875, -3.09033203125, -2.220947265625, -1.3515625, -0.482177734375, 0.38720703125, 1.256591796875, 2.1259765625, 2.995361328125, 3.86474609375, 4.734130859375, 5.603515625, 6.472900390625, 7.34228515625, 8.211669921875, 9.0810546875, 9.950439453125, 10.81982421875, 11.689208984375, 12.55859375, 13.427978515625, 14.29736328125, 15.166748046875, 16.0361328125, 16.905517578125, 17.77490234375, 18.644287109375, 19.513671875, 20.383056640625, 21.25244140625, 22.121826171875, 22.9912109375, 23.860595703125, 24.72998046875, 25.599365234375, 26.46875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 8.0, 1.0, 7.0, 6.0, 9.0, 13.0, 7.0, 18.0, 14.0, 30.0, 35.0, 44.0, 70.0, 87.0, 102.0, 148.0, 197.0, 267.0, 456.0, 862.0, 4381.0, 122717.0, 2965029.0, 46489.0, 2643.0, 686.0, 403.0, 262.0, 167.0, 146.0, 101.0, 58.0, 51.0, 36.0, 31.0, 24.0, 20.0, 19.0, 16.0, 11.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-40.40625, -39.11865234375, -37.8310546875, -36.54345703125, -35.255859375, -33.96826171875, -32.6806640625, -31.39306640625, -30.10546875, -28.81787109375, -27.5302734375, -26.24267578125, -24.955078125, -23.66748046875, -22.3798828125, -21.09228515625, -19.8046875, -18.51708984375, -17.2294921875, -15.94189453125, -14.654296875, -13.36669921875, -12.0791015625, -10.79150390625, -9.50390625, -8.21630859375, -6.9287109375, -5.64111328125, -4.353515625, -3.06591796875, -1.7783203125, -0.49072265625, 0.796875, 2.08447265625, 3.3720703125, 4.65966796875, 5.947265625, 7.23486328125, 8.5224609375, 9.81005859375, 11.09765625, 12.38525390625, 13.6728515625, 14.96044921875, 16.248046875, 17.53564453125, 18.8232421875, 20.11083984375, 21.3984375, 22.68603515625, 23.9736328125, 25.26123046875, 26.548828125, 27.83642578125, 29.1240234375, 30.41162109375, 31.69921875, 32.98681640625, 34.2744140625, 35.56201171875, 36.849609375, 38.13720703125, 39.4248046875, 40.71240234375, 42.0]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 35.0, 564.0, 400.0, 15.0, 2.0, 0.0, 3.0], "bins": [-344.5450134277344, -338.6923828125, -332.8397521972656, -326.98712158203125, -321.1344909667969, -315.2818908691406, -309.42926025390625, -303.5766296386719, -297.7239990234375, -291.8713684082031, -286.01873779296875, -280.1661071777344, -274.3134765625, -268.46087646484375, -262.6082458496094, -256.755615234375, -250.90298461914062, -245.05035400390625, -239.19772338867188, -233.34510803222656, -227.4924774169922, -221.6398468017578, -215.78721618652344, -209.93460083007812, -204.0819549560547, -198.2293243408203, -192.37669372558594, -186.52407836914062, -180.67144775390625, -174.81881713867188, -168.9661865234375, -163.11355590820312, -157.26095581054688, -151.4083251953125, -145.55569458007812, -139.7030792236328, -133.85044860839844, -127.99781799316406, -122.14518737792969, -116.29256439208984, -110.43993377685547, -104.5873031616211, -98.73468017578125, -92.88204956054688, -87.02942657470703, -81.17679595947266, -75.32417297363281, -69.47154235839844, -63.61891174316406, -57.76628494262695, -51.913658142089844, -46.06102752685547, -40.208404541015625, -34.35577392578125, -28.50314712524414, -22.65052032470703, -16.797895431518555, -10.945268630981445, -5.0926408767700195, 0.7599868774414062, 6.612613677978516, 12.465240478515625, 18.317869186401367, 24.170495986938477, 30.023122787475586]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 4.0, 1.0, 12.0, 10.0, 11.0, 12.0, 15.0, 19.0, 21.0, 18.0, 28.0, 27.0, 27.0, 42.0, 38.0, 44.0, 50.0, 40.0, 51.0, 41.0, 42.0, 41.0, 47.0, 52.0, 40.0, 38.0, 35.0, 24.0, 32.0, 26.0, 20.0, 17.0, 19.0, 9.0, 8.0, 13.0, 7.0, 6.0, 7.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3016357421875, -63.2881965637207, -61.27476119995117, -59.261322021484375, -57.247886657714844, -55.23444747924805, -53.22100830078125, -51.20757293701172, -49.19413757324219, -47.18069839477539, -45.16726303100586, -43.15382385253906, -41.14038848876953, -39.126949310302734, -37.11351013183594, -35.100074768066406, -33.08663558959961, -31.073198318481445, -29.05976104736328, -27.046321868896484, -25.032886505126953, -23.019447326660156, -21.006010055541992, -18.992572784423828, -16.979135513305664, -14.9656982421875, -12.952260971069336, -10.938822746276855, -8.925385475158691, -6.911948204040527, -4.898509979248047, -2.885072708129883, -0.8716354370117188, 1.1418020725250244, 3.1552395820617676, 5.16867733001709, 7.182114601135254, 9.195551872253418, 11.208990097045898, 13.222427368164062, 15.235864639282227, 17.24930191040039, 19.262739181518555, 21.27617645263672, 23.289615631103516, 25.303050994873047, 27.316490173339844, 29.329927444458008, 31.343364715576172, 33.35680389404297, 35.3702392578125, 37.3836784362793, 39.39711380004883, 41.410552978515625, 43.423988342285156, 45.43742752075195, 47.45086669921875, 49.46430587768555, 51.47774124145508, 53.491180419921875, 55.504615783691406, 57.5180549621582, 59.531494140625, 61.54492950439453, 63.55836486816406]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 14.0, 9.0, 12.0, 13.0, 14.0, 23.0, 20.0, 34.0, 28.0, 33.0, 30.0, 27.0, 39.0, 59.0, 31.0, 43.0, 45.0, 49.0, 43.0, 40.0, 36.0, 38.0, 34.0, 34.0, 40.0, 26.0, 23.0, 25.0, 21.0, 17.0, 17.0, 16.0, 15.0, 12.0, 8.0, 5.0, 6.0, 3.0, 8.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.0447998046875, -7.730224609375, -7.4156494140625, -7.10107421875, -6.7864990234375, -6.471923828125, -6.1573486328125, -5.8427734375, -5.5281982421875, -5.213623046875, -4.8990478515625, -4.58447265625, -4.2698974609375, -3.955322265625, -3.6407470703125, -3.326171875, -3.0115966796875, -2.697021484375, -2.3824462890625, -2.06787109375, -1.7532958984375, -1.438720703125, -1.1241455078125, -0.8095703125, -0.4949951171875, -0.180419921875, 0.1341552734375, 0.44873046875, 0.7633056640625, 1.077880859375, 1.3924560546875, 1.70703125, 2.0216064453125, 2.336181640625, 2.6507568359375, 2.96533203125, 3.2799072265625, 3.594482421875, 3.9090576171875, 4.2236328125, 4.5382080078125, 4.852783203125, 5.1673583984375, 5.48193359375, 5.7965087890625, 6.111083984375, 6.4256591796875, 6.740234375, 7.0548095703125, 7.369384765625, 7.6839599609375, 7.99853515625, 8.3131103515625, 8.627685546875, 8.9422607421875, 9.2568359375, 9.5714111328125, 9.885986328125, 10.2005615234375, 10.51513671875, 10.8297119140625, 11.144287109375, 11.4588623046875, 11.7734375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 3.0, 10.0, 12.0, 19.0, 20.0, 26.0, 35.0, 38.0, 48.0, 79.0, 104.0, 140.0, 204.0, 273.0, 347.0, 523.0, 1554.0, 4187641.0, 1341.0, 482.0, 343.0, 268.0, 169.0, 158.0, 113.0, 70.0, 42.0, 35.0, 47.0, 24.0, 24.0, 13.0, 9.0, 9.0, 5.0, 17.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-260.0, -251.9921875, -243.984375, -235.9765625, -227.96875, -219.9609375, -211.953125, -203.9453125, -195.9375, -187.9296875, -179.921875, -171.9140625, -163.90625, -155.8984375, -147.890625, -139.8828125, -131.875, -123.8671875, -115.859375, -107.8515625, -99.84375, -91.8359375, -83.828125, -75.8203125, -67.8125, -59.8046875, -51.796875, -43.7890625, -35.78125, -27.7734375, -19.765625, -11.7578125, -3.75, 4.2578125, 12.265625, 20.2734375, 28.28125, 36.2890625, 44.296875, 52.3046875, 60.3125, 68.3203125, 76.328125, 84.3359375, 92.34375, 100.3515625, 108.359375, 116.3671875, 124.375, 132.3828125, 140.390625, 148.3984375, 156.40625, 164.4140625, 172.421875, 180.4296875, 188.4375, 196.4453125, 204.453125, 212.4609375, 220.46875, 228.4765625, 236.484375, 244.4921875, 252.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 8.0, 5.0, 10.0, 17.0, 23.0, 30.0, 41.0, 71.0, 131.0, 214.0, 318.0, 611.0, 869.0, 745.0, 408.0, 216.0, 132.0, 90.0, 42.0, 33.0, 20.0, 22.0, 10.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0, -27.275390625, -26.55078125, -25.826171875, -25.1015625, -24.376953125, -23.65234375, -22.927734375, -22.203125, -21.478515625, -20.75390625, -20.029296875, -19.3046875, -18.580078125, -17.85546875, -17.130859375, -16.40625, -15.681640625, -14.95703125, -14.232421875, -13.5078125, -12.783203125, -12.05859375, -11.333984375, -10.609375, -9.884765625, -9.16015625, -8.435546875, -7.7109375, -6.986328125, -6.26171875, -5.537109375, -4.8125, -4.087890625, -3.36328125, -2.638671875, -1.9140625, -1.189453125, -0.46484375, 0.259765625, 0.984375, 1.708984375, 2.43359375, 3.158203125, 3.8828125, 4.607421875, 5.33203125, 6.056640625, 6.78125, 7.505859375, 8.23046875, 8.955078125, 9.6796875, 10.404296875, 11.12890625, 11.853515625, 12.578125, 13.302734375, 14.02734375, 14.751953125, 15.4765625, 16.201171875, 16.92578125, 17.650390625, 18.375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 15.0, 6.0, 9.0, 12.0, 15.0, 25.0, 33.0, 31.0, 46.0, 54.0, 65.0, 95.0, 242.0, 1419.0, 4123106.0, 68066.0, 533.0, 129.0, 80.0, 48.0, 48.0, 37.0, 27.0, 24.0, 30.0, 21.0, 16.0, 8.0, 9.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.5, -156.0146484375, -151.529296875, -147.0439453125, -142.55859375, -138.0732421875, -133.587890625, -129.1025390625, -124.6171875, -120.1318359375, -115.646484375, -111.1611328125, -106.67578125, -102.1904296875, -97.705078125, -93.2197265625, -88.734375, -84.2490234375, -79.763671875, -75.2783203125, -70.79296875, -66.3076171875, -61.822265625, -57.3369140625, -52.8515625, -48.3662109375, -43.880859375, -39.3955078125, -34.91015625, -30.4248046875, -25.939453125, -21.4541015625, -16.96875, -12.4833984375, -7.998046875, -3.5126953125, 0.97265625, 5.4580078125, 9.943359375, 14.4287109375, 18.9140625, 23.3994140625, 27.884765625, 32.3701171875, 36.85546875, 41.3408203125, 45.826171875, 50.3115234375, 54.796875, 59.2822265625, 63.767578125, 68.2529296875, 72.73828125, 77.2236328125, 81.708984375, 86.1943359375, 90.6796875, 95.1650390625, 99.650390625, 104.1357421875, 108.62109375, 113.1064453125, 117.591796875, 122.0771484375, 126.5625]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 284.0, 712.0, 16.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.74394989013672, -53.90701675415039, -41.07008361816406, -28.233154296875, -15.396221160888672, -2.5592880249023438, 10.277641296386719, 23.114578247070312, 35.951507568359375, 48.7884407043457, 61.62537384033203, 74.4623031616211, 87.29924011230469, 100.13616943359375, 112.97309875488281, 125.8100357055664, 138.64697265625, 151.48390197753906, 164.32083129882812, 177.15777587890625, 189.9947052001953, 202.83163452148438, 215.66856384277344, 228.5054931640625, 241.34242248535156, 254.17935180664062, 267.01629638671875, 279.85321044921875, 292.6901550292969, 305.527099609375, 318.364013671875, 331.2009582519531, 344.0378723144531, 356.87481689453125, 369.71173095703125, 382.5486755371094, 395.3855895996094, 408.2225341796875, 421.0594482421875, 433.8963928222656, 446.73333740234375, 459.5702819824219, 472.4071960449219, 485.244140625, 498.0810546875, 510.9179992675781, 523.7549438476562, 536.5918579101562, 549.4287719726562, 562.2656860351562, 575.1026611328125, 587.9395751953125, 600.7764892578125, 613.6134033203125, 626.4503784179688, 639.2872924804688, 652.124267578125, 664.961181640625, 677.7981567382812, 690.6350708007812, 703.4719848632812, 716.3089599609375, 729.1458740234375, 741.9827880859375, 754.8197021484375]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 12.0, 13.0, 23.0, 23.0, 17.0, 23.0, 24.0, 36.0, 21.0, 38.0, 37.0, 47.0, 39.0, 49.0, 41.0, 38.0, 51.0, 45.0, 51.0, 33.0, 36.0, 37.0, 34.0, 35.0, 26.0, 24.0, 18.0, 20.0, 13.0, 18.0, 12.0, 12.0, 7.0, 5.0, 8.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.72625732421875, -47.906124114990234, -46.08599090576172, -44.2658576965332, -42.44572448730469, -40.625587463378906, -38.80545425415039, -36.985321044921875, -35.16518783569336, -33.345054626464844, -31.524921417236328, -29.70478630065918, -27.884653091430664, -26.06451988220215, -24.244384765625, -22.424251556396484, -20.60411834716797, -18.783985137939453, -16.963851928710938, -15.143716812133789, -13.323583602905273, -11.503450393676758, -9.683316230773926, -7.863182067871094, -6.043048858642578, -4.222915172576904, -2.4027814865112305, -0.5826478004455566, 1.2374858856201172, 3.057619094848633, 4.877753257751465, 6.697887420654297, 8.518020629882812, 10.338153839111328, 12.15828800201416, 13.978422164916992, 15.798555374145508, 17.618688583374023, 19.438823699951172, 21.258956909179688, 23.079090118408203, 24.89922332763672, 26.719356536865234, 28.539491653442383, 30.3596248626709, 32.17975616455078, 33.99989318847656, 35.82002639770508, 37.640159606933594, 39.46029281616211, 41.280426025390625, 43.10055923461914, 44.920692443847656, 46.74082946777344, 48.56096267700195, 50.38109588623047, 52.201229095458984, 54.0213623046875, 55.841495513916016, 57.66162872314453, 59.48176574707031, 61.30189514160156, 63.122032165527344, 64.94216918945312, 66.76229858398438]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 12.0, 13.0, 7.0, 21.0, 13.0, 21.0, 21.0, 22.0, 35.0, 28.0, 35.0, 38.0, 38.0, 33.0, 41.0, 54.0, 50.0, 39.0, 50.0, 40.0, 42.0, 35.0, 29.0, 33.0, 32.0, 37.0, 24.0, 25.0, 13.0, 12.0, 15.0, 14.0, 12.0, 8.0, 10.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7618408203125, -8.461181640625, -8.1605224609375, -7.85986328125, -7.5592041015625, -7.258544921875, -6.9578857421875, -6.6572265625, -6.3565673828125, -6.055908203125, -5.7552490234375, -5.45458984375, -5.1539306640625, -4.853271484375, -4.5526123046875, -4.251953125, -3.9512939453125, -3.650634765625, -3.3499755859375, -3.04931640625, -2.7486572265625, -2.447998046875, -2.1473388671875, -1.8466796875, -1.5460205078125, -1.245361328125, -0.9447021484375, -0.64404296875, -0.3433837890625, -0.042724609375, 0.2579345703125, 0.55859375, 0.8592529296875, 1.159912109375, 1.4605712890625, 1.76123046875, 2.0618896484375, 2.362548828125, 2.6632080078125, 2.9638671875, 3.2645263671875, 3.565185546875, 3.8658447265625, 4.16650390625, 4.4671630859375, 4.767822265625, 5.0684814453125, 5.369140625, 5.6697998046875, 5.970458984375, 6.2711181640625, 6.57177734375, 6.8724365234375, 7.173095703125, 7.4737548828125, 7.7744140625, 8.0750732421875, 8.375732421875, 8.6763916015625, 8.97705078125, 9.2777099609375, 9.578369140625, 9.8790283203125, 10.1796875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 13.0, 17.0, 22.0, 49.0, 54.0, 95.0, 137.0, 181.0, 305.0, 438.0, 696.0, 1060.0, 1528.0, 2389.0, 3706.0, 5570.0, 8496.0, 13269.0, 20466.0, 32945.0, 52916.0, 89555.0, 162895.0, 254775.0, 162549.0, 89635.0, 53135.0, 32971.0, 20665.0, 13253.0, 8520.0, 5595.0, 3679.0, 2376.0, 1586.0, 1048.0, 688.0, 422.0, 306.0, 169.0, 139.0, 83.0, 54.0, 32.0, 26.0, 15.0, 12.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.3955078125, -1.353851318359375, -1.31219482421875, -1.270538330078125, -1.2288818359375, -1.187225341796875, -1.14556884765625, -1.103912353515625, -1.062255859375, -1.020599365234375, -0.97894287109375, -0.937286376953125, -0.8956298828125, -0.853973388671875, -0.81231689453125, -0.770660400390625, -0.72900390625, -0.687347412109375, -0.64569091796875, -0.604034423828125, -0.5623779296875, -0.520721435546875, -0.47906494140625, -0.437408447265625, -0.395751953125, -0.354095458984375, -0.31243896484375, -0.270782470703125, -0.2291259765625, -0.187469482421875, -0.14581298828125, -0.104156494140625, -0.0625, -0.020843505859375, 0.02081298828125, 0.062469482421875, 0.1041259765625, 0.145782470703125, 0.18743896484375, 0.229095458984375, 0.270751953125, 0.312408447265625, 0.35406494140625, 0.395721435546875, 0.4373779296875, 0.479034423828125, 0.52069091796875, 0.562347412109375, 0.60400390625, 0.645660400390625, 0.68731689453125, 0.728973388671875, 0.7706298828125, 0.812286376953125, 0.85394287109375, 0.895599365234375, 0.937255859375, 0.978912353515625, 1.02056884765625, 1.062225341796875, 1.1038818359375, 1.145538330078125, 1.18719482421875, 1.228851318359375, 1.2705078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 0.0, 5.0, 10.0, 5.0, 4.0, 6.0, 12.0, 12.0, 9.0, 15.0, 11.0, 16.0, 16.0, 27.0, 32.0, 29.0, 45.0, 26.0, 33.0, 41.0, 35.0, 39.0, 40.0, 1067.0, 43.0, 37.0, 41.0, 43.0, 33.0, 32.0, 32.0, 22.0, 22.0, 27.0, 21.0, 19.0, 17.0, 22.0, 9.0, 21.0, 12.0, 11.0, 6.0, 4.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.15625, -5.98345947265625, -5.8106689453125, -5.63787841796875, -5.465087890625, -5.29229736328125, -5.1195068359375, -4.94671630859375, -4.77392578125, -4.60113525390625, -4.4283447265625, -4.25555419921875, -4.082763671875, -3.90997314453125, -3.7371826171875, -3.56439208984375, -3.3916015625, -3.21881103515625, -3.0460205078125, -2.87322998046875, -2.700439453125, -2.52764892578125, -2.3548583984375, -2.18206787109375, -2.00927734375, -1.83648681640625, -1.6636962890625, -1.49090576171875, -1.318115234375, -1.14532470703125, -0.9725341796875, -0.79974365234375, -0.626953125, -0.45416259765625, -0.2813720703125, -0.10858154296875, 0.064208984375, 0.23699951171875, 0.4097900390625, 0.58258056640625, 0.75537109375, 0.92816162109375, 1.1009521484375, 1.27374267578125, 1.446533203125, 1.61932373046875, 1.7921142578125, 1.96490478515625, 2.1376953125, 2.31048583984375, 2.4832763671875, 2.65606689453125, 2.828857421875, 3.00164794921875, 3.1744384765625, 3.34722900390625, 3.52001953125, 3.69281005859375, 3.8656005859375, 4.03839111328125, 4.211181640625, 4.38397216796875, 4.5567626953125, 4.72955322265625, 4.90234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 3.0, 5.0, 7.0, 11.0, 20.0, 28.0, 23.0, 52.0, 57.0, 58.0, 107.0, 155.0, 224.0, 308.0, 448.0, 596.0, 867.0, 1233.0, 1657.0, 2367.0, 3412.0, 5108.0, 7367.0, 10877.0, 16450.0, 25798.0, 40855.0, 66215.0, 112078.0, 196701.0, 1271213.0, 127038.0, 74986.0, 45535.0, 28668.0, 18202.0, 12021.0, 8211.0, 5692.0, 3760.0, 2639.0, 1825.0, 1252.0, 838.0, 616.0, 446.0, 324.0, 228.0, 168.0, 113.0, 68.0, 65.0, 30.0, 26.0, 26.0, 14.0, 11.0, 14.0, 9.0, 6.0, 8.0, 4.0, 4.0], "bins": [-1.1025390625, -1.067108154296875, -1.03167724609375, -0.996246337890625, -0.9608154296875, -0.925384521484375, -0.88995361328125, -0.854522705078125, -0.819091796875, -0.783660888671875, -0.74822998046875, -0.712799072265625, -0.6773681640625, -0.641937255859375, -0.60650634765625, -0.571075439453125, -0.53564453125, -0.500213623046875, -0.46478271484375, -0.429351806640625, -0.3939208984375, -0.358489990234375, -0.32305908203125, -0.287628173828125, -0.252197265625, -0.216766357421875, -0.18133544921875, -0.145904541015625, -0.1104736328125, -0.075042724609375, -0.03961181640625, -0.004180908203125, 0.03125, 0.066680908203125, 0.10211181640625, 0.137542724609375, 0.1729736328125, 0.208404541015625, 0.24383544921875, 0.279266357421875, 0.314697265625, 0.350128173828125, 0.38555908203125, 0.420989990234375, 0.4564208984375, 0.491851806640625, 0.52728271484375, 0.562713623046875, 0.59814453125, 0.633575439453125, 0.66900634765625, 0.704437255859375, 0.7398681640625, 0.775299072265625, 0.81072998046875, 0.846160888671875, 0.881591796875, 0.917022705078125, 0.95245361328125, 0.987884521484375, 1.0233154296875, 1.058746337890625, 1.09417724609375, 1.129608154296875, 1.1650390625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 1.0, 6.0, 11.0, 12.0, 6.0, 18.0, 14.0, 21.0, 17.0, 24.0, 28.0, 18.0, 29.0, 37.0, 53.0, 44.0, 52.0, 60.0, 62.0, 60.0, 45.0, 37.0, 60.0, 34.0, 27.0, 24.0, 23.0, 25.0, 23.0, 16.0, 17.0, 11.0, 13.0, 12.0, 10.0, 12.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0011568069458007812, -0.0011186301708221436, -0.0010804533958435059, -0.0010422766208648682, -0.0010040998458862305, -0.0009659230709075928, -0.0009277462959289551, -0.0008895695209503174, -0.0008513927459716797, -0.000813215970993042, -0.0007750391960144043, -0.0007368624210357666, -0.0006986856460571289, -0.0006605088710784912, -0.0006223320960998535, -0.0005841553211212158, -0.0005459785461425781, -0.0005078017711639404, -0.00046962499618530273, -0.00043144822120666504, -0.00039327144622802734, -0.00035509467124938965, -0.00031691789627075195, -0.00027874112129211426, -0.00024056434631347656, -0.00020238757133483887, -0.00016421079635620117, -0.00012603402137756348, -8.785724639892578e-05, -4.9680471420288086e-05, -1.150369644165039e-05, 2.6673078536987305e-05, 6.4849853515625e-05, 0.0001030266284942627, 0.0001412034034729004, 0.00017938017845153809, 0.00021755695343017578, 0.0002557337284088135, 0.00029391050338745117, 0.00033208727836608887, 0.00037026405334472656, 0.00040844082832336426, 0.00044661760330200195, 0.00048479437828063965, 0.0005229711532592773, 0.000561147928237915, 0.0005993247032165527, 0.0006375014781951904, 0.0006756782531738281, 0.0007138550281524658, 0.0007520318031311035, 0.0007902085781097412, 0.0008283853530883789, 0.0008665621280670166, 0.0009047389030456543, 0.000942915678024292, 0.0009810924530029297, 0.0010192692279815674, 0.001057446002960205, 0.0010956227779388428, 0.0011337995529174805, 0.0011719763278961182, 0.0012101531028747559, 0.0012483298778533936, 0.0012865066528320312]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 12.0, 13.0, 6.0, 23.0, 16.0, 24.0, 28.0, 36.0, 28.0, 56.0, 65.0, 70.0, 93.0, 135.0, 171.0, 285.0, 386.0, 717.0, 1728.0, 525917.0, 514719.0, 1688.0, 678.0, 430.0, 305.0, 205.0, 147.0, 103.0, 76.0, 77.0, 53.0, 42.0, 33.0, 32.0, 16.0, 24.0, 25.0, 12.0, 16.0, 8.0, 6.0, 7.0, 7.0, 5.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.023223876953125, -0.022540807723999023, -0.021857738494873047, -0.02117466926574707, -0.020491600036621094, -0.019808530807495117, -0.01912546157836914, -0.018442392349243164, -0.017759323120117188, -0.01707625389099121, -0.016393184661865234, -0.015710115432739258, -0.015027046203613281, -0.014343976974487305, -0.013660907745361328, -0.012977838516235352, -0.012294769287109375, -0.011611700057983398, -0.010928630828857422, -0.010245561599731445, -0.009562492370605469, -0.008879423141479492, -0.008196353912353516, -0.007513284683227539, -0.0068302154541015625, -0.006147146224975586, -0.005464076995849609, -0.004781007766723633, -0.004097938537597656, -0.0034148693084716797, -0.002731800079345703, -0.0020487308502197266, -0.00136566162109375, -0.0006825923919677734, 4.76837158203125e-07, 0.0006835460662841797, 0.0013666152954101562, 0.002049684524536133, 0.0027327537536621094, 0.003415822982788086, 0.0040988922119140625, 0.004781961441040039, 0.005465030670166016, 0.006148099899291992, 0.006831169128417969, 0.007514238357543945, 0.008197307586669922, 0.008880376815795898, 0.009563446044921875, 0.010246515274047852, 0.010929584503173828, 0.011612653732299805, 0.012295722961425781, 0.012978792190551758, 0.013661861419677734, 0.014344930648803711, 0.015027999877929688, 0.015711069107055664, 0.01639413833618164, 0.017077207565307617, 0.017760276794433594, 0.01844334602355957, 0.019126415252685547, 0.019809484481811523, 0.0204925537109375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 150.0, 644.0, 197.0, 15.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003165911417454481, -0.0030468497425317764, -0.0029277880676090717, -0.002808726392686367, -0.0026896647177636623, -0.0025706030428409576, -0.002451541367918253, -0.002332479925826192, -0.002213418250903487, -0.0020943565759807825, -0.001975294901058078, -0.0018562332261353731, -0.0017371716676279902, -0.0016181099927052855, -0.0014990483177825809, -0.001379986759275198, -0.0012609249679371715, -0.0011418632930144668, -0.001022801618091762, -0.0009037400013767183, -0.0007846783846616745, -0.0006656167097389698, -0.0005465550348162651, -0.0004274934181012213, -0.0003084317431785166, -0.00018937009735964239, -7.030843698885292e-05, 4.875322338193655e-05, 0.0001678148692008108, 0.00028687651501968503, 0.0004059381899423897, 0.0005249998066574335, 0.0006440614815801382, 0.0007631231565028429, 0.0008821847732178867, 0.0010012465063482523, 0.0011203080648556352, 0.0012393697397783399, 0.0013584314147010446, 0.0014774929732084274, 0.0015965546481311321, 0.0017156163230538368, 0.0018346779979765415, 0.001953739672899246, 0.002072801347821951, 0.0021918630227446556, 0.0023109246976673603, 0.0024299861397594213, 0.0025490480475127697, 0.0026681097224354744, 0.002787171397358179, 0.002906233072280884, 0.0030252947472035885, 0.003144356422126293, 0.003263418097048998, 0.003382479539141059, 0.0035015412140637636, 0.0036206028889864683, 0.003739664563909173, 0.0038587262388318777, 0.003977787680923939, 0.0040968493558466434, 0.004215911030769348, 0.004334972705692053, 0.0044540343806147575]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 5.0, 7.0, 8.0, 7.0, 12.0, 12.0, 18.0, 18.0, 22.0, 31.0, 27.0, 27.0, 40.0, 53.0, 37.0, 54.0, 43.0, 42.0, 40.0, 60.0, 53.0, 64.0, 43.0, 42.0, 43.0, 35.0, 33.0, 21.0, 20.0, 17.0, 14.0, 13.0, 8.0, 6.0, 10.0, 5.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009281039237976074, -0.0009013749659061432, -0.000874646008014679, -0.0008479170501232147, -0.0008211880922317505, -0.0007944591343402863, -0.000767730176448822, -0.0007410012185573578, -0.0007142722606658936, -0.0006875433027744293, -0.0006608143448829651, -0.0006340853869915009, -0.0006073564291000366, -0.0005806274712085724, -0.0005538985133171082, -0.0005271695554256439, -0.0005004405975341797, -0.00047371163964271545, -0.0004469826817512512, -0.000420253723859787, -0.00039352476596832275, -0.0003667958080768585, -0.0003400668501853943, -0.00031333789229393005, -0.0002866089344024658, -0.0002598799765110016, -0.00023315101861953735, -0.00020642206072807312, -0.0001796931028366089, -0.00015296414494514465, -0.00012623518705368042, -9.950622916221619e-05, -7.277727127075195e-05, -4.604831337928772e-05, -1.9319355487823486e-05, 7.409602403640747e-06, 3.413856029510498e-05, 6.0867518186569214e-05, 8.759647607803345e-05, 0.00011432543396949768, 0.00014105439186096191, 0.00016778334975242615, 0.00019451230764389038, 0.00022124126553535461, 0.00024797022342681885, 0.0002746991813182831, 0.0003014281392097473, 0.00032815709710121155, 0.0003548860549926758, 0.00038161501288414, 0.00040834397077560425, 0.0004350729286670685, 0.0004618018865585327, 0.000488530844449997, 0.0005152598023414612, 0.0005419887602329254, 0.0005687177181243896, 0.0005954466760158539, 0.0006221756339073181, 0.0006489045917987823, 0.0006756335496902466, 0.0007023625075817108, 0.000729091465473175, 0.0007558204233646393, 0.0007825493812561035]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 9.0, 12.0, 13.0, 7.0, 21.0, 13.0, 21.0, 21.0, 22.0, 35.0, 28.0, 35.0, 38.0, 38.0, 33.0, 41.0, 54.0, 50.0, 39.0, 50.0, 40.0, 42.0, 35.0, 29.0, 33.0, 32.0, 37.0, 24.0, 25.0, 13.0, 12.0, 15.0, 14.0, 12.0, 8.0, 10.0, 7.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0625, -8.7618408203125, -8.461181640625, -8.1605224609375, -7.85986328125, -7.5592041015625, -7.258544921875, -6.9578857421875, -6.6572265625, -6.3565673828125, -6.055908203125, -5.7552490234375, -5.45458984375, -5.1539306640625, -4.853271484375, -4.5526123046875, -4.251953125, -3.9512939453125, -3.650634765625, -3.3499755859375, -3.04931640625, -2.7486572265625, -2.447998046875, -2.1473388671875, -1.8466796875, -1.5460205078125, -1.245361328125, -0.9447021484375, -0.64404296875, -0.3433837890625, -0.042724609375, 0.2579345703125, 0.55859375, 0.8592529296875, 1.159912109375, 1.4605712890625, 1.76123046875, 2.0618896484375, 2.362548828125, 2.6632080078125, 2.9638671875, 3.2645263671875, 3.565185546875, 3.8658447265625, 4.16650390625, 4.4671630859375, 4.767822265625, 5.0684814453125, 5.369140625, 5.6697998046875, 5.970458984375, 6.2711181640625, 6.57177734375, 6.8724365234375, 7.173095703125, 7.4737548828125, 7.7744140625, 8.0750732421875, 8.375732421875, 8.6763916015625, 8.97705078125, 9.2777099609375, 9.578369140625, 9.8790283203125, 10.1796875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 20.0, 16.0, 21.0, 34.0, 55.0, 74.0, 92.0, 112.0, 150.0, 201.0, 249.0, 343.0, 419.0, 504.0, 652.0, 848.0, 1175.0, 2001.0, 4526.0, 17861.0, 99802.0, 488423.0, 347669.0, 61693.0, 11800.0, 3402.0, 1708.0, 1110.0, 831.0, 621.0, 485.0, 373.0, 290.0, 226.0, 183.0, 143.0, 110.0, 82.0, 55.0, 48.0, 32.0, 24.0, 22.0, 17.0, 10.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.7265625, -14.264404296875, -13.80224609375, -13.340087890625, -12.8779296875, -12.415771484375, -11.95361328125, -11.491455078125, -11.029296875, -10.567138671875, -10.10498046875, -9.642822265625, -9.1806640625, -8.718505859375, -8.25634765625, -7.794189453125, -7.33203125, -6.869873046875, -6.40771484375, -5.945556640625, -5.4833984375, -5.021240234375, -4.55908203125, -4.096923828125, -3.634765625, -3.172607421875, -2.71044921875, -2.248291015625, -1.7861328125, -1.323974609375, -0.86181640625, -0.399658203125, 0.0625, 0.524658203125, 0.98681640625, 1.448974609375, 1.9111328125, 2.373291015625, 2.83544921875, 3.297607421875, 3.759765625, 4.221923828125, 4.68408203125, 5.146240234375, 5.6083984375, 6.070556640625, 6.53271484375, 6.994873046875, 7.45703125, 7.919189453125, 8.38134765625, 8.843505859375, 9.3056640625, 9.767822265625, 10.22998046875, 10.692138671875, 11.154296875, 11.616455078125, 12.07861328125, 12.540771484375, 13.0029296875, 13.465087890625, 13.92724609375, 14.389404296875, 14.8515625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 9.0, 11.0, 16.0, 10.0, 18.0, 15.0, 29.0, 37.0, 35.0, 31.0, 28.0, 46.0, 48.0, 62.0, 108.0, 248.0, 1552.0, 241.0, 89.0, 50.0, 55.0, 40.0, 35.0, 36.0, 27.0, 23.0, 20.0, 19.0, 19.0, 14.0, 12.0, 9.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.58544921875, -21.7646484375, -20.94384765625, -20.123046875, -19.30224609375, -18.4814453125, -17.66064453125, -16.83984375, -16.01904296875, -15.1982421875, -14.37744140625, -13.556640625, -12.73583984375, -11.9150390625, -11.09423828125, -10.2734375, -9.45263671875, -8.6318359375, -7.81103515625, -6.990234375, -6.16943359375, -5.3486328125, -4.52783203125, -3.70703125, -2.88623046875, -2.0654296875, -1.24462890625, -0.423828125, 0.39697265625, 1.2177734375, 2.03857421875, 2.859375, 3.68017578125, 4.5009765625, 5.32177734375, 6.142578125, 6.96337890625, 7.7841796875, 8.60498046875, 9.42578125, 10.24658203125, 11.0673828125, 11.88818359375, 12.708984375, 13.52978515625, 14.3505859375, 15.17138671875, 15.9921875, 16.81298828125, 17.6337890625, 18.45458984375, 19.275390625, 20.09619140625, 20.9169921875, 21.73779296875, 22.55859375, 23.37939453125, 24.2001953125, 25.02099609375, 25.841796875, 26.66259765625, 27.4833984375, 28.30419921875, 29.125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 11.0, 6.0, 8.0, 18.0, 19.0, 18.0, 31.0, 45.0, 46.0, 44.0, 84.0, 135.0, 199.0, 332.0, 688.0, 2140.0, 2874876.0, 263693.0, 1670.0, 672.0, 314.0, 183.0, 129.0, 95.0, 58.0, 45.0, 40.0, 32.0, 16.0, 15.0, 12.0, 9.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.125, -66.45703125, -63.7890625, -61.12109375, -58.453125, -55.78515625, -53.1171875, -50.44921875, -47.78125, -45.11328125, -42.4453125, -39.77734375, -37.109375, -34.44140625, -31.7734375, -29.10546875, -26.4375, -23.76953125, -21.1015625, -18.43359375, -15.765625, -13.09765625, -10.4296875, -7.76171875, -5.09375, -2.42578125, 0.2421875, 2.91015625, 5.578125, 8.24609375, 10.9140625, 13.58203125, 16.25, 18.91796875, 21.5859375, 24.25390625, 26.921875, 29.58984375, 32.2578125, 34.92578125, 37.59375, 40.26171875, 42.9296875, 45.59765625, 48.265625, 50.93359375, 53.6015625, 56.26953125, 58.9375, 61.60546875, 64.2734375, 66.94140625, 69.609375, 72.27734375, 74.9453125, 77.61328125, 80.28125, 82.94921875, 85.6171875, 88.28515625, 90.953125, 93.62109375, 96.2890625, 98.95703125, 101.625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 16.0, 669.0, 325.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.07740783691406, -142.48468017578125, -132.89195251464844, -123.29922485351562, -113.70649719238281, -104.11376953125, -94.52104949951172, -84.9283218383789, -75.3355941772461, -65.74286651611328, -56.15013885498047, -46.55741500854492, -36.96468734741211, -27.371959686279297, -17.77923583984375, -8.186508178710938, 1.406219482421875, 10.998946189880371, 20.591672897338867, 30.184398651123047, 39.77712631225586, 49.36985397338867, 58.96257781982422, 68.55530548095703, 78.14803314208984, 87.74076080322266, 97.33348846435547, 106.92620849609375, 116.51893615722656, 126.11166381835938, 135.7043914794922, 145.297119140625, 154.88986206054688, 164.4825897216797, 174.0753173828125, 183.6680450439453, 193.26077270507812, 202.85350036621094, 212.44622802734375, 222.0389404296875, 231.63168334960938, 241.2244110107422, 250.817138671875, 260.40985107421875, 270.0025939941406, 279.5953063964844, 289.18804931640625, 298.78076171875, 308.37347412109375, 317.9661865234375, 327.5589294433594, 337.1516418457031, 346.744384765625, 356.33709716796875, 365.9298400878906, 375.5225524902344, 385.11529541015625, 394.7080078125, 404.3007507324219, 413.8934631347656, 423.4862060546875, 433.07891845703125, 442.6716613769531, 452.2643737792969, 461.85711669921875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 4.0, 9.0, 9.0, 9.0, 14.0, 14.0, 11.0, 15.0, 30.0, 26.0, 22.0, 36.0, 22.0, 35.0, 24.0, 36.0, 36.0, 38.0, 41.0, 30.0, 37.0, 42.0, 56.0, 52.0, 29.0, 35.0, 29.0, 26.0, 33.0, 33.0, 16.0, 19.0, 16.0, 18.0, 19.0, 11.0, 8.0, 8.0, 11.0, 4.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-59.838531494140625, -57.937252044677734, -56.03597640991211, -54.13469696044922, -52.23341751098633, -50.3321418762207, -48.43086242675781, -46.52958679199219, -44.6283073425293, -42.727027893066406, -40.82575225830078, -38.92447280883789, -37.023193359375, -35.121917724609375, -33.220638275146484, -31.319360733032227, -29.418081283569336, -27.516803741455078, -25.615524291992188, -23.71424674987793, -21.812969207763672, -19.91168975830078, -18.010412216186523, -16.109134674072266, -14.207856178283691, -12.306577682495117, -10.40530014038086, -8.504021644592285, -6.602743625640869, -4.701465606689453, -2.800187110900879, -0.8989095687866211, 1.0023689270019531, 2.903646945953369, 4.804924964904785, 6.706203460693359, 8.607481002807617, 10.508759498596191, 12.410037994384766, 14.311315536499023, 16.21259307861328, 18.11387062072754, 20.01515007019043, 21.916427612304688, 23.817705154418945, 25.718982696533203, 27.620262145996094, 29.52153968811035, 31.422819137573242, 33.3240966796875, 35.22537612915039, 37.12665557861328, 39.027931213378906, 40.9292106628418, 42.83049011230469, 44.73176574707031, 46.6330451965332, 48.534324645996094, 50.43560028076172, 52.33687973022461, 54.2381591796875, 56.139434814453125, 58.040714263916016, 59.941993713378906, 61.84326934814453]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 8.0, 9.0, 12.0, 13.0, 9.0, 18.0, 20.0, 18.0, 18.0, 21.0, 25.0, 30.0, 28.0, 35.0, 40.0, 40.0, 41.0, 30.0, 39.0, 35.0, 46.0, 45.0, 35.0, 37.0, 39.0, 35.0, 28.0, 34.0, 22.0, 23.0, 28.0, 23.0, 20.0, 9.0, 11.0, 11.0, 10.0, 10.0, 8.0, 3.0, 8.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.15576171875, -7.8818359375, -7.60791015625, -7.333984375, -7.06005859375, -6.7861328125, -6.51220703125, -6.23828125, -5.96435546875, -5.6904296875, -5.41650390625, -5.142578125, -4.86865234375, -4.5947265625, -4.32080078125, -4.046875, -3.77294921875, -3.4990234375, -3.22509765625, -2.951171875, -2.67724609375, -2.4033203125, -2.12939453125, -1.85546875, -1.58154296875, -1.3076171875, -1.03369140625, -0.759765625, -0.48583984375, -0.2119140625, 0.06201171875, 0.3359375, 0.60986328125, 0.8837890625, 1.15771484375, 1.431640625, 1.70556640625, 1.9794921875, 2.25341796875, 2.52734375, 2.80126953125, 3.0751953125, 3.34912109375, 3.623046875, 3.89697265625, 4.1708984375, 4.44482421875, 4.71875, 4.99267578125, 5.2666015625, 5.54052734375, 5.814453125, 6.08837890625, 6.3623046875, 6.63623046875, 6.91015625, 7.18408203125, 7.4580078125, 7.73193359375, 8.005859375, 8.27978515625, 8.5537109375, 8.82763671875, 9.1015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 8.0, 16.0, 10.0, 20.0, 28.0, 29.0, 48.0, 55.0, 74.0, 88.0, 108.0, 138.0, 205.0, 377.0, 964.0, 4506.0, 67149.0, 2527883.0, 1554991.0, 32531.0, 3193.0, 736.0, 297.0, 173.0, 149.0, 98.0, 84.0, 66.0, 47.0, 45.0, 41.0, 22.0, 30.0, 20.0, 17.0, 13.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-38.28125, -37.271240234375, -36.26123046875, -35.251220703125, -34.2412109375, -33.231201171875, -32.22119140625, -31.211181640625, -30.201171875, -29.191162109375, -28.18115234375, -27.171142578125, -26.1611328125, -25.151123046875, -24.14111328125, -23.131103515625, -22.12109375, -21.111083984375, -20.10107421875, -19.091064453125, -18.0810546875, -17.071044921875, -16.06103515625, -15.051025390625, -14.041015625, -13.031005859375, -12.02099609375, -11.010986328125, -10.0009765625, -8.990966796875, -7.98095703125, -6.970947265625, -5.9609375, -4.950927734375, -3.94091796875, -2.930908203125, -1.9208984375, -0.910888671875, 0.09912109375, 1.109130859375, 2.119140625, 3.129150390625, 4.13916015625, 5.149169921875, 6.1591796875, 7.169189453125, 8.17919921875, 9.189208984375, 10.19921875, 11.209228515625, 12.21923828125, 13.229248046875, 14.2392578125, 15.249267578125, 16.25927734375, 17.269287109375, 18.279296875, 19.289306640625, 20.29931640625, 21.309326171875, 22.3193359375, 23.329345703125, 24.33935546875, 25.349365234375, 26.359375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 7.0, 14.0, 27.0, 31.0, 36.0, 59.0, 64.0, 98.0, 148.0, 183.0, 230.0, 349.0, 494.0, 598.0, 536.0, 330.0, 226.0, 169.0, 108.0, 107.0, 59.0, 61.0, 33.0, 23.0, 19.0, 21.0, 13.0, 8.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4609375, -14.8780517578125, -14.295166015625, -13.7122802734375, -13.12939453125, -12.5465087890625, -11.963623046875, -11.3807373046875, -10.7978515625, -10.2149658203125, -9.632080078125, -9.0491943359375, -8.46630859375, -7.8834228515625, -7.300537109375, -6.7176513671875, -6.134765625, -5.5518798828125, -4.968994140625, -4.3861083984375, -3.80322265625, -3.2203369140625, -2.637451171875, -2.0545654296875, -1.4716796875, -0.8887939453125, -0.305908203125, 0.2769775390625, 0.85986328125, 1.4427490234375, 2.025634765625, 2.6085205078125, 3.19140625, 3.7742919921875, 4.357177734375, 4.9400634765625, 5.52294921875, 6.1058349609375, 6.688720703125, 7.2716064453125, 7.8544921875, 8.4373779296875, 9.020263671875, 9.6031494140625, 10.18603515625, 10.7689208984375, 11.351806640625, 11.9346923828125, 12.517578125, 13.1004638671875, 13.683349609375, 14.2662353515625, 14.84912109375, 15.4320068359375, 16.014892578125, 16.5977783203125, 17.1806640625, 17.7635498046875, 18.346435546875, 18.9293212890625, 19.51220703125, 20.0950927734375, 20.677978515625, 21.2608642578125, 21.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 20.0, 26.0, 78.0, 206.0, 646.0, 3477.0, 3307994.0, 878259.0, 2616.0, 539.0, 205.0, 83.0, 57.0, 24.0, 8.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-116.25, -113.1025390625, -109.955078125, -106.8076171875, -103.66015625, -100.5126953125, -97.365234375, -94.2177734375, -91.0703125, -87.9228515625, -84.775390625, -81.6279296875, -78.48046875, -75.3330078125, -72.185546875, -69.0380859375, -65.890625, -62.7431640625, -59.595703125, -56.4482421875, -53.30078125, -50.1533203125, -47.005859375, -43.8583984375, -40.7109375, -37.5634765625, -34.416015625, -31.2685546875, -28.12109375, -24.9736328125, -21.826171875, -18.6787109375, -15.53125, -12.3837890625, -9.236328125, -6.0888671875, -2.94140625, 0.2060546875, 3.353515625, 6.5009765625, 9.6484375, 12.7958984375, 15.943359375, 19.0908203125, 22.23828125, 25.3857421875, 28.533203125, 31.6806640625, 34.828125, 37.9755859375, 41.123046875, 44.2705078125, 47.41796875, 50.5654296875, 53.712890625, 56.8603515625, 60.0078125, 63.1552734375, 66.302734375, 69.4501953125, 72.59765625, 75.7451171875, 78.892578125, 82.0400390625, 85.1875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 668.0, 342.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.57977294921875, -272.93023681640625, -242.28067016601562, -211.63111877441406, -180.9815673828125, -150.33201599121094, -119.68246459960938, -89.03291320800781, -58.38336181640625, -27.733810424804688, 2.915740966796875, 33.56529235839844, 64.21484375, 94.86439514160156, 125.51394653320312, 156.1634979248047, 186.81304931640625, 217.4626007080078, 248.11215209960938, 278.76171875, 309.4112548828125, 340.060791015625, 370.7103576660156, 401.35992431640625, 432.00946044921875, 462.65899658203125, 493.3085632324219, 523.9581298828125, 554.607666015625, 585.2572021484375, 615.90673828125, 646.5563354492188, 677.205810546875, 707.8553466796875, 738.5048828125, 769.1544799804688, 799.8040161132812, 830.4535522460938, 861.1031494140625, 891.752685546875, 922.4022216796875, 953.0517578125, 983.7012939453125, 1014.3508911132812, 1045.00048828125, 1075.6500244140625, 1106.299560546875, 1136.9490966796875, 1167.5986328125, 1198.2481689453125, 1228.897705078125, 1259.5472412109375, 1290.19677734375, 1320.846435546875, 1351.4959716796875, 1382.1455078125, 1412.7950439453125, 1443.444580078125, 1474.0941162109375, 1504.74365234375, 1535.393310546875, 1566.0428466796875, 1596.6923828125, 1627.3419189453125, 1657.991455078125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 13.0, 9.0, 12.0, 16.0, 19.0, 22.0, 23.0, 37.0, 36.0, 45.0, 58.0, 47.0, 66.0, 46.0, 55.0, 66.0, 71.0, 67.0, 56.0, 35.0, 39.0, 23.0, 32.0, 28.0, 24.0, 19.0, 14.0, 13.0, 6.0, 9.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-110.69964599609375, -107.9478530883789, -105.19606018066406, -102.44426727294922, -99.69247436523438, -96.94068145751953, -94.18888854980469, -91.43710327148438, -88.685302734375, -85.93350982666016, -83.18171691894531, -80.42992401123047, -77.67813110351562, -74.92633819580078, -72.17454528808594, -69.42276000976562, -66.67096710205078, -63.91917419433594, -61.167381286621094, -58.41558837890625, -55.663795471191406, -52.91200256347656, -50.160213470458984, -47.40842056274414, -44.6566276550293, -41.90483474731445, -39.15304183959961, -36.40125274658203, -33.64945983886719, -30.89766502380371, -28.1458740234375, -25.394081115722656, -22.642288208007812, -19.89049530029297, -17.138702392578125, -14.386911392211914, -11.63511848449707, -8.883325576782227, -6.131534576416016, -3.379741668701172, -0.6279487609863281, 2.1238436698913574, 4.875636100769043, 7.62742805480957, 10.379220962524414, 13.131013870239258, 15.882804870605469, 18.634597778320312, 21.386390686035156, 24.13818359375, 26.889976501464844, 29.641767501831055, 32.39356231689453, 35.145355224609375, 37.89714431762695, 40.6489372253418, 43.40073013305664, 46.152523040771484, 48.90431594848633, 51.656105041503906, 54.40789794921875, 57.159690856933594, 59.91148376464844, 62.66327667236328, 65.41506958007812]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 13.0, 14.0, 14.0, 26.0, 19.0, 27.0, 30.0, 31.0, 30.0, 43.0, 41.0, 35.0, 45.0, 48.0, 44.0, 35.0, 45.0, 51.0, 39.0, 38.0, 35.0, 39.0, 36.0, 36.0, 28.0, 16.0, 22.0, 20.0, 15.0, 11.0, 14.0, 4.0, 6.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4954833984375, -8.240966796875, -7.9864501953125, -7.73193359375, -7.4774169921875, -7.222900390625, -6.9683837890625, -6.7138671875, -6.4593505859375, -6.204833984375, -5.9503173828125, -5.69580078125, -5.4412841796875, -5.186767578125, -4.9322509765625, -4.677734375, -4.4232177734375, -4.168701171875, -3.9141845703125, -3.65966796875, -3.4051513671875, -3.150634765625, -2.8961181640625, -2.6416015625, -2.3870849609375, -2.132568359375, -1.8780517578125, -1.62353515625, -1.3690185546875, -1.114501953125, -0.8599853515625, -0.60546875, -0.3509521484375, -0.096435546875, 0.1580810546875, 0.41259765625, 0.6671142578125, 0.921630859375, 1.1761474609375, 1.4306640625, 1.6851806640625, 1.939697265625, 2.1942138671875, 2.44873046875, 2.7032470703125, 2.957763671875, 3.2122802734375, 3.466796875, 3.7213134765625, 3.975830078125, 4.2303466796875, 4.48486328125, 4.7393798828125, 4.993896484375, 5.2484130859375, 5.5029296875, 5.7574462890625, 6.011962890625, 6.2664794921875, 6.52099609375, 6.7755126953125, 7.030029296875, 7.2845458984375, 7.5390625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 11.0, 19.0, 20.0, 33.0, 44.0, 88.0, 100.0, 165.0, 258.0, 373.0, 583.0, 808.0, 1341.0, 1960.0, 3249.0, 5064.0, 8103.0, 13139.0, 21121.0, 34820.0, 58454.0, 102688.0, 187299.0, 249305.0, 150503.0, 83523.0, 48597.0, 29219.0, 17842.0, 10823.0, 6740.0, 4406.0, 2785.0, 1763.0, 1126.0, 770.0, 464.0, 315.0, 221.0, 117.0, 99.0, 63.0, 40.0, 27.0, 22.0, 11.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1025390625, -1.0661773681640625, -1.029815673828125, -0.9934539794921875, -0.95709228515625, -0.9207305908203125, -0.884368896484375, -0.8480072021484375, -0.8116455078125, -0.7752838134765625, -0.738922119140625, -0.7025604248046875, -0.66619873046875, -0.6298370361328125, -0.593475341796875, -0.5571136474609375, -0.520751953125, -0.4843902587890625, -0.448028564453125, -0.4116668701171875, -0.37530517578125, -0.3389434814453125, -0.302581787109375, -0.2662200927734375, -0.2298583984375, -0.1934967041015625, -0.157135009765625, -0.1207733154296875, -0.08441162109375, -0.0480499267578125, -0.011688232421875, 0.0246734619140625, 0.06103515625, 0.0973968505859375, 0.133758544921875, 0.1701202392578125, 0.20648193359375, 0.2428436279296875, 0.279205322265625, 0.3155670166015625, 0.3519287109375, 0.3882904052734375, 0.424652099609375, 0.4610137939453125, 0.49737548828125, 0.5337371826171875, 0.570098876953125, 0.6064605712890625, 0.642822265625, 0.6791839599609375, 0.715545654296875, 0.7519073486328125, 0.78826904296875, 0.8246307373046875, 0.860992431640625, 0.8973541259765625, 0.9337158203125, 0.9700775146484375, 1.006439208984375, 1.0428009033203125, 1.07916259765625, 1.1155242919921875, 1.151885986328125, 1.1882476806640625, 1.224609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 1.0, 7.0, 12.0, 10.0, 4.0, 13.0, 15.0, 15.0, 24.0, 16.0, 27.0, 24.0, 30.0, 21.0, 37.0, 35.0, 45.0, 30.0, 31.0, 41.0, 1062.0, 36.0, 32.0, 55.0, 49.0, 37.0, 38.0, 26.0, 33.0, 39.0, 20.0, 35.0, 24.0, 17.0, 14.0, 17.0, 8.0, 6.0, 12.0, 5.0, 4.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.769287109375, -4.62060546875, -4.471923828125, -4.3232421875, -4.174560546875, -4.02587890625, -3.877197265625, -3.728515625, -3.579833984375, -3.43115234375, -3.282470703125, -3.1337890625, -2.985107421875, -2.83642578125, -2.687744140625, -2.5390625, -2.390380859375, -2.24169921875, -2.093017578125, -1.9443359375, -1.795654296875, -1.64697265625, -1.498291015625, -1.349609375, -1.200927734375, -1.05224609375, -0.903564453125, -0.7548828125, -0.606201171875, -0.45751953125, -0.308837890625, -0.16015625, -0.011474609375, 0.13720703125, 0.285888671875, 0.4345703125, 0.583251953125, 0.73193359375, 0.880615234375, 1.029296875, 1.177978515625, 1.32666015625, 1.475341796875, 1.6240234375, 1.772705078125, 1.92138671875, 2.070068359375, 2.21875, 2.367431640625, 2.51611328125, 2.664794921875, 2.8134765625, 2.962158203125, 3.11083984375, 3.259521484375, 3.408203125, 3.556884765625, 3.70556640625, 3.854248046875, 4.0029296875, 4.151611328125, 4.30029296875, 4.448974609375, 4.59765625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 6.0, 10.0, 11.0, 16.0, 20.0, 36.0, 58.0, 70.0, 101.0, 122.0, 197.0, 258.0, 417.0, 546.0, 757.0, 1161.0, 1653.0, 2376.0, 3331.0, 4937.0, 7096.0, 10737.0, 16291.0, 25485.0, 40160.0, 65370.0, 107687.0, 176560.0, 1261117.0, 138937.0, 84845.0, 51343.0, 32533.0, 20592.0, 13621.0, 9115.0, 6109.0, 4192.0, 2830.0, 1928.0, 1303.0, 953.0, 646.0, 501.0, 327.0, 235.0, 165.0, 116.0, 85.0, 66.0, 36.0, 25.0, 19.0, 12.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0], "bins": [-0.9267578125, -0.8980331420898438, -0.8693084716796875, -0.8405838012695312, -0.811859130859375, -0.7831344604492188, -0.7544097900390625, -0.7256851196289062, -0.69696044921875, -0.6682357788085938, -0.6395111083984375, -0.6107864379882812, -0.582061767578125, -0.5533370971679688, -0.5246124267578125, -0.49588775634765625, -0.4671630859375, -0.43843841552734375, -0.4097137451171875, -0.38098907470703125, -0.352264404296875, -0.32353973388671875, -0.2948150634765625, -0.26609039306640625, -0.23736572265625, -0.20864105224609375, -0.1799163818359375, -0.15119171142578125, -0.122467041015625, -0.09374237060546875, -0.0650177001953125, -0.03629302978515625, -0.007568359375, 0.02115631103515625, 0.0498809814453125, 0.07860565185546875, 0.107330322265625, 0.13605499267578125, 0.1647796630859375, 0.19350433349609375, 0.22222900390625, 0.25095367431640625, 0.2796783447265625, 0.30840301513671875, 0.337127685546875, 0.36585235595703125, 0.3945770263671875, 0.42330169677734375, 0.4520263671875, 0.48075103759765625, 0.5094757080078125, 0.5382003784179688, 0.566925048828125, 0.5956497192382812, 0.6243743896484375, 0.6530990600585938, 0.68182373046875, 0.7105484008789062, 0.7392730712890625, 0.7679977416992188, 0.796722412109375, 0.8254470825195312, 0.8541717529296875, 0.8828964233398438, 0.91162109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 8.0, 4.0, 10.0, 12.0, 10.0, 11.0, 13.0, 12.0, 16.0, 20.0, 23.0, 27.0, 33.0, 35.0, 40.0, 46.0, 51.0, 50.0, 60.0, 58.0, 51.0, 48.0, 44.0, 37.0, 24.0, 26.0, 35.0, 31.0, 21.0, 19.0, 23.0, 16.0, 14.0, 10.0, 13.0, 7.0, 5.0, 9.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0010328292846679688, -0.0010015815496444702, -0.0009703338146209717, -0.0009390860795974731, -0.0009078383445739746, -0.0008765906095504761, -0.0008453428745269775, -0.000814095139503479, -0.0007828474044799805, -0.0007515996694564819, -0.0007203519344329834, -0.0006891041994094849, -0.0006578564643859863, -0.0006266087293624878, -0.0005953609943389893, -0.0005641132593154907, -0.0005328655242919922, -0.0005016177892684937, -0.0004703700542449951, -0.0004391223192214966, -0.00040787458419799805, -0.0003766268491744995, -0.000345379114151001, -0.00031413137912750244, -0.0002828836441040039, -0.00025163590908050537, -0.00022038817405700684, -0.0001891404390335083, -0.00015789270401000977, -0.00012664496898651123, -9.53972339630127e-05, -6.414949893951416e-05, -3.2901763916015625e-05, -1.6540288925170898e-06, 2.9593706130981445e-05, 6.084144115447998e-05, 9.208917617797852e-05, 0.00012333691120147705, 0.00015458464622497559, 0.00018583238124847412, 0.00021708011627197266, 0.0002483278512954712, 0.0002795755863189697, 0.00031082332134246826, 0.0003420710563659668, 0.00037331879138946533, 0.00040456652641296387, 0.0004358142614364624, 0.00046706199645996094, 0.0004983097314834595, 0.000529557466506958, 0.0005608052015304565, 0.0005920529365539551, 0.0006233006715774536, 0.0006545484066009521, 0.0006857961416244507, 0.0007170438766479492, 0.0007482916116714478, 0.0007795393466949463, 0.0008107870817184448, 0.0008420348167419434, 0.0008732825517654419, 0.0009045302867889404, 0.000935778021812439, 0.0009670257568359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 5.0, 9.0, 14.0, 22.0, 20.0, 23.0, 32.0, 54.0, 61.0, 68.0, 113.0, 120.0, 160.0, 256.0, 337.0, 640.0, 1477.0, 653700.0, 388176.0, 1372.0, 575.0, 350.0, 238.0, 172.0, 131.0, 88.0, 53.0, 55.0, 43.0, 34.0, 24.0, 24.0, 29.0, 12.0, 8.0, 14.0, 9.0, 4.0, 5.0, 4.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0212860107421875, -0.020598649978637695, -0.01991128921508789, -0.019223928451538086, -0.01853656768798828, -0.017849206924438477, -0.017161846160888672, -0.016474485397338867, -0.015787124633789062, -0.015099763870239258, -0.014412403106689453, -0.013725042343139648, -0.013037681579589844, -0.012350320816040039, -0.011662960052490234, -0.01097559928894043, -0.010288238525390625, -0.00960087776184082, -0.008913516998291016, -0.008226156234741211, -0.007538795471191406, -0.0068514347076416016, -0.006164073944091797, -0.005476713180541992, -0.0047893524169921875, -0.004101991653442383, -0.003414630889892578, -0.0027272701263427734, -0.0020399093627929688, -0.001352548599243164, -0.0006651878356933594, 2.2172927856445312e-05, 0.00070953369140625, 0.0013968944549560547, 0.0020842552185058594, 0.002771615982055664, 0.0034589767456054688, 0.0041463375091552734, 0.004833698272705078, 0.005521059036254883, 0.0062084197998046875, 0.006895780563354492, 0.007583141326904297, 0.008270502090454102, 0.008957862854003906, 0.009645223617553711, 0.010332584381103516, 0.01101994514465332, 0.011707305908203125, 0.01239466667175293, 0.013082027435302734, 0.013769388198852539, 0.014456748962402344, 0.015144109725952148, 0.015831470489501953, 0.016518831253051758, 0.017206192016601562, 0.017893552780151367, 0.018580913543701172, 0.019268274307250977, 0.01995563507080078, 0.020642995834350586, 0.02133035659790039, 0.022017717361450195, 0.022705078125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 58.0, 642.0, 288.0, 18.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002762339310720563, -0.002640713471919298, -0.002519087865948677, -0.0023974620271474123, -0.0022758361883461475, -0.0021542105823755264, -0.0020325847435742617, -0.001910958904772997, -0.001789333182387054, -0.001667707460001111, -0.0015460816211998463, -0.0014244558988139033, -0.0013028301764279604, -0.0011812043376266956, -0.0010595786152407527, -0.0009379528346471488, -0.000816327054053545, -0.0006947012734599411, -0.0005730754928663373, -0.00045144977048039436, -0.0003298239898867905, -0.00020819820929318666, -8.657248690724373e-05, 3.505329368636012e-05, 0.00015667907427996397, 0.0002783048548735678, 0.0003999306063633412, 0.0005215563578531146, 0.0006431821384467185, 0.0007648079190403223, 0.0008864336414262652, 0.0010080593638122082, 0.0011296849697828293, 0.0012513106921687722, 0.001372936530970037, 0.00149456225335598, 0.0016161880921572447, 0.0017378138145431876, 0.0018594395369291306, 0.0019810653757303953, 0.00210269121453166, 0.002224317053332925, 0.002345942659303546, 0.0024675684981048107, 0.0025891943369060755, 0.0027108201757073402, 0.0028324457816779613, 0.002954071620479226, 0.0030756972264498472, 0.003197323065251112, 0.003318948671221733, 0.003440574510022998, 0.0035622003488242626, 0.0036838259547948837, 0.0038054517935961485, 0.003927077632397413, 0.004048703238368034, 0.0041703288443386555, 0.004291954915970564, 0.004413580521941185, 0.004535206127911806, 0.0046568321995437145, 0.004778457805514336, 0.004900083411484957, 0.005021709483116865]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 10.0, 12.0, 15.0, 17.0, 15.0, 11.0, 18.0, 21.0, 15.0, 26.0, 22.0, 21.0, 32.0, 36.0, 38.0, 30.0, 47.0, 45.0, 45.0, 37.0, 42.0, 43.0, 47.0, 53.0, 37.0, 35.0, 34.0, 27.0, 26.0, 28.0, 22.0, 22.0, 18.0, 16.0, 7.0, 6.0, 4.0, 8.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006539821624755859, -0.0006332891061902046, -0.0006125960499048233, -0.000591902993619442, -0.0005712099373340607, -0.0005505168810486794, -0.000529823824763298, -0.0005091307684779167, -0.0004884377121925354, -0.0004677446559071541, -0.00044705159962177277, -0.00042635854333639145, -0.00040566548705101013, -0.0003849724307656288, -0.0003642793744802475, -0.0003435863181948662, -0.00032289326190948486, -0.00030220020562410355, -0.00028150714933872223, -0.0002608140930533409, -0.0002401210367679596, -0.00021942798048257828, -0.00019873492419719696, -0.00017804186791181564, -0.00015734881162643433, -0.000136655755341053, -0.00011596269905567169, -9.526964277029037e-05, -7.457658648490906e-05, -5.388353019952774e-05, -3.319047391414642e-05, -1.2497417628765106e-05, 8.195638656616211e-06, 2.8888694941997528e-05, 4.9581751227378845e-05, 7.027480751276016e-05, 9.096786379814148e-05, 0.0001116609200835228, 0.00013235397636890411, 0.00015304703265428543, 0.00017374008893966675, 0.00019443314522504807, 0.00021512620151042938, 0.0002358192577958107, 0.000256512314081192, 0.00027720537036657333, 0.00029789842665195465, 0.00031859148293733597, 0.0003392845392227173, 0.0003599775955080986, 0.0003806706517934799, 0.00040136370807886124, 0.00042205676436424255, 0.00044274982064962387, 0.0004634428769350052, 0.0004841359332203865, 0.0005048289895057678, 0.0005255220457911491, 0.0005462151020765305, 0.0005669081583619118, 0.0005876012146472931, 0.0006082942709326744, 0.0006289873272180557, 0.000649680383503437, 0.0006703734397888184]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 13.0, 14.0, 15.0, 25.0, 19.0, 27.0, 30.0, 31.0, 30.0, 43.0, 41.0, 35.0, 45.0, 48.0, 44.0, 35.0, 45.0, 51.0, 39.0, 38.0, 35.0, 39.0, 36.0, 36.0, 28.0, 16.0, 22.0, 20.0, 15.0, 11.0, 14.0, 4.0, 6.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4954833984375, -8.240966796875, -7.9864501953125, -7.73193359375, -7.4774169921875, -7.222900390625, -6.9683837890625, -6.7138671875, -6.4593505859375, -6.204833984375, -5.9503173828125, -5.69580078125, -5.4412841796875, -5.186767578125, -4.9322509765625, -4.677734375, -4.4232177734375, -4.168701171875, -3.9141845703125, -3.65966796875, -3.4051513671875, -3.150634765625, -2.8961181640625, -2.6416015625, -2.3870849609375, -2.132568359375, -1.8780517578125, -1.62353515625, -1.3690185546875, -1.114501953125, -0.8599853515625, -0.60546875, -0.3509521484375, -0.096435546875, 0.1580810546875, 0.41259765625, 0.6671142578125, 0.921630859375, 1.1761474609375, 1.4306640625, 1.6851806640625, 1.939697265625, 2.1942138671875, 2.44873046875, 2.7032470703125, 2.957763671875, 3.2122802734375, 3.466796875, 3.7213134765625, 3.975830078125, 4.2303466796875, 4.48486328125, 4.7393798828125, 4.993896484375, 5.2484130859375, 5.5029296875, 5.7574462890625, 6.011962890625, 6.2664794921875, 6.52099609375, 6.7755126953125, 7.030029296875, 7.2845458984375, 7.5390625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 10.0, 13.0, 15.0, 23.0, 30.0, 43.0, 81.0, 103.0, 130.0, 194.0, 289.0, 403.0, 601.0, 898.0, 1398.0, 2201.0, 4000.0, 12355.0, 110721.0, 759753.0, 130607.0, 13802.0, 4245.0, 2198.0, 1489.0, 943.0, 611.0, 431.0, 297.0, 186.0, 145.0, 97.0, 61.0, 45.0, 40.0, 22.0, 17.0, 8.0, 15.0, 11.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.296875, -19.632080078125, -18.96728515625, -18.302490234375, -17.6376953125, -16.972900390625, -16.30810546875, -15.643310546875, -14.978515625, -14.313720703125, -13.64892578125, -12.984130859375, -12.3193359375, -11.654541015625, -10.98974609375, -10.324951171875, -9.66015625, -8.995361328125, -8.33056640625, -7.665771484375, -7.0009765625, -6.336181640625, -5.67138671875, -5.006591796875, -4.341796875, -3.677001953125, -3.01220703125, -2.347412109375, -1.6826171875, -1.017822265625, -0.35302734375, 0.311767578125, 0.9765625, 1.641357421875, 2.30615234375, 2.970947265625, 3.6357421875, 4.300537109375, 4.96533203125, 5.630126953125, 6.294921875, 6.959716796875, 7.62451171875, 8.289306640625, 8.9541015625, 9.618896484375, 10.28369140625, 10.948486328125, 11.61328125, 12.278076171875, 12.94287109375, 13.607666015625, 14.2724609375, 14.937255859375, 15.60205078125, 16.266845703125, 16.931640625, 17.596435546875, 18.26123046875, 18.926025390625, 19.5908203125, 20.255615234375, 20.92041015625, 21.585205078125, 22.25]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 12.0, 7.0, 13.0, 17.0, 15.0, 22.0, 19.0, 30.0, 41.0, 56.0, 55.0, 49.0, 56.0, 159.0, 1562.0, 363.0, 141.0, 57.0, 51.0, 45.0, 26.0, 30.0, 36.0, 18.0, 16.0, 30.0, 23.0, 10.0, 10.0, 7.0, 5.0, 8.0, 5.0, 7.0, 1.0, 1.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.96875, -22.270751953125, -21.57275390625, -20.874755859375, -20.1767578125, -19.478759765625, -18.78076171875, -18.082763671875, -17.384765625, -16.686767578125, -15.98876953125, -15.290771484375, -14.5927734375, -13.894775390625, -13.19677734375, -12.498779296875, -11.80078125, -11.102783203125, -10.40478515625, -9.706787109375, -9.0087890625, -8.310791015625, -7.61279296875, -6.914794921875, -6.216796875, -5.518798828125, -4.82080078125, -4.122802734375, -3.4248046875, -2.726806640625, -2.02880859375, -1.330810546875, -0.6328125, 0.065185546875, 0.76318359375, 1.461181640625, 2.1591796875, 2.857177734375, 3.55517578125, 4.253173828125, 4.951171875, 5.649169921875, 6.34716796875, 7.045166015625, 7.7431640625, 8.441162109375, 9.13916015625, 9.837158203125, 10.53515625, 11.233154296875, 11.93115234375, 12.629150390625, 13.3271484375, 14.025146484375, 14.72314453125, 15.421142578125, 16.119140625, 16.817138671875, 17.51513671875, 18.213134765625, 18.9111328125, 19.609130859375, 20.30712890625, 21.005126953125, 21.703125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 9.0, 5.0, 19.0, 21.0, 27.0, 47.0, 41.0, 47.0, 64.0, 90.0, 128.0, 178.0, 291.0, 650.0, 1815.0, 516496.0, 2621798.0, 2150.0, 718.0, 355.0, 193.0, 130.0, 96.0, 72.0, 64.0, 37.0, 28.0, 20.0, 23.0, 14.0, 19.0, 7.0, 11.0, 7.0, 3.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.46875, -61.42431640625, -59.3798828125, -57.33544921875, -55.291015625, -53.24658203125, -51.2021484375, -49.15771484375, -47.11328125, -45.06884765625, -43.0244140625, -40.97998046875, -38.935546875, -36.89111328125, -34.8466796875, -32.80224609375, -30.7578125, -28.71337890625, -26.6689453125, -24.62451171875, -22.580078125, -20.53564453125, -18.4912109375, -16.44677734375, -14.40234375, -12.35791015625, -10.3134765625, -8.26904296875, -6.224609375, -4.18017578125, -2.1357421875, -0.09130859375, 1.953125, 3.99755859375, 6.0419921875, 8.08642578125, 10.130859375, 12.17529296875, 14.2197265625, 16.26416015625, 18.30859375, 20.35302734375, 22.3974609375, 24.44189453125, 26.486328125, 28.53076171875, 30.5751953125, 32.61962890625, 34.6640625, 36.70849609375, 38.7529296875, 40.79736328125, 42.841796875, 44.88623046875, 46.9306640625, 48.97509765625, 51.01953125, 53.06396484375, 55.1083984375, 57.15283203125, 59.197265625, 61.24169921875, 63.2861328125, 65.33056640625, 67.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 34.0, 366.0, 523.0, 84.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.62710571289062, -93.45428466796875, -87.28146362304688, -81.108642578125, -74.93582153320312, -68.76300048828125, -62.59018325805664, -56.417362213134766, -50.24454116821289, -44.071720123291016, -37.89889907836914, -31.7260799407959, -25.553258895874023, -19.38043785095215, -13.207618713378906, -7.034797668457031, -0.8619766235351562, 5.3108439445495605, 11.483664512634277, 17.656484603881836, 23.82930564880371, 30.002126693725586, 36.17494583129883, 42.3477668762207, 48.52058792114258, 54.69340896606445, 60.86623001098633, 67.03904724121094, 73.21186828613281, 79.38468933105469, 85.55751037597656, 91.73033142089844, 97.90315246582031, 104.07597351074219, 110.24879455566406, 116.42161560058594, 122.59443664550781, 128.7672576904297, 134.94007873535156, 141.11289978027344, 147.2857208251953, 153.4585418701172, 159.63136291503906, 165.80418395996094, 171.9770050048828, 178.1498260498047, 184.32264709472656, 190.49546813964844, 196.66827392578125, 202.84109497070312, 209.013916015625, 215.18673706054688, 221.35955810546875, 227.53237915039062, 233.7052001953125, 239.87802124023438, 246.05084228515625, 252.22366333007812, 258.396484375, 264.5693054199219, 270.74212646484375, 276.9149475097656, 283.0877685546875, 289.2605895996094, 295.43341064453125]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 11.0, 12.0, 8.0, 14.0, 14.0, 14.0, 12.0, 20.0, 28.0, 39.0, 17.0, 37.0, 40.0, 37.0, 34.0, 55.0, 41.0, 52.0, 55.0, 39.0, 54.0, 50.0, 44.0, 37.0, 40.0, 16.0, 35.0, 19.0, 32.0, 14.0, 15.0, 14.0, 13.0, 5.0, 14.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.06529235839844, -62.96030044555664, -60.85531234741211, -58.75032043457031, -56.645328521728516, -54.54033660888672, -52.43534851074219, -50.33035659790039, -48.225364685058594, -46.1203727722168, -44.015384674072266, -41.91039276123047, -39.80540084838867, -37.700408935546875, -35.595420837402344, -33.49042892456055, -31.385440826416016, -29.28045082092285, -27.175458908081055, -25.07046890258789, -22.965476989746094, -20.86048698425293, -18.755496978759766, -16.65050506591797, -14.545515060424805, -12.440524101257324, -10.335533142089844, -8.23054313659668, -6.125552177429199, -4.020561218261719, -1.9155712127685547, 0.18941974639892578, 2.2944107055664062, 4.399401664733887, 6.504392147064209, 8.609382629394531, 10.714373588562012, 12.819364547729492, 14.924354553222656, 17.029346466064453, 19.134336471557617, 21.23932647705078, 23.344318389892578, 25.449308395385742, 27.554298400878906, 29.659290313720703, 31.764280319213867, 33.86927032470703, 35.97426223754883, 38.079254150390625, 40.184242248535156, 42.28923416137695, 44.39422607421875, 46.49921417236328, 48.60420608520508, 50.709197998046875, 52.814186096191406, 54.9191780090332, 57.024166107177734, 59.12915802001953, 61.23414993286133, 63.339141845703125, 65.44412994384766, 67.54911804199219, 69.65411376953125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 10.0, 8.0, 12.0, 14.0, 14.0, 10.0, 18.0, 19.0, 28.0, 23.0, 26.0, 32.0, 34.0, 34.0, 32.0, 41.0, 34.0, 41.0, 41.0, 35.0, 36.0, 43.0, 45.0, 33.0, 30.0, 46.0, 25.0, 34.0, 24.0, 20.0, 18.0, 20.0, 10.0, 16.0, 15.0, 12.0, 11.0, 7.0, 5.0, 3.0, 5.0, 5.0, 8.0, 6.0, 5.0, 2.0, 1.0], "bins": [-8.484375, -8.2501220703125, -8.015869140625, -7.7816162109375, -7.54736328125, -7.3131103515625, -7.078857421875, -6.8446044921875, -6.6103515625, -6.3760986328125, -6.141845703125, -5.9075927734375, -5.67333984375, -5.4390869140625, -5.204833984375, -4.9705810546875, -4.736328125, -4.5020751953125, -4.267822265625, -4.0335693359375, -3.79931640625, -3.5650634765625, -3.330810546875, -3.0965576171875, -2.8623046875, -2.6280517578125, -2.393798828125, -2.1595458984375, -1.92529296875, -1.6910400390625, -1.456787109375, -1.2225341796875, -0.98828125, -0.7540283203125, -0.519775390625, -0.2855224609375, -0.05126953125, 0.1829833984375, 0.417236328125, 0.6514892578125, 0.8857421875, 1.1199951171875, 1.354248046875, 1.5885009765625, 1.82275390625, 2.0570068359375, 2.291259765625, 2.5255126953125, 2.759765625, 2.9940185546875, 3.228271484375, 3.4625244140625, 3.69677734375, 3.9310302734375, 4.165283203125, 4.3995361328125, 4.6337890625, 4.8680419921875, 5.102294921875, 5.3365478515625, 5.57080078125, 5.8050537109375, 6.039306640625, 6.2735595703125, 6.5078125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 7.0, 12.0, 12.0, 20.0, 22.0, 38.0, 54.0, 61.0, 93.0, 133.0, 181.0, 306.0, 501.0, 863.0, 1887.0, 4248.0, 11589.0, 40002.0, 264477.0, 1571574.0, 1878758.0, 345978.0, 50843.0, 13293.0, 4724.0, 2102.0, 980.0, 533.0, 303.0, 208.0, 134.0, 106.0, 62.0, 46.0, 32.0, 32.0, 21.0, 22.0, 14.0, 9.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.56787109375, -12.1201171875, -11.67236328125, -11.224609375, -10.77685546875, -10.3291015625, -9.88134765625, -9.43359375, -8.98583984375, -8.5380859375, -8.09033203125, -7.642578125, -7.19482421875, -6.7470703125, -6.29931640625, -5.8515625, -5.40380859375, -4.9560546875, -4.50830078125, -4.060546875, -3.61279296875, -3.1650390625, -2.71728515625, -2.26953125, -1.82177734375, -1.3740234375, -0.92626953125, -0.478515625, -0.03076171875, 0.4169921875, 0.86474609375, 1.3125, 1.76025390625, 2.2080078125, 2.65576171875, 3.103515625, 3.55126953125, 3.9990234375, 4.44677734375, 4.89453125, 5.34228515625, 5.7900390625, 6.23779296875, 6.685546875, 7.13330078125, 7.5810546875, 8.02880859375, 8.4765625, 8.92431640625, 9.3720703125, 9.81982421875, 10.267578125, 10.71533203125, 11.1630859375, 11.61083984375, 12.05859375, 12.50634765625, 12.9541015625, 13.40185546875, 13.849609375, 14.29736328125, 14.7451171875, 15.19287109375, 15.640625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 0.0, 4.0, 7.0, 17.0, 23.0, 25.0, 45.0, 90.0, 147.0, 228.0, 392.0, 597.0, 863.0, 630.0, 405.0, 262.0, 140.0, 83.0, 38.0, 28.0, 12.0, 9.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.90625, -20.145263671875, -19.38427734375, -18.623291015625, -17.8623046875, -17.101318359375, -16.34033203125, -15.579345703125, -14.818359375, -14.057373046875, -13.29638671875, -12.535400390625, -11.7744140625, -11.013427734375, -10.25244140625, -9.491455078125, -8.73046875, -7.969482421875, -7.20849609375, -6.447509765625, -5.6865234375, -4.925537109375, -4.16455078125, -3.403564453125, -2.642578125, -1.881591796875, -1.12060546875, -0.359619140625, 0.4013671875, 1.162353515625, 1.92333984375, 2.684326171875, 3.4453125, 4.206298828125, 4.96728515625, 5.728271484375, 6.4892578125, 7.250244140625, 8.01123046875, 8.772216796875, 9.533203125, 10.294189453125, 11.05517578125, 11.816162109375, 12.5771484375, 13.338134765625, 14.09912109375, 14.860107421875, 15.62109375, 16.382080078125, 17.14306640625, 17.904052734375, 18.6650390625, 19.426025390625, 20.18701171875, 20.947998046875, 21.708984375, 22.469970703125, 23.23095703125, 23.991943359375, 24.7529296875, 25.513916015625, 26.27490234375, 27.035888671875, 27.796875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 5.0, 17.0, 10.0, 21.0, 39.0, 78.0, 140.0, 300.0, 827.0, 2836.0, 251292.0, 3931760.0, 4918.0, 1110.0, 422.0, 200.0, 108.0, 61.0, 45.0, 28.0, 13.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-76.375, -74.0, -71.625, -69.25, -66.875, -64.5, -62.125, -59.75, -57.375, -55.0, -52.625, -50.25, -47.875, -45.5, -43.125, -40.75, -38.375, -36.0, -33.625, -31.25, -28.875, -26.5, -24.125, -21.75, -19.375, -17.0, -14.625, -12.25, -9.875, -7.5, -5.125, -2.75, -0.375, 2.0, 4.375, 6.75, 9.125, 11.5, 13.875, 16.25, 18.625, 21.0, 23.375, 25.75, 28.125, 30.5, 32.875, 35.25, 37.625, 40.0, 42.375, 44.75, 47.125, 49.5, 51.875, 54.25, 56.625, 59.0, 61.375, 63.75, 66.125, 68.5, 70.875, 73.25, 75.625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 77.0, 885.0, 51.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.1205825805664, -69.49803161621094, -53.875484466552734, -38.25293731689453, -22.630386352539062, -7.007835388183594, 8.614707946777344, 24.237258911132812, 39.85980987548828, 55.48236083984375, 71.10490417480469, 86.72745513916016, 102.35000610351562, 117.9725570678711, 133.5950927734375, 149.2176513671875, 164.8402099609375, 180.46275329589844, 196.08531188964844, 211.70785522460938, 227.33041381835938, 242.9529571533203, 258.57550048828125, 274.19805908203125, 289.8205871582031, 305.4431457519531, 321.065673828125, 336.688232421875, 352.310791015625, 367.933349609375, 383.5558776855469, 399.1784362792969, 414.80096435546875, 430.42352294921875, 446.0460510253906, 461.6686096191406, 477.2911682128906, 492.9136962890625, 508.5362548828125, 524.1588134765625, 539.7813720703125, 555.4039306640625, 571.0264892578125, 586.6490478515625, 602.2715454101562, 617.8941040039062, 633.5166625976562, 649.1392211914062, 664.76171875, 680.38427734375, 696.0068359375, 711.62939453125, 727.2518920898438, 742.8744506835938, 758.4970092773438, 774.1195678710938, 789.7421264648438, 805.3646850585938, 820.9872436523438, 836.6097412109375, 852.2322998046875, 867.8548583984375, 883.4774169921875, 899.0999755859375, 914.7225341796875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 7.0, 5.0, 12.0, 8.0, 20.0, 15.0, 11.0, 21.0, 22.0, 26.0, 20.0, 37.0, 40.0, 41.0, 27.0, 53.0, 50.0, 43.0, 55.0, 42.0, 33.0, 49.0, 50.0, 37.0, 40.0, 27.0, 34.0, 24.0, 19.0, 23.0, 25.0, 12.0, 21.0, 11.0, 7.0, 13.0, 6.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.96221923828125, -56.095001220703125, -54.227783203125, -52.36056137084961, -50.493343353271484, -48.62612533569336, -46.75890350341797, -44.891685485839844, -43.02446746826172, -41.157249450683594, -39.29003143310547, -37.42280960083008, -35.55559158325195, -33.68837356567383, -31.82115364074707, -29.953933715820312, -28.086715698242188, -26.219497680664062, -24.352277755737305, -22.485057830810547, -20.617839813232422, -18.750621795654297, -16.88340187072754, -15.016182899475098, -13.148963928222656, -11.281744956970215, -9.414525985717773, -7.547307014465332, -5.680088043212891, -3.812869071960449, -1.9456501007080078, -0.0784311294555664, 1.788787841796875, 3.6560068130493164, 5.523225784301758, 7.390444755554199, 9.25766372680664, 11.124882698059082, 12.992101669311523, 14.859320640563965, 16.726539611816406, 18.59375762939453, 20.46097755432129, 22.328197479248047, 24.195415496826172, 26.062633514404297, 27.929853439331055, 29.797073364257812, 31.664291381835938, 33.53150939941406, 35.39872741699219, 37.26594924926758, 39.1331672668457, 41.00038528442383, 42.86760711669922, 44.734825134277344, 46.60204315185547, 48.469261169433594, 50.33647918701172, 52.20370101928711, 54.070919036865234, 55.93813705444336, 57.80535888671875, 59.672576904296875, 61.539794921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 8.0, 13.0, 14.0, 17.0, 19.0, 21.0, 16.0, 14.0, 26.0, 13.0, 25.0, 25.0, 24.0, 31.0, 22.0, 20.0, 29.0, 43.0, 31.0, 38.0, 40.0, 36.0, 35.0, 39.0, 35.0, 23.0, 35.0, 27.0, 26.0, 28.0, 25.0, 18.0, 23.0, 18.0, 20.0, 16.0, 12.0, 13.0, 5.0, 11.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 5.0], "bins": [-6.10546875, -5.9195556640625, -5.733642578125, -5.5477294921875, -5.36181640625, -5.1759033203125, -4.989990234375, -4.8040771484375, -4.6181640625, -4.4322509765625, -4.246337890625, -4.0604248046875, -3.87451171875, -3.6885986328125, -3.502685546875, -3.3167724609375, -3.130859375, -2.9449462890625, -2.759033203125, -2.5731201171875, -2.38720703125, -2.2012939453125, -2.015380859375, -1.8294677734375, -1.6435546875, -1.4576416015625, -1.271728515625, -1.0858154296875, -0.89990234375, -0.7139892578125, -0.528076171875, -0.3421630859375, -0.15625, 0.0296630859375, 0.215576171875, 0.4014892578125, 0.58740234375, 0.7733154296875, 0.959228515625, 1.1451416015625, 1.3310546875, 1.5169677734375, 1.702880859375, 1.8887939453125, 2.07470703125, 2.2606201171875, 2.446533203125, 2.6324462890625, 2.818359375, 3.0042724609375, 3.190185546875, 3.3760986328125, 3.56201171875, 3.7479248046875, 3.933837890625, 4.1197509765625, 4.3056640625, 4.4915771484375, 4.677490234375, 4.8634033203125, 5.04931640625, 5.2352294921875, 5.421142578125, 5.6070556640625, 5.79296875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 18.0, 21.0, 12.0, 40.0, 53.0, 84.0, 115.0, 215.0, 297.0, 449.0, 693.0, 1066.0, 1654.0, 2498.0, 3929.0, 6152.0, 9275.0, 14446.0, 22511.0, 35509.0, 58748.0, 99349.0, 182089.0, 248958.0, 145517.0, 81376.0, 48844.0, 30150.0, 19361.0, 12351.0, 7914.0, 5230.0, 3399.0, 2188.0, 1380.0, 876.0, 599.0, 416.0, 246.0, 175.0, 96.0, 67.0, 53.0, 37.0, 29.0, 18.0, 11.0, 8.0, 5.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-1.0146484375, -0.9822540283203125, -0.949859619140625, -0.9174652099609375, -0.88507080078125, -0.8526763916015625, -0.820281982421875, -0.7878875732421875, -0.7554931640625, -0.7230987548828125, -0.690704345703125, -0.6583099365234375, -0.62591552734375, -0.5935211181640625, -0.561126708984375, -0.5287322998046875, -0.496337890625, -0.4639434814453125, -0.431549072265625, -0.3991546630859375, -0.36676025390625, -0.3343658447265625, -0.301971435546875, -0.2695770263671875, -0.2371826171875, -0.2047882080078125, -0.172393798828125, -0.1399993896484375, -0.10760498046875, -0.0752105712890625, -0.042816162109375, -0.0104217529296875, 0.02197265625, 0.0543670654296875, 0.086761474609375, 0.1191558837890625, 0.15155029296875, 0.1839447021484375, 0.216339111328125, 0.2487335205078125, 0.2811279296875, 0.3135223388671875, 0.345916748046875, 0.3783111572265625, 0.41070556640625, 0.4430999755859375, 0.475494384765625, 0.5078887939453125, 0.540283203125, 0.5726776123046875, 0.605072021484375, 0.6374664306640625, 0.66986083984375, 0.7022552490234375, 0.734649658203125, 0.7670440673828125, 0.7994384765625, 0.8318328857421875, 0.864227294921875, 0.8966217041015625, 0.92901611328125, 0.9614105224609375, 0.993804931640625, 1.0261993408203125, 1.05859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 8.0, 8.0, 6.0, 10.0, 14.0, 13.0, 15.0, 31.0, 16.0, 21.0, 27.0, 27.0, 33.0, 37.0, 42.0, 33.0, 33.0, 41.0, 43.0, 1053.0, 44.0, 40.0, 41.0, 37.0, 36.0, 41.0, 29.0, 31.0, 30.0, 19.0, 25.0, 15.0, 29.0, 16.0, 15.0, 16.0, 16.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3671875, -4.2254638671875, -4.083740234375, -3.9420166015625, -3.80029296875, -3.6585693359375, -3.516845703125, -3.3751220703125, -3.2333984375, -3.0916748046875, -2.949951171875, -2.8082275390625, -2.66650390625, -2.5247802734375, -2.383056640625, -2.2413330078125, -2.099609375, -1.9578857421875, -1.816162109375, -1.6744384765625, -1.53271484375, -1.3909912109375, -1.249267578125, -1.1075439453125, -0.9658203125, -0.8240966796875, -0.682373046875, -0.5406494140625, -0.39892578125, -0.2572021484375, -0.115478515625, 0.0262451171875, 0.16796875, 0.3096923828125, 0.451416015625, 0.5931396484375, 0.73486328125, 0.8765869140625, 1.018310546875, 1.1600341796875, 1.3017578125, 1.4434814453125, 1.585205078125, 1.7269287109375, 1.86865234375, 2.0103759765625, 2.152099609375, 2.2938232421875, 2.435546875, 2.5772705078125, 2.718994140625, 2.8607177734375, 3.00244140625, 3.1441650390625, 3.285888671875, 3.4276123046875, 3.5693359375, 3.7110595703125, 3.852783203125, 3.9945068359375, 4.13623046875, 4.2779541015625, 4.419677734375, 4.5614013671875, 4.703125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 6.0, 5.0, 9.0, 15.0, 23.0, 50.0, 72.0, 84.0, 143.0, 190.0, 307.0, 430.0, 607.0, 944.0, 1416.0, 2198.0, 3357.0, 4963.0, 7332.0, 11176.0, 17000.0, 27082.0, 44138.0, 74383.0, 129831.0, 1278089.0, 204228.0, 113542.0, 65635.0, 39129.0, 24510.0, 15568.0, 10266.0, 6806.0, 4560.0, 3010.0, 2043.0, 1335.0, 885.0, 561.0, 400.0, 262.0, 176.0, 112.0, 76.0, 54.0, 36.0, 31.0, 18.0, 14.0, 11.0, 6.0, 5.0, 4.0, 0.0, 1.0], "bins": [-1.0, -0.970489501953125, -0.94097900390625, -0.911468505859375, -0.8819580078125, -0.852447509765625, -0.82293701171875, -0.793426513671875, -0.763916015625, -0.734405517578125, -0.70489501953125, -0.675384521484375, -0.6458740234375, -0.616363525390625, -0.58685302734375, -0.557342529296875, -0.52783203125, -0.498321533203125, -0.46881103515625, -0.439300537109375, -0.4097900390625, -0.380279541015625, -0.35076904296875, -0.321258544921875, -0.291748046875, -0.262237548828125, -0.23272705078125, -0.203216552734375, -0.1737060546875, -0.144195556640625, -0.11468505859375, -0.085174560546875, -0.0556640625, -0.026153564453125, 0.00335693359375, 0.032867431640625, 0.0623779296875, 0.091888427734375, 0.12139892578125, 0.150909423828125, 0.180419921875, 0.209930419921875, 0.23944091796875, 0.268951416015625, 0.2984619140625, 0.327972412109375, 0.35748291015625, 0.386993408203125, 0.41650390625, 0.446014404296875, 0.47552490234375, 0.505035400390625, 0.5345458984375, 0.564056396484375, 0.59356689453125, 0.623077392578125, 0.652587890625, 0.682098388671875, 0.71160888671875, 0.741119384765625, 0.7706298828125, 0.800140380859375, 0.82965087890625, 0.859161376953125, 0.888671875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 4.0, 6.0, 9.0, 16.0, 29.0, 39.0, 58.0, 68.0, 92.0, 93.0, 109.0, 119.0, 82.0, 75.0, 46.0, 52.0, 29.0, 14.0, 16.0, 11.0, 5.0, 6.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001422882080078125, -0.0013698935508728027, -0.0013169050216674805, -0.0012639164924621582, -0.001210927963256836, -0.0011579394340515137, -0.0011049509048461914, -0.0010519623756408691, -0.0009989738464355469, -0.0009459853172302246, -0.0008929967880249023, -0.0008400082588195801, -0.0007870197296142578, -0.0007340312004089355, -0.0006810426712036133, -0.000628054141998291, -0.0005750656127929688, -0.0005220770835876465, -0.0004690885543823242, -0.00041610002517700195, -0.0003631114959716797, -0.0003101229667663574, -0.00025713443756103516, -0.0002041459083557129, -0.00015115737915039062, -9.816884994506836e-05, -4.5180320739746094e-05, 7.808208465576172e-06, 6.079673767089844e-05, 0.0001137852668762207, 0.00016677379608154297, 0.00021976232528686523, 0.0002727508544921875, 0.00032573938369750977, 0.00037872791290283203, 0.0004317164421081543, 0.00048470497131347656, 0.0005376935005187988, 0.0005906820297241211, 0.0006436705589294434, 0.0006966590881347656, 0.0007496476173400879, 0.0008026361465454102, 0.0008556246757507324, 0.0009086132049560547, 0.000961601734161377, 0.0010145902633666992, 0.0010675787925720215, 0.0011205673217773438, 0.001173555850982666, 0.0012265443801879883, 0.0012795329093933105, 0.0013325214385986328, 0.001385509967803955, 0.0014384984970092773, 0.0014914870262145996, 0.0015444755554199219, 0.0015974640846252441, 0.0016504526138305664, 0.0017034411430358887, 0.001756429672241211, 0.0018094182014465332, 0.0018624067306518555, 0.0019153952598571777, 0.0019683837890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 1.0, 9.0, 8.0, 11.0, 13.0, 22.0, 36.0, 51.0, 94.0, 148.0, 278.0, 584.0, 1481.0, 1039343.0, 4726.0, 801.0, 357.0, 209.0, 135.0, 94.0, 40.0, 26.0, 16.0, 23.0, 8.0, 6.0, 4.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.039215087890625, -0.03822684288024902, -0.03723859786987305, -0.03625035285949707, -0.035262107849121094, -0.03427386283874512, -0.03328561782836914, -0.032297372817993164, -0.03130912780761719, -0.03032088279724121, -0.029332637786865234, -0.028344392776489258, -0.02735614776611328, -0.026367902755737305, -0.025379657745361328, -0.02439141273498535, -0.023403167724609375, -0.0224149227142334, -0.021426677703857422, -0.020438432693481445, -0.01945018768310547, -0.018461942672729492, -0.017473697662353516, -0.01648545265197754, -0.015497207641601562, -0.014508962631225586, -0.01352071762084961, -0.012532472610473633, -0.011544227600097656, -0.01055598258972168, -0.009567737579345703, -0.008579492568969727, -0.00759124755859375, -0.0066030025482177734, -0.005614757537841797, -0.00462651252746582, -0.0036382675170898438, -0.002650022506713867, -0.0016617774963378906, -0.0006735324859619141, 0.0003147125244140625, 0.001302957534790039, 0.0022912025451660156, 0.003279447555541992, 0.004267692565917969, 0.005255937576293945, 0.006244182586669922, 0.0072324275970458984, 0.008220672607421875, 0.009208917617797852, 0.010197162628173828, 0.011185407638549805, 0.012173652648925781, 0.013161897659301758, 0.014150142669677734, 0.015138387680053711, 0.016126632690429688, 0.017114877700805664, 0.01810312271118164, 0.019091367721557617, 0.020079612731933594, 0.02106785774230957, 0.022056102752685547, 0.023044347763061523, 0.0240325927734375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 48.0, 543.0, 395.0, 25.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021551731042563915, -0.0020686734933406115, -0.0019821738824248314, -0.0018956743879243731, -0.001809174893423915, -0.0017226752825081348, -0.0016361756715923548, -0.0015496761770918965, -0.0014631766825914383, -0.0013766770716756582, -0.0012901775771752, -0.00120367796625942, -0.0011171784717589617, -0.0010306788608431816, -0.0009441793081350625, -0.0008576797554269433, -0.0007711801445111632, -0.0006846805918030441, -0.0005981810390949249, -0.0005116814281791449, -0.00042518190457485616, -0.000338682351866737, -0.0002521827700547874, -0.00016568321734666824, -7.918366463854909e-05, 7.315895345527679e-06, 9.381545532960445e-05, 0.00018031502258963883, 0.000266814575297758, 0.00035331412800587714, 0.00043981370981782675, 0.0005263132625259459, 0.0006128128152340651, 0.0006993123679421842, 0.0007858119206503034, 0.0008723115315660834, 0.0009588110260665417, 0.0010453106369823217, 0.0011318102478981018, 0.00121830974239856, 0.0013048092368990183, 0.0013913088478147984, 0.0014778083423152566, 0.0015643079532310367, 0.001650807447731495, 0.001737307058647275, 0.001823806669563055, 0.0019103061640635133, 0.001996805891394615, 0.0020833055023103952, 0.0021698051132261753, 0.0022563044913113117, 0.002342804102227092, 0.002429303713142872, 0.002515803324058652, 0.002602302934974432, 0.0026888023130595684, 0.0027753019239753485, 0.0028618015348911285, 0.002948300912976265, 0.003034800523892045, 0.003121300134807825, 0.003207799745723605, 0.0032942993566393852, 0.0033807987347245216]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 10.0, 2.0, 9.0, 13.0, 17.0, 22.0, 18.0, 17.0, 24.0, 15.0, 22.0, 31.0, 30.0, 42.0, 37.0, 43.0, 34.0, 57.0, 45.0, 43.0, 43.0, 32.0, 34.0, 44.0, 42.0, 29.0, 37.0, 31.0, 31.0, 23.0, 23.0, 21.0, 11.0, 13.0, 8.0, 17.0, 4.0, 3.0, 6.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005935430526733398, -0.0005748383700847626, -0.0005561336874961853, -0.000537429004907608, -0.0005187243223190308, -0.0005000196397304535, -0.0004813149571418762, -0.00046261027455329895, -0.0004439055919647217, -0.0004252009093761444, -0.00040649622678756714, -0.00038779154419898987, -0.0003690868616104126, -0.00035038217902183533, -0.00033167749643325806, -0.0003129728138446808, -0.0002942681312561035, -0.00027556344866752625, -0.000256858766078949, -0.0002381540834903717, -0.00021944940090179443, -0.00020074471831321716, -0.0001820400357246399, -0.00016333535313606262, -0.00014463067054748535, -0.00012592598795890808, -0.00010722130537033081, -8.851662278175354e-05, -6.981194019317627e-05, -5.1107257604599e-05, -3.240257501602173e-05, -1.3697892427444458e-05, 5.0067901611328125e-06, 2.3711472749710083e-05, 4.2416155338287354e-05, 6.112083792686462e-05, 7.98255205154419e-05, 9.853020310401917e-05, 0.00011723488569259644, 0.0001359395682811737, 0.00015464425086975098, 0.00017334893345832825, 0.00019205361604690552, 0.0002107582986354828, 0.00022946298122406006, 0.00024816766381263733, 0.0002668723464012146, 0.00028557702898979187, 0.00030428171157836914, 0.0003229863941669464, 0.0003416910767555237, 0.00036039575934410095, 0.0003791004419326782, 0.0003978051245212555, 0.00041650980710983276, 0.00043521448969841003, 0.0004539191722869873, 0.0004726238548755646, 0.0004913285374641418, 0.0005100332200527191, 0.0005287379026412964, 0.0005474425852298737, 0.0005661472678184509, 0.0005848519504070282, 0.0006035566329956055]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 8.0, 13.0, 14.0, 17.0, 19.0, 21.0, 16.0, 14.0, 26.0, 13.0, 25.0, 25.0, 24.0, 31.0, 22.0, 20.0, 29.0, 43.0, 32.0, 37.0, 40.0, 36.0, 35.0, 39.0, 35.0, 23.0, 35.0, 27.0, 26.0, 28.0, 25.0, 18.0, 23.0, 18.0, 20.0, 16.0, 12.0, 13.0, 5.0, 11.0, 11.0, 9.0, 5.0, 7.0, 4.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 5.0], "bins": [-6.10546875, -5.9195556640625, -5.733642578125, -5.5477294921875, -5.36181640625, -5.1759033203125, -4.989990234375, -4.8040771484375, -4.6181640625, -4.4322509765625, -4.246337890625, -4.0604248046875, -3.87451171875, -3.6885986328125, -3.502685546875, -3.3167724609375, -3.130859375, -2.9449462890625, -2.759033203125, -2.5731201171875, -2.38720703125, -2.2012939453125, -2.015380859375, -1.8294677734375, -1.6435546875, -1.4576416015625, -1.271728515625, -1.0858154296875, -0.89990234375, -0.7139892578125, -0.528076171875, -0.3421630859375, -0.15625, 0.0296630859375, 0.215576171875, 0.4014892578125, 0.58740234375, 0.7733154296875, 0.959228515625, 1.1451416015625, 1.3310546875, 1.5169677734375, 1.702880859375, 1.8887939453125, 2.07470703125, 2.2606201171875, 2.446533203125, 2.6324462890625, 2.818359375, 3.0042724609375, 3.190185546875, 3.3760986328125, 3.56201171875, 3.7479248046875, 3.933837890625, 4.1197509765625, 4.3056640625, 4.4915771484375, 4.677490234375, 4.8634033203125, 5.04931640625, 5.2352294921875, 5.421142578125, 5.6070556640625, 5.79296875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 9.0, 6.0, 16.0, 17.0, 25.0, 34.0, 44.0, 43.0, 75.0, 103.0, 114.0, 150.0, 198.0, 285.0, 423.0, 604.0, 972.0, 1539.0, 2982.0, 6448.0, 16341.0, 50306.0, 227887.0, 563692.0, 121794.0, 32072.0, 11227.0, 4734.0, 2393.0, 1314.0, 805.0, 557.0, 381.0, 240.0, 183.0, 128.0, 107.0, 72.0, 47.0, 38.0, 26.0, 23.0, 23.0, 14.0, 14.0, 8.0, 9.0, 4.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-11.234375, -10.8756103515625, -10.516845703125, -10.1580810546875, -9.79931640625, -9.4405517578125, -9.081787109375, -8.7230224609375, -8.3642578125, -8.0054931640625, -7.646728515625, -7.2879638671875, -6.92919921875, -6.5704345703125, -6.211669921875, -5.8529052734375, -5.494140625, -5.1353759765625, -4.776611328125, -4.4178466796875, -4.05908203125, -3.7003173828125, -3.341552734375, -2.9827880859375, -2.6240234375, -2.2652587890625, -1.906494140625, -1.5477294921875, -1.18896484375, -0.8302001953125, -0.471435546875, -0.1126708984375, 0.24609375, 0.6048583984375, 0.963623046875, 1.3223876953125, 1.68115234375, 2.0399169921875, 2.398681640625, 2.7574462890625, 3.1162109375, 3.4749755859375, 3.833740234375, 4.1925048828125, 4.55126953125, 4.9100341796875, 5.268798828125, 5.6275634765625, 5.986328125, 6.3450927734375, 6.703857421875, 7.0626220703125, 7.42138671875, 7.7801513671875, 8.138916015625, 8.4976806640625, 8.8564453125, 9.2152099609375, 9.573974609375, 9.9327392578125, 10.29150390625, 10.6502685546875, 11.009033203125, 11.3677978515625, 11.7265625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 3.0, 9.0, 4.0, 16.0, 13.0, 16.0, 16.0, 21.0, 36.0, 24.0, 31.0, 35.0, 54.0, 48.0, 75.0, 129.0, 501.0, 1461.0, 150.0, 68.0, 53.0, 44.0, 39.0, 34.0, 31.0, 32.0, 25.0, 17.0, 13.0, 12.0, 9.0, 8.0, 4.0, 0.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.21875, -19.497314453125, -18.77587890625, -18.054443359375, -17.3330078125, -16.611572265625, -15.89013671875, -15.168701171875, -14.447265625, -13.725830078125, -13.00439453125, -12.282958984375, -11.5615234375, -10.840087890625, -10.11865234375, -9.397216796875, -8.67578125, -7.954345703125, -7.23291015625, -6.511474609375, -5.7900390625, -5.068603515625, -4.34716796875, -3.625732421875, -2.904296875, -2.182861328125, -1.46142578125, -0.739990234375, -0.0185546875, 0.702880859375, 1.42431640625, 2.145751953125, 2.8671875, 3.588623046875, 4.31005859375, 5.031494140625, 5.7529296875, 6.474365234375, 7.19580078125, 7.917236328125, 8.638671875, 9.360107421875, 10.08154296875, 10.802978515625, 11.5244140625, 12.245849609375, 12.96728515625, 13.688720703125, 14.41015625, 15.131591796875, 15.85302734375, 16.574462890625, 17.2958984375, 18.017333984375, 18.73876953125, 19.460205078125, 20.181640625, 20.903076171875, 21.62451171875, 22.345947265625, 23.0673828125, 23.788818359375, 24.51025390625, 25.231689453125, 25.953125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 5.0, 9.0, 12.0, 14.0, 26.0, 28.0, 40.0, 40.0, 58.0, 124.0, 211.0, 402.0, 860.0, 5785.0, 3131179.0, 5068.0, 832.0, 419.0, 221.0, 86.0, 73.0, 35.0, 44.0, 28.0, 22.0, 17.0, 18.0, 10.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-74.8125, -72.7041015625, -70.595703125, -68.4873046875, -66.37890625, -64.2705078125, -62.162109375, -60.0537109375, -57.9453125, -55.8369140625, -53.728515625, -51.6201171875, -49.51171875, -47.4033203125, -45.294921875, -43.1865234375, -41.078125, -38.9697265625, -36.861328125, -34.7529296875, -32.64453125, -30.5361328125, -28.427734375, -26.3193359375, -24.2109375, -22.1025390625, -19.994140625, -17.8857421875, -15.77734375, -13.6689453125, -11.560546875, -9.4521484375, -7.34375, -5.2353515625, -3.126953125, -1.0185546875, 1.08984375, 3.1982421875, 5.306640625, 7.4150390625, 9.5234375, 11.6318359375, 13.740234375, 15.8486328125, 17.95703125, 20.0654296875, 22.173828125, 24.2822265625, 26.390625, 28.4990234375, 30.607421875, 32.7158203125, 34.82421875, 36.9326171875, 39.041015625, 41.1494140625, 43.2578125, 45.3662109375, 47.474609375, 49.5830078125, 51.69140625, 53.7998046875, 55.908203125, 58.0166015625, 60.125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 212.0, 785.0, 14.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-102.9189453125, -96.56126403808594, -90.2035903930664, -83.84590911865234, -77.48823547363281, -71.13055419921875, -64.77287292480469, -58.41519546508789, -52.057518005371094, -45.6998405456543, -39.3421630859375, -32.98448181152344, -26.62680435180664, -20.269126892089844, -13.911445617675781, -7.553768157958984, -1.1960906982421875, 5.161587715148926, 11.519266128540039, 17.87694549560547, 24.234622955322266, 30.592300415039062, 36.949981689453125, 43.30765914916992, 49.66533660888672, 56.023014068603516, 62.38069152832031, 68.73837280273438, 75.09605407714844, 81.45372772216797, 87.81140899658203, 94.16908264160156, 100.52676391601562, 106.88444519042969, 113.24211883544922, 119.59980010986328, 125.95747375488281, 132.31515502929688, 138.67283630371094, 145.030517578125, 151.38818359375, 157.74586486816406, 164.10354614257812, 170.46121215820312, 176.8188934326172, 183.17657470703125, 189.5342559814453, 195.89193725585938, 202.24961853027344, 208.6072998046875, 214.96498107910156, 221.32266235351562, 227.68032836914062, 234.0380096435547, 240.39569091796875, 246.7533721923828, 253.11105346679688, 259.4687194824219, 265.826416015625, 272.18408203125, 278.5417785644531, 284.8994445800781, 291.25714111328125, 297.61480712890625, 303.97247314453125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 7.0, 8.0, 6.0, 12.0, 14.0, 21.0, 23.0, 30.0, 20.0, 26.0, 35.0, 37.0, 42.0, 38.0, 41.0, 35.0, 39.0, 55.0, 36.0, 41.0, 55.0, 49.0, 32.0, 36.0, 27.0, 26.0, 37.0, 29.0, 14.0, 27.0, 18.0, 19.0, 10.0, 16.0, 9.0, 8.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.13600158691406, -45.44004440307617, -43.74408721923828, -42.04813003540039, -40.3521728515625, -38.65621566772461, -36.96025848388672, -35.264305114746094, -33.56834411621094, -31.872386932373047, -30.176429748535156, -28.480472564697266, -26.784515380859375, -25.088558197021484, -23.392602920532227, -21.696645736694336, -20.000690460205078, -18.304733276367188, -16.608776092529297, -14.912819862365723, -13.216862678527832, -11.520905494689941, -9.824949264526367, -8.128992080688477, -6.433034896850586, -4.737077713012695, -3.041121006011963, -1.3451642990112305, 0.35079288482666016, 2.046750068664551, 3.742706298828125, 5.438663482666016, 7.134620666503906, 8.830577850341797, 10.526535034179688, 12.222491264343262, 13.918448448181152, 15.614405632019043, 17.310361862182617, 19.006319046020508, 20.7022762298584, 22.39823341369629, 24.09419059753418, 25.790145874023438, 27.486103057861328, 29.18206024169922, 30.87801742553711, 32.573974609375, 34.26993179321289, 35.96588897705078, 37.66184616088867, 39.35780334472656, 41.05376052856445, 42.749717712402344, 44.44567108154297, 46.141632080078125, 47.83758544921875, 49.53354263305664, 51.22949981689453, 52.92545700073242, 54.62141418457031, 56.3173713684082, 58.013328552246094, 59.70928192138672, 61.405242919921875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 9.0, 7.0, 24.0, 11.0, 11.0, 18.0, 21.0, 19.0, 29.0, 30.0, 29.0, 44.0, 35.0, 47.0, 35.0, 42.0, 48.0, 29.0, 49.0, 26.0, 45.0, 29.0, 32.0, 33.0, 31.0, 28.0, 29.0, 26.0, 30.0, 22.0, 20.0, 21.0, 13.0, 13.0, 13.0, 12.0, 10.0, 3.0, 4.0, 9.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0], "bins": [-9.734375, -9.46588134765625, -9.1973876953125, -8.92889404296875, -8.660400390625, -8.39190673828125, -8.1234130859375, -7.85491943359375, -7.58642578125, -7.31793212890625, -7.0494384765625, -6.78094482421875, -6.512451171875, -6.24395751953125, -5.9754638671875, -5.70697021484375, -5.4384765625, -5.16998291015625, -4.9014892578125, -4.63299560546875, -4.364501953125, -4.09600830078125, -3.8275146484375, -3.55902099609375, -3.29052734375, -3.02203369140625, -2.7535400390625, -2.48504638671875, -2.216552734375, -1.94805908203125, -1.6795654296875, -1.41107177734375, -1.142578125, -0.87408447265625, -0.6055908203125, -0.33709716796875, -0.068603515625, 0.19989013671875, 0.4683837890625, 0.73687744140625, 1.00537109375, 1.27386474609375, 1.5423583984375, 1.81085205078125, 2.079345703125, 2.34783935546875, 2.6163330078125, 2.88482666015625, 3.1533203125, 3.42181396484375, 3.6903076171875, 3.95880126953125, 4.227294921875, 4.49578857421875, 4.7642822265625, 5.03277587890625, 5.30126953125, 5.56976318359375, 5.8382568359375, 6.10675048828125, 6.375244140625, 6.64373779296875, 6.9122314453125, 7.18072509765625, 7.44921875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 6.0, 3.0, 7.0, 10.0, 14.0, 19.0, 30.0, 37.0, 37.0, 45.0, 50.0, 73.0, 100.0, 155.0, 169.0, 241.0, 383.0, 586.0, 1149.0, 3305.0, 309736.0, 3857340.0, 16338.0, 1887.0, 784.0, 501.0, 336.0, 238.0, 174.0, 118.0, 79.0, 71.0, 52.0, 40.0, 32.0, 44.0, 25.0, 20.0, 17.0, 6.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.875, -64.9248046875, -62.974609375, -61.0244140625, -59.07421875, -57.1240234375, -55.173828125, -53.2236328125, -51.2734375, -49.3232421875, -47.373046875, -45.4228515625, -43.47265625, -41.5224609375, -39.572265625, -37.6220703125, -35.671875, -33.7216796875, -31.771484375, -29.8212890625, -27.87109375, -25.9208984375, -23.970703125, -22.0205078125, -20.0703125, -18.1201171875, -16.169921875, -14.2197265625, -12.26953125, -10.3193359375, -8.369140625, -6.4189453125, -4.46875, -2.5185546875, -0.568359375, 1.3818359375, 3.33203125, 5.2822265625, 7.232421875, 9.1826171875, 11.1328125, 13.0830078125, 15.033203125, 16.9833984375, 18.93359375, 20.8837890625, 22.833984375, 24.7841796875, 26.734375, 28.6845703125, 30.634765625, 32.5849609375, 34.53515625, 36.4853515625, 38.435546875, 40.3857421875, 42.3359375, 44.2861328125, 46.236328125, 48.1865234375, 50.13671875, 52.0869140625, 54.037109375, 55.9873046875, 57.9375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 3.0, 7.0, 7.0, 19.0, 39.0, 76.0, 135.0, 377.0, 805.0, 1144.0, 834.0, 359.0, 125.0, 63.0, 27.0, 18.0, 9.0, 3.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.75, -25.87255859375, -24.9951171875, -24.11767578125, -23.240234375, -22.36279296875, -21.4853515625, -20.60791015625, -19.73046875, -18.85302734375, -17.9755859375, -17.09814453125, -16.220703125, -15.34326171875, -14.4658203125, -13.58837890625, -12.7109375, -11.83349609375, -10.9560546875, -10.07861328125, -9.201171875, -8.32373046875, -7.4462890625, -6.56884765625, -5.69140625, -4.81396484375, -3.9365234375, -3.05908203125, -2.181640625, -1.30419921875, -0.4267578125, 0.45068359375, 1.328125, 2.20556640625, 3.0830078125, 3.96044921875, 4.837890625, 5.71533203125, 6.5927734375, 7.47021484375, 8.34765625, 9.22509765625, 10.1025390625, 10.97998046875, 11.857421875, 12.73486328125, 13.6123046875, 14.48974609375, 15.3671875, 16.24462890625, 17.1220703125, 17.99951171875, 18.876953125, 19.75439453125, 20.6318359375, 21.50927734375, 22.38671875, 23.26416015625, 24.1416015625, 25.01904296875, 25.896484375, 26.77392578125, 27.6513671875, 28.52880859375, 29.40625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 6.0, 19.0, 23.0, 29.0, 87.0, 213.0, 573.0, 1800.0, 9179.0, 488343.0, 3663311.0, 26046.0, 3130.0, 890.0, 337.0, 126.0, 66.0, 26.0, 15.0, 11.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.90478515625, -34.7158203125, -33.52685546875, -32.337890625, -31.14892578125, -29.9599609375, -28.77099609375, -27.58203125, -26.39306640625, -25.2041015625, -24.01513671875, -22.826171875, -21.63720703125, -20.4482421875, -19.25927734375, -18.0703125, -16.88134765625, -15.6923828125, -14.50341796875, -13.314453125, -12.12548828125, -10.9365234375, -9.74755859375, -8.55859375, -7.36962890625, -6.1806640625, -4.99169921875, -3.802734375, -2.61376953125, -1.4248046875, -0.23583984375, 0.953125, 2.14208984375, 3.3310546875, 4.52001953125, 5.708984375, 6.89794921875, 8.0869140625, 9.27587890625, 10.46484375, 11.65380859375, 12.8427734375, 14.03173828125, 15.220703125, 16.40966796875, 17.5986328125, 18.78759765625, 19.9765625, 21.16552734375, 22.3544921875, 23.54345703125, 24.732421875, 25.92138671875, 27.1103515625, 28.29931640625, 29.48828125, 30.67724609375, 31.8662109375, 33.05517578125, 34.244140625, 35.43310546875, 36.6220703125, 37.81103515625, 39.0]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 10.0, 22.0, 59.0, 184.0, 318.0, 250.0, 122.0, 35.0, 8.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.4215087890625, -217.6017303466797, -209.7819366455078, -201.962158203125, -194.1423797607422, -186.3225860595703, -178.5028076171875, -170.68301391601562, -162.8632354736328, -155.04345703125, -147.22366333007812, -139.4038848876953, -131.5841064453125, -123.76431274414062, -115.94453430175781, -108.12474822998047, -100.30496978759766, -92.48518371582031, -84.6654052734375, -76.84561920166016, -69.02583312988281, -61.206050872802734, -53.386268615722656, -45.56648254394531, -37.746700286865234, -29.926916122436523, -22.107131958007812, -14.287349700927734, -6.467565536499023, 1.3522186279296875, 9.172000885009766, 16.99178695678711, 24.811569213867188, 32.631351470947266, 40.45113754272461, 48.27091979980469, 56.09070587158203, 63.91048812866211, 71.73027038574219, 79.55005645751953, 87.36984252929688, 95.18962860107422, 103.00940704345703, 110.82919311523438, 118.64897918701172, 126.46876525878906, 134.28854370117188, 142.10833740234375, 149.9281005859375, 157.7478790283203, 165.5676727294922, 173.387451171875, 181.2072296142578, 189.0270233154297, 196.8468017578125, 204.66659545898438, 212.4863739013672, 220.30615234375, 228.12594604492188, 235.9457244873047, 243.7655029296875, 251.58529663085938, 259.40509033203125, 267.224853515625, 275.0446472167969]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 5.0, 14.0, 8.0, 14.0, 20.0, 22.0, 27.0, 21.0, 45.0, 42.0, 36.0, 43.0, 52.0, 55.0, 50.0, 57.0, 42.0, 46.0, 47.0, 48.0, 57.0, 24.0, 33.0, 26.0, 31.0, 25.0, 20.0, 23.0, 21.0, 8.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.245452880859375, -52.4891471862793, -50.73284149169922, -48.976531982421875, -47.2202262878418, -45.46392059326172, -43.707611083984375, -41.9513053894043, -40.19499969482422, -38.43869400024414, -36.68238830566406, -34.92607879638672, -33.16977310180664, -31.413467407226562, -29.65715980529785, -27.90085220336914, -26.144546508789062, -24.388240814208984, -22.631933212280273, -20.875625610351562, -19.119319915771484, -17.363014221191406, -15.606706619262695, -13.8503999710083, -12.094093322753906, -10.337786674499512, -8.581480026245117, -6.825173377990723, -5.068866729736328, -3.3125600814819336, -1.556253433227539, 0.20005321502685547, 1.95635986328125, 3.7126665115356445, 5.468973159790039, 7.225279808044434, 8.981586456298828, 10.737893104553223, 12.494199752807617, 14.250506401062012, 16.006813049316406, 17.763118743896484, 19.519426345825195, 21.275733947753906, 23.032039642333984, 24.788345336914062, 26.544652938842773, 28.300960540771484, 30.057266235351562, 31.81357192993164, 33.56987762451172, 35.32618713378906, 37.08249282836914, 38.83879852294922, 40.59510803222656, 42.35141372680664, 44.10771942138672, 45.8640251159668, 47.620330810546875, 49.37664031982422, 51.1329460144043, 52.889251708984375, 54.64556121826172, 56.4018669128418, 58.158172607421875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 12.0, 8.0, 16.0, 14.0, 20.0, 33.0, 38.0, 33.0, 41.0, 54.0, 66.0, 68.0, 59.0, 58.0, 49.0, 57.0, 46.0, 64.0, 61.0, 34.0, 26.0, 29.0, 25.0, 23.0, 17.0, 16.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.3125, -88.1494140625, -84.986328125, -81.8232421875, -78.66015625, -75.4970703125, -72.333984375, -69.1708984375, -66.0078125, -62.8447265625, -59.681640625, -56.5185546875, -53.35546875, -50.1923828125, -47.029296875, -43.8662109375, -40.703125, -37.5400390625, -34.376953125, -31.2138671875, -28.05078125, -24.8876953125, -21.724609375, -18.5615234375, -15.3984375, -12.2353515625, -9.072265625, -5.9091796875, -2.74609375, 0.4169921875, 3.580078125, 6.7431640625, 9.90625, 13.0693359375, 16.232421875, 19.3955078125, 22.55859375, 25.7216796875, 28.884765625, 32.0478515625, 35.2109375, 38.3740234375, 41.537109375, 44.7001953125, 47.86328125, 51.0263671875, 54.189453125, 57.3525390625, 60.515625, 63.6787109375, 66.841796875, 70.0048828125, 73.16796875, 76.3310546875, 79.494140625, 82.6572265625, 85.8203125, 88.9833984375, 92.146484375, 95.3095703125, 98.47265625, 101.6357421875, 104.798828125, 107.9619140625, 111.125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 14.0, 17.0, 16.0, 33.0, 29.0, 48.0, 57.0, 95.0, 115.0, 179.0, 288.0, 453.0, 685.0, 1105.0, 1901.0, 3656.0, 6225.0, 11228.0, 20523.0, 39724.0, 80707.0, 176470.0, 327828.0, 194692.0, 89269.0, 43257.0, 22013.0, 12103.0, 6705.0, 3692.0, 2154.0, 1212.0, 695.0, 409.0, 295.0, 165.0, 134.0, 95.0, 80.0, 65.0, 25.0, 26.0, 18.0, 10.0, 10.0, 10.0, 1.0, 0.0, 6.0, 2.0, 5.0, 5.0], "bins": [-14.2890625, -13.8756103515625, -13.462158203125, -13.0487060546875, -12.63525390625, -12.2218017578125, -11.808349609375, -11.3948974609375, -10.9814453125, -10.5679931640625, -10.154541015625, -9.7410888671875, -9.32763671875, -8.9141845703125, -8.500732421875, -8.0872802734375, -7.673828125, -7.2603759765625, -6.846923828125, -6.4334716796875, -6.02001953125, -5.6065673828125, -5.193115234375, -4.7796630859375, -4.3662109375, -3.9527587890625, -3.539306640625, -3.1258544921875, -2.71240234375, -2.2989501953125, -1.885498046875, -1.4720458984375, -1.05859375, -0.6451416015625, -0.231689453125, 0.1817626953125, 0.59521484375, 1.0086669921875, 1.422119140625, 1.8355712890625, 2.2490234375, 2.6624755859375, 3.075927734375, 3.4893798828125, 3.90283203125, 4.3162841796875, 4.729736328125, 5.1431884765625, 5.556640625, 5.9700927734375, 6.383544921875, 6.7969970703125, 7.21044921875, 7.6239013671875, 8.037353515625, 8.4508056640625, 8.8642578125, 9.2777099609375, 9.691162109375, 10.1046142578125, 10.51806640625, 10.9315185546875, 11.344970703125, 11.7584228515625, 12.171875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 8.0, 4.0, 12.0, 5.0, 9.0, 13.0, 14.0, 13.0, 19.0, 21.0, 18.0, 30.0, 23.0, 32.0, 39.0, 45.0, 46.0, 40.0, 47.0, 54.0, 1064.0, 42.0, 33.0, 54.0, 30.0, 36.0, 27.0, 27.0, 31.0, 27.0, 21.0, 29.0, 21.0, 18.0, 9.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 5.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.34375, -38.9150390625, -37.486328125, -36.0576171875, -34.62890625, -33.2001953125, -31.771484375, -30.3427734375, -28.9140625, -27.4853515625, -26.056640625, -24.6279296875, -23.19921875, -21.7705078125, -20.341796875, -18.9130859375, -17.484375, -16.0556640625, -14.626953125, -13.1982421875, -11.76953125, -10.3408203125, -8.912109375, -7.4833984375, -6.0546875, -4.6259765625, -3.197265625, -1.7685546875, -0.33984375, 1.0888671875, 2.517578125, 3.9462890625, 5.375, 6.8037109375, 8.232421875, 9.6611328125, 11.08984375, 12.5185546875, 13.947265625, 15.3759765625, 16.8046875, 18.2333984375, 19.662109375, 21.0908203125, 22.51953125, 23.9482421875, 25.376953125, 26.8056640625, 28.234375, 29.6630859375, 31.091796875, 32.5205078125, 33.94921875, 35.3779296875, 36.806640625, 38.2353515625, 39.6640625, 41.0927734375, 42.521484375, 43.9501953125, 45.37890625, 46.8076171875, 48.236328125, 49.6650390625, 51.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 16.0, 24.0, 36.0, 57.0, 92.0, 96.0, 163.0, 226.0, 352.0, 479.0, 726.0, 1036.0, 1528.0, 2361.0, 3383.0, 5032.0, 7607.0, 11480.0, 18571.0, 29805.0, 50272.0, 88573.0, 159433.0, 1305468.0, 172669.0, 95583.0, 53781.0, 31772.0, 19678.0, 12542.0, 7971.0, 5366.0, 3489.0, 2360.0, 1573.0, 1069.0, 743.0, 508.0, 351.0, 268.0, 196.0, 134.0, 95.0, 54.0, 42.0, 21.0, 20.0, 11.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.34375, -9.0477294921875, -8.751708984375, -8.4556884765625, -8.15966796875, -7.8636474609375, -7.567626953125, -7.2716064453125, -6.9755859375, -6.6795654296875, -6.383544921875, -6.0875244140625, -5.79150390625, -5.4954833984375, -5.199462890625, -4.9034423828125, -4.607421875, -4.3114013671875, -4.015380859375, -3.7193603515625, -3.42333984375, -3.1273193359375, -2.831298828125, -2.5352783203125, -2.2392578125, -1.9432373046875, -1.647216796875, -1.3511962890625, -1.05517578125, -0.7591552734375, -0.463134765625, -0.1671142578125, 0.12890625, 0.4249267578125, 0.720947265625, 1.0169677734375, 1.31298828125, 1.6090087890625, 1.905029296875, 2.2010498046875, 2.4970703125, 2.7930908203125, 3.089111328125, 3.3851318359375, 3.68115234375, 3.9771728515625, 4.273193359375, 4.5692138671875, 4.865234375, 5.1612548828125, 5.457275390625, 5.7532958984375, 6.04931640625, 6.3453369140625, 6.641357421875, 6.9373779296875, 7.2333984375, 7.5294189453125, 7.825439453125, 8.1214599609375, 8.41748046875, 8.7135009765625, 9.009521484375, 9.3055419921875, 9.6015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 8.0, 7.0, 9.0, 19.0, 13.0, 14.0, 9.0, 19.0, 19.0, 20.0, 26.0, 41.0, 31.0, 37.0, 51.0, 54.0, 42.0, 78.0, 72.0, 58.0, 53.0, 49.0, 41.0, 31.0, 25.0, 26.0, 14.0, 22.0, 14.0, 8.0, 10.0, 8.0, 14.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.010955810546875, -0.010612010955810547, -0.010268211364746094, -0.00992441177368164, -0.009580612182617188, -0.009236812591552734, -0.008893013000488281, -0.008549213409423828, -0.008205413818359375, -0.007861614227294922, -0.007517814636230469, -0.007174015045166016, -0.0068302154541015625, -0.006486415863037109, -0.006142616271972656, -0.005798816680908203, -0.00545501708984375, -0.005111217498779297, -0.004767417907714844, -0.004423618316650391, -0.0040798187255859375, -0.0037360191345214844, -0.0033922195434570312, -0.003048419952392578, -0.002704620361328125, -0.002360820770263672, -0.0020170211791992188, -0.0016732215881347656, -0.0013294219970703125, -0.0009856224060058594, -0.0006418228149414062, -0.0002980232238769531, 4.57763671875e-05, 0.0003895759582519531, 0.0007333755493164062, 0.0010771751403808594, 0.0014209747314453125, 0.0017647743225097656, 0.0021085739135742188, 0.002452373504638672, 0.002796173095703125, 0.003139972686767578, 0.0034837722778320312, 0.0038275718688964844, 0.0041713714599609375, 0.004515171051025391, 0.004858970642089844, 0.005202770233154297, 0.00554656982421875, 0.005890369415283203, 0.006234169006347656, 0.006577968597412109, 0.0069217681884765625, 0.007265567779541016, 0.007609367370605469, 0.007953166961669922, 0.008296966552734375, 0.008640766143798828, 0.008984565734863281, 0.009328365325927734, 0.009672164916992188, 0.01001596450805664, 0.010359764099121094, 0.010703563690185547, 0.01104736328125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 9.0, 16.0, 14.0, 33.0, 30.0, 38.0, 62.0, 95.0, 138.0, 190.0, 270.0, 438.0, 1046.0, 3207.0, 15891.0, 136588.0, 735658.0, 133545.0, 15688.0, 3164.0, 981.0, 504.0, 277.0, 201.0, 118.0, 87.0, 78.0, 44.0, 47.0, 24.0, 14.0, 17.0, 4.0, 5.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12017822265625, -0.1163625717163086, -0.11254692077636719, -0.10873126983642578, -0.10491561889648438, -0.10109996795654297, -0.09728431701660156, -0.09346866607666016, -0.08965301513671875, -0.08583736419677734, -0.08202171325683594, -0.07820606231689453, -0.07439041137695312, -0.07057476043701172, -0.06675910949707031, -0.0629434585571289, -0.0591278076171875, -0.055312156677246094, -0.05149650573730469, -0.04768085479736328, -0.043865203857421875, -0.04004955291748047, -0.03623390197753906, -0.032418251037597656, -0.02860260009765625, -0.024786949157714844, -0.020971298217773438, -0.01715564727783203, -0.013339996337890625, -0.009524345397949219, -0.0057086944580078125, -0.0018930435180664062, 0.001922607421875, 0.005738258361816406, 0.009553909301757812, 0.013369560241699219, 0.017185211181640625, 0.02100086212158203, 0.024816513061523438, 0.028632164001464844, 0.03244781494140625, 0.036263465881347656, 0.04007911682128906, 0.04389476776123047, 0.047710418701171875, 0.05152606964111328, 0.05534172058105469, 0.059157371520996094, 0.0629730224609375, 0.0667886734008789, 0.07060432434082031, 0.07441997528076172, 0.07823562622070312, 0.08205127716064453, 0.08586692810058594, 0.08968257904052734, 0.09349822998046875, 0.09731388092041016, 0.10112953186035156, 0.10494518280029297, 0.10876083374023438, 0.11257648468017578, 0.11639213562011719, 0.1202077865600586, 0.1240234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 16.0, 42.0, 106.0, 170.0, 239.0, 206.0, 128.0, 60.0, 25.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01266908273100853, -0.011856491677463055, -0.011043899692595005, -0.01023130863904953, -0.009418717585504055, -0.00860612653195858, -0.00779353454709053, -0.006980943493545055, -0.006168351974338293, -0.005355760455131531, -0.004543169401586056, -0.0037305778823792934, -0.0029179865960031748, -0.002105395309627056, -0.0012928037904202938, -0.0004802127368748188, 0.0003323787823319435, 0.0011449700687080622, 0.001957561355084181, 0.002770152874290943, 0.003582744160667062, 0.0043953354470431805, 0.005207926966249943, 0.006020518019795418, 0.00683310953900218, 0.007645701058208942, 0.008458292111754417, 0.009270884096622467, 0.010083475150167942, 0.010896066203713417, 0.011708658188581467, 0.012521248310804367, 0.013333840295672417, 0.014146431349217892, 0.014959023334085941, 0.015771614387631416, 0.016584206372499466, 0.017396796494722366, 0.018209388479590416, 0.019021980464458466, 0.019834570586681366, 0.020647162571549416, 0.021459752693772316, 0.022272344678640366, 0.023084936663508415, 0.023897526785731316, 0.024710118770599365, 0.025522708892822266, 0.026335302740335464, 0.027147894725203514, 0.027960484847426414, 0.028773076832294464, 0.029585668817162514, 0.030398258939385414, 0.031210850924253464, 0.032023441046476364, 0.032836031168699265, 0.033648621290922165, 0.034461215138435364, 0.035273805260658264, 0.036086395382881165, 0.03689898923039436, 0.037711579352617264, 0.038524169474840164, 0.03933676332235336]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 3.0, 8.0, 8.0, 9.0, 10.0, 21.0, 20.0, 18.0, 19.0, 23.0, 29.0, 29.0, 36.0, 41.0, 40.0, 35.0, 40.0, 44.0, 41.0, 49.0, 40.0, 59.0, 50.0, 31.0, 32.0, 29.0, 41.0, 24.0, 27.0, 20.0, 20.0, 12.0, 22.0, 10.0, 11.0, 9.0, 10.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.007381021976470947, -0.007165335118770599, -0.0069496482610702515, -0.0067339614033699036, -0.006518274545669556, -0.006302587687969208, -0.00608690083026886, -0.005871213972568512, -0.005655527114868164, -0.005439840257167816, -0.005224153399467468, -0.00500846654176712, -0.0047927796840667725, -0.0045770928263664246, -0.004361405968666077, -0.004145719110965729, -0.003930032253265381, -0.003714345395565033, -0.003498658537864685, -0.003282971680164337, -0.0030672848224639893, -0.0028515979647636414, -0.0026359111070632935, -0.0024202242493629456, -0.0022045373916625977, -0.0019888505339622498, -0.0017731636762619019, -0.001557476818561554, -0.001341789960861206, -0.0011261031031608582, -0.0009104162454605103, -0.0006947293877601624, -0.00047904253005981445, -0.00026335567235946655, -4.766881465911865e-05, 0.00016801804304122925, 0.00038370490074157715, 0.000599391758441925, 0.000815078616142273, 0.0010307654738426208, 0.0012464523315429688, 0.0014621391892433167, 0.0016778260469436646, 0.0018935129046440125, 0.0021091997623443604, 0.0023248866200447083, 0.002540573477745056, 0.002756260335445404, 0.002971947193145752, 0.0031876340508461, 0.0034033209085464478, 0.0036190077662467957, 0.0038346946239471436, 0.0040503814816474915, 0.004266068339347839, 0.004481755197048187, 0.004697442054748535, 0.004913128912448883, 0.005128815770149231, 0.005344502627849579, 0.005560189485549927, 0.005775876343250275, 0.0059915632009506226, 0.0062072500586509705, 0.006422936916351318]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 12.0, 8.0, 16.0, 14.0, 20.0, 32.0, 39.0, 33.0, 41.0, 54.0, 66.0, 68.0, 58.0, 59.0, 49.0, 57.0, 46.0, 64.0, 61.0, 34.0, 26.0, 29.0, 25.0, 22.0, 18.0, 16.0, 10.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.3125, -88.150390625, -84.98828125, -81.826171875, -78.6640625, -75.501953125, -72.33984375, -69.177734375, -66.015625, -62.853515625, -59.69140625, -56.529296875, -53.3671875, -50.205078125, -47.04296875, -43.880859375, -40.71875, -37.556640625, -34.39453125, -31.232421875, -28.0703125, -24.908203125, -21.74609375, -18.583984375, -15.421875, -12.259765625, -9.09765625, -5.935546875, -2.7734375, 0.388671875, 3.55078125, 6.712890625, 9.875, 13.037109375, 16.19921875, 19.361328125, 22.5234375, 25.685546875, 28.84765625, 32.009765625, 35.171875, 38.333984375, 41.49609375, 44.658203125, 47.8203125, 50.982421875, 54.14453125, 57.306640625, 60.46875, 63.630859375, 66.79296875, 69.955078125, 73.1171875, 76.279296875, 79.44140625, 82.603515625, 85.765625, 88.927734375, 92.08984375, 95.251953125, 98.4140625, 101.576171875, 104.73828125, 107.900390625, 111.0625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 1.0, 4.0, 7.0, 12.0, 6.0, 25.0, 22.0, 47.0, 64.0, 114.0, 144.0, 293.0, 466.0, 1067.0, 2161.0, 5271.0, 16886.0, 100142.0, 702725.0, 182653.0, 24294.0, 6720.0, 2813.0, 1206.0, 568.0, 307.0, 187.0, 117.0, 75.0, 45.0, 38.0, 23.0, 18.0, 13.0, 6.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.390625, -22.5439453125, -21.697265625, -20.8505859375, -20.00390625, -19.1572265625, -18.310546875, -17.4638671875, -16.6171875, -15.7705078125, -14.923828125, -14.0771484375, -13.23046875, -12.3837890625, -11.537109375, -10.6904296875, -9.84375, -8.9970703125, -8.150390625, -7.3037109375, -6.45703125, -5.6103515625, -4.763671875, -3.9169921875, -3.0703125, -2.2236328125, -1.376953125, -0.5302734375, 0.31640625, 1.1630859375, 2.009765625, 2.8564453125, 3.703125, 4.5498046875, 5.396484375, 6.2431640625, 7.08984375, 7.9365234375, 8.783203125, 9.6298828125, 10.4765625, 11.3232421875, 12.169921875, 13.0166015625, 13.86328125, 14.7099609375, 15.556640625, 16.4033203125, 17.25, 18.0966796875, 18.943359375, 19.7900390625, 20.63671875, 21.4833984375, 22.330078125, 23.1767578125, 24.0234375, 24.8701171875, 25.716796875, 26.5634765625, 27.41015625, 28.2568359375, 29.103515625, 29.9501953125, 30.796875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 12.0, 18.0, 33.0, 37.0, 46.0, 67.0, 80.0, 79.0, 98.0, 2116.0, 82.0, 65.0, 76.0, 50.0, 36.0, 44.0, 26.0, 25.0, 10.0, 16.0, 9.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.125, -154.25, -148.375, -142.5, -136.625, -130.75, -124.875, -119.0, -113.125, -107.25, -101.375, -95.5, -89.625, -83.75, -77.875, -72.0, -66.125, -60.25, -54.375, -48.5, -42.625, -36.75, -30.875, -25.0, -19.125, -13.25, -7.375, -1.5, 4.375, 10.25, 16.125, 22.0, 27.875, 33.75, 39.625, 45.5, 51.375, 57.25, 63.125, 69.0, 74.875, 80.75, 86.625, 92.5, 98.375, 104.25, 110.125, 116.0, 121.875, 127.75, 133.625, 139.5, 145.375, 151.25, 157.125, 163.0, 168.875, 174.75, 180.625, 186.5, 192.375, 198.25, 204.125, 210.0, 215.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 10.0, 10.0, 6.0, 18.0, 26.0, 36.0, 61.0, 71.0, 126.0, 191.0, 257.0, 436.0, 889.0, 2211.0, 9901.0, 148183.0, 2916189.0, 57941.0, 5754.0, 1606.0, 679.0, 364.0, 228.0, 149.0, 101.0, 72.0, 41.0, 34.0, 20.0, 18.0, 11.0, 10.0, 4.0, 12.0, 5.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.46875, -38.31982421875, -37.1708984375, -36.02197265625, -34.873046875, -33.72412109375, -32.5751953125, -31.42626953125, -30.27734375, -29.12841796875, -27.9794921875, -26.83056640625, -25.681640625, -24.53271484375, -23.3837890625, -22.23486328125, -21.0859375, -19.93701171875, -18.7880859375, -17.63916015625, -16.490234375, -15.34130859375, -14.1923828125, -13.04345703125, -11.89453125, -10.74560546875, -9.5966796875, -8.44775390625, -7.298828125, -6.14990234375, -5.0009765625, -3.85205078125, -2.703125, -1.55419921875, -0.4052734375, 0.74365234375, 1.892578125, 3.04150390625, 4.1904296875, 5.33935546875, 6.48828125, 7.63720703125, 8.7861328125, 9.93505859375, 11.083984375, 12.23291015625, 13.3818359375, 14.53076171875, 15.6796875, 16.82861328125, 17.9775390625, 19.12646484375, 20.275390625, 21.42431640625, 22.5732421875, 23.72216796875, 24.87109375, 26.02001953125, 27.1689453125, 28.31787109375, 29.466796875, 30.61572265625, 31.7646484375, 32.91357421875, 34.0625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 12.0, 37.0, 208.0, 492.0, 192.0, 39.0, 13.0, 6.0, 2.0, 3.0, 4.0, 5.0, 1.0], "bins": [-1014.8699951171875, -996.2274780273438, -977.5849609375, -958.9424438476562, -940.2999267578125, -921.657470703125, -903.0149536132812, -884.3724365234375, -865.7299194335938, -847.08740234375, -828.4448852539062, -809.8023681640625, -791.159912109375, -772.5173950195312, -753.8748779296875, -735.2323608398438, -716.58984375, -697.9473266601562, -679.3048095703125, -660.6622924804688, -642.019775390625, -623.3773193359375, -604.7348022460938, -586.09228515625, -567.4497680664062, -548.8072509765625, -530.1647338867188, -511.5222473144531, -492.8797302246094, -474.2372131347656, -455.5947265625, -436.95220947265625, -418.3096618652344, -399.6671447753906, -381.024658203125, -362.38214111328125, -343.7396240234375, -325.09710693359375, -306.45458984375, -287.8121032714844, -269.1695861816406, -250.52706909179688, -231.8845672607422, -213.2420654296875, -194.59954833984375, -175.95703125, -157.3145294189453, -138.67202758789062, -120.02951049804688, -101.38700103759766, -82.74449157714844, -64.10198211669922, -45.45947265625, -26.81696319580078, -8.174453735351562, 10.468048095703125, 29.110565185546875, 47.753074645996094, 66.39558410644531, 85.03809356689453, 103.68060302734375, 122.32311248779297, 140.9656219482422, 159.60812377929688, 178.25064086914062]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 4.0, 5.0, 9.0, 11.0, 12.0, 17.0, 23.0, 27.0, 25.0, 28.0, 35.0, 33.0, 38.0, 28.0, 50.0, 38.0, 48.0, 34.0, 48.0, 55.0, 42.0, 29.0, 52.0, 41.0, 30.0, 30.0, 40.0, 27.0, 24.0, 16.0, 14.0, 18.0, 13.0, 10.0, 4.0, 8.0, 3.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.74847412109375, -144.1166229248047, -139.48475646972656, -134.8529052734375, -130.22103881835938, -125.58918762207031, -120.95732879638672, -116.32546997070312, -111.69361114501953, -107.06175231933594, -102.42989349365234, -97.79803466796875, -93.16618347167969, -88.53431701660156, -83.9024658203125, -79.2706069946289, -74.63874816894531, -70.00688934326172, -65.37503051757812, -60.7431755065918, -56.1113166809082, -51.47945785522461, -46.84760284423828, -42.21574401855469, -37.583885192871094, -32.9520263671875, -28.32016944885254, -23.688312530517578, -19.056453704833984, -14.42459487915039, -9.79273796081543, -5.160881042480469, -0.5290374755859375, 4.10282039642334, 8.734678268432617, 13.366536140441895, 17.998394012451172, 22.630252838134766, 27.262109756469727, 31.893966674804688, 36.52582550048828, 41.157684326171875, 45.78954315185547, 50.4213981628418, 55.05325698852539, 59.685115814208984, 64.31697082519531, 68.9488296508789, 73.5806884765625, 78.2125473022461, 82.84440612792969, 87.47626495361328, 92.10812377929688, 96.73997497558594, 101.37183380126953, 106.00369262695312, 110.63555145263672, 115.26741027832031, 119.8992691040039, 124.5311279296875, 129.16297912597656, 133.7948455810547, 138.42669677734375, 143.05856323242188, 147.69041442871094]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 1.0, 10.0, 9.0, 17.0, 18.0, 18.0, 36.0, 46.0, 54.0, 86.0, 111.0, 145.0, 210.0, 266.0, 415.0, 524.0, 751.0, 1077.0, 1040168.0, 1468.0, 825.0, 606.0, 421.0, 322.0, 250.0, 173.0, 115.0, 98.0, 90.0, 40.0, 28.0, 35.0, 21.0, 31.0, 14.0, 11.0, 9.0, 6.0, 3.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.51396560668945, -49.94153594970703, -48.36910629272461, -46.79667663574219, -45.2242431640625, -43.65181350708008, -42.079383850097656, -40.506954193115234, -38.93452453613281, -37.36209487915039, -35.78966522216797, -34.21723556518555, -32.644805908203125, -31.07237434387207, -29.499942779541016, -27.927513122558594, -26.355083465576172, -24.78265380859375, -23.210224151611328, -21.637792587280273, -20.06536293029785, -18.49293327331543, -16.920501708984375, -15.348072052001953, -13.775642395019531, -12.20321273803711, -10.630782127380371, -9.058351516723633, -7.485921859741211, -5.913491725921631, -4.341061592102051, -2.7686309814453125, -1.196197509765625, 0.3762326240539551, 1.9486627578735352, 3.5210928916931152, 5.093523025512695, 6.665953159332275, 8.238383293151855, 9.810813903808594, 11.383243560791016, 12.955673217773438, 14.528103828430176, 16.100534439086914, 17.672964096069336, 19.245393753051758, 20.817825317382812, 22.390254974365234, 23.962684631347656, 25.535114288330078, 27.1075439453125, 28.679975509643555, 30.252405166625977, 31.8248348236084, 33.39726638793945, 34.969696044921875, 36.5421257019043, 38.11455535888672, 39.68698501586914, 41.25941467285156, 42.83184814453125, 44.40427780151367, 45.976707458496094, 47.549137115478516, 49.12156677246094]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 10.0, 7.0, 23.0, 15.0, 29.0, 114.0, 51461984.0, 800.0, 81.0, 20.0, 7.0, 5.0, 5.0, 3.0, 12.0, 15.0, 3.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5682.0771484375, -5433.32861328125, -5184.580078125, -4935.83154296875, -4687.0830078125, -4438.3349609375, -4189.58642578125, -3940.837890625, -3692.08935546875, -3443.3408203125, -3194.59228515625, -2945.843994140625, -2697.095458984375, -2448.346923828125, -2199.5986328125, -1950.85009765625, -1702.1015625, -1453.35302734375, -1204.6046142578125, -955.8561401367188, -707.107666015625, -458.359130859375, -209.6107177734375, 39.1376953125, 287.88623046875, 536.6347045898438, 785.3831787109375, 1034.131591796875, 1282.880126953125, 1531.628662109375, 1780.3770751953125, 2029.12548828125, 2277.8740234375, 2526.62255859375, 2775.37109375, 3024.119384765625, 3272.867919921875, 3521.616455078125, 3770.36474609375, 4019.11328125, 4267.86181640625, 4516.6103515625, 4765.35888671875, 5014.107421875, 5262.85546875, 5511.6044921875, 5760.3525390625, 6009.10107421875, 6257.849609375, 6506.59814453125, 6755.3466796875, 7004.09521484375, 7252.84375, 7501.591796875, 7750.34033203125, 7999.0888671875, 8247.837890625, 8496.5859375, 8745.3349609375, 8994.0830078125, 9242.83203125, 9491.580078125, 9740.3291015625, 9989.0771484375, 10237.8251953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 11.0, 16.0, 20.0, 29.0, 52.0, 91.0, 114.0, 134.0, 175.0, 267.0, 403.0, 602.0, 860.0, 1377.0, 1846.0, 2876.0, 4367.0, 6669.0, 10650.0, 16990.0, 26923.0, 42149.0, 69493.0, 115294.0, 203214.0, 408416.0, 3882394.0, 803383.0, 291933.0, 156638.0, 92240.0, 55466.0, 34767.0, 21840.0, 14017.0, 8806.0, 5646.0, 3710.0, 2533.0, 1625.0, 1087.0, 713.0, 508.0, 321.0, 224.0, 167.0, 96.0, 84.0, 46.0, 36.0, 36.0, 24.0, 18.0, 16.0, 9.0, 7.0, 5.0], "bins": [-6.2578125, -6.07257080078125, -5.8873291015625, -5.70208740234375, -5.516845703125, -5.33160400390625, -5.1463623046875, -4.96112060546875, -4.77587890625, -4.59063720703125, -4.4053955078125, -4.22015380859375, -4.034912109375, -3.84967041015625, -3.6644287109375, -3.47918701171875, -3.2939453125, -3.10870361328125, -2.9234619140625, -2.73822021484375, -2.552978515625, -2.36773681640625, -2.1824951171875, -1.99725341796875, -1.81201171875, -1.62677001953125, -1.4415283203125, -1.25628662109375, -1.071044921875, -0.88580322265625, -0.7005615234375, -0.51531982421875, -0.330078125, -0.14483642578125, 0.0404052734375, 0.22564697265625, 0.410888671875, 0.59613037109375, 0.7813720703125, 0.96661376953125, 1.15185546875, 1.33709716796875, 1.5223388671875, 1.70758056640625, 1.892822265625, 2.07806396484375, 2.2633056640625, 2.44854736328125, 2.6337890625, 2.81903076171875, 3.0042724609375, 3.18951416015625, 3.374755859375, 3.55999755859375, 3.7452392578125, 3.93048095703125, 4.11572265625, 4.30096435546875, 4.4862060546875, 4.67144775390625, 4.856689453125, 5.04193115234375, 5.2271728515625, 5.41241455078125, 5.59765625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 6.0, 8.0, 7.0, 12.0, 13.0, 19.0, 11.0, 14.0, 25.0, 24.0, 18.0, 25.0, 39.0, 30.0, 30.0, 30.0, 34.0, 44.0, 42.0, 234.0, 739.0, 144.0, 44.0, 48.0, 39.0, 34.0, 38.0, 36.0, 29.0, 25.0, 24.0, 24.0, 17.0, 24.0, 13.0, 17.0, 11.0, 11.0, 11.0, 6.0, 5.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7890625, -14.3011474609375, -13.813232421875, -13.3253173828125, -12.83740234375, -12.3494873046875, -11.861572265625, -11.3736572265625, -10.8857421875, -10.3978271484375, -9.909912109375, -9.4219970703125, -8.93408203125, -8.4461669921875, -7.958251953125, -7.4703369140625, -6.982421875, -6.4945068359375, -6.006591796875, -5.5186767578125, -5.03076171875, -4.5428466796875, -4.054931640625, -3.5670166015625, -3.0791015625, -2.5911865234375, -2.103271484375, -1.6153564453125, -1.12744140625, -0.6395263671875, -0.151611328125, 0.3363037109375, 0.82421875, 1.3121337890625, 1.800048828125, 2.2879638671875, 2.77587890625, 3.2637939453125, 3.751708984375, 4.2396240234375, 4.7275390625, 5.2154541015625, 5.703369140625, 6.1912841796875, 6.67919921875, 7.1671142578125, 7.655029296875, 8.1429443359375, 8.630859375, 9.1187744140625, 9.606689453125, 10.0946044921875, 10.58251953125, 11.0704345703125, 11.558349609375, 12.0462646484375, 12.5341796875, 13.0220947265625, 13.510009765625, 13.9979248046875, 14.48583984375, 14.9737548828125, 15.461669921875, 15.9495849609375, 16.4375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 0.0, 4.0, 7.0, 5.0, 2.0, 8.0, 14.0, 15.0, 19.0, 37.0, 29.0, 40.0, 100.0, 155.0, 298.0, 478.0, 668.0, 1109.0, 1723.0, 2532.0, 3868.0, 5763.0, 9074.0, 13996.0, 22506.0, 35537.0, 59730.0, 100343.0, 177028.0, 373346.0, 3573383.0, 1219278.0, 304073.0, 154571.0, 88719.0, 52740.0, 33014.0, 20662.0, 12823.0, 8126.0, 5490.0, 3458.0, 2318.0, 1524.0, 1072.0, 685.0, 392.0, 240.0, 192.0, 72.0, 66.0, 40.0, 13.0, 14.0, 15.0, 4.0, 8.0, 8.0, 7.0, 3.0, 3.0], "bins": [-8.03125, -7.79425048828125, -7.5572509765625, -7.32025146484375, -7.083251953125, -6.84625244140625, -6.6092529296875, -6.37225341796875, -6.13525390625, -5.89825439453125, -5.6612548828125, -5.42425537109375, -5.187255859375, -4.95025634765625, -4.7132568359375, -4.47625732421875, -4.2392578125, -4.00225830078125, -3.7652587890625, -3.52825927734375, -3.291259765625, -3.05426025390625, -2.8172607421875, -2.58026123046875, -2.34326171875, -2.10626220703125, -1.8692626953125, -1.63226318359375, -1.395263671875, -1.15826416015625, -0.9212646484375, -0.68426513671875, -0.447265625, -0.21026611328125, 0.0267333984375, 0.26373291015625, 0.500732421875, 0.73773193359375, 0.9747314453125, 1.21173095703125, 1.44873046875, 1.68572998046875, 1.9227294921875, 2.15972900390625, 2.396728515625, 2.63372802734375, 2.8707275390625, 3.10772705078125, 3.3447265625, 3.58172607421875, 3.8187255859375, 4.05572509765625, 4.292724609375, 4.52972412109375, 4.7667236328125, 5.00372314453125, 5.24072265625, 5.47772216796875, 5.7147216796875, 5.95172119140625, 6.188720703125, 6.42572021484375, 6.6627197265625, 6.89971923828125, 7.13671875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 7.0, 8.0, 6.0, 7.0, 13.0, 7.0, 12.0, 16.0, 14.0, 23.0, 20.0, 19.0, 27.0, 25.0, 33.0, 30.0, 28.0, 35.0, 47.0, 63.0, 126.0, 520.0, 359.0, 106.0, 62.0, 40.0, 42.0, 38.0, 35.0, 34.0, 19.0, 30.0, 27.0, 18.0, 24.0, 10.0, 14.0, 15.0, 12.0, 9.0, 3.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-11.34375, -11.008544921875, -10.67333984375, -10.338134765625, -10.0029296875, -9.667724609375, -9.33251953125, -8.997314453125, -8.662109375, -8.326904296875, -7.99169921875, -7.656494140625, -7.3212890625, -6.986083984375, -6.65087890625, -6.315673828125, -5.98046875, -5.645263671875, -5.31005859375, -4.974853515625, -4.6396484375, -4.304443359375, -3.96923828125, -3.634033203125, -3.298828125, -2.963623046875, -2.62841796875, -2.293212890625, -1.9580078125, -1.622802734375, -1.28759765625, -0.952392578125, -0.6171875, -0.281982421875, 0.05322265625, 0.388427734375, 0.7236328125, 1.058837890625, 1.39404296875, 1.729248046875, 2.064453125, 2.399658203125, 2.73486328125, 3.070068359375, 3.4052734375, 3.740478515625, 4.07568359375, 4.410888671875, 4.74609375, 5.081298828125, 5.41650390625, 5.751708984375, 6.0869140625, 6.422119140625, 6.75732421875, 7.092529296875, 7.427734375, 7.762939453125, 8.09814453125, 8.433349609375, 8.7685546875, 9.103759765625, 9.43896484375, 9.774169921875, 10.109375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 0.0, 14.0, 9.0, 10.0, 5.0, 6.0, 8.0, 12.0, 28.0, 34.0, 19.0, 30.0, 55.0, 119.0, 118.0, 179.0, 236.0, 305.0, 459.0, 591.0, 865.0, 1301.0, 2166.0, 3391.0, 6715.0, 13395.0, 36966.0, 188125.0, 5921330.0, 71269.0, 21735.0, 9253.0, 4580.0, 2760.0, 1644.0, 1110.0, 743.0, 482.0, 341.0, 293.0, 173.0, 151.0, 84.0, 72.0, 88.0, 65.0, 27.0, 9.0, 4.0, 13.0, 9.0, 13.0, 16.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-27.03125, -26.1376953125, -25.244140625, -24.3505859375, -23.45703125, -22.5634765625, -21.669921875, -20.7763671875, -19.8828125, -18.9892578125, -18.095703125, -17.2021484375, -16.30859375, -15.4150390625, -14.521484375, -13.6279296875, -12.734375, -11.8408203125, -10.947265625, -10.0537109375, -9.16015625, -8.2666015625, -7.373046875, -6.4794921875, -5.5859375, -4.6923828125, -3.798828125, -2.9052734375, -2.01171875, -1.1181640625, -0.224609375, 0.6689453125, 1.5625, 2.4560546875, 3.349609375, 4.2431640625, 5.13671875, 6.0302734375, 6.923828125, 7.8173828125, 8.7109375, 9.6044921875, 10.498046875, 11.3916015625, 12.28515625, 13.1787109375, 14.072265625, 14.9658203125, 15.859375, 16.7529296875, 17.646484375, 18.5400390625, 19.43359375, 20.3271484375, 21.220703125, 22.1142578125, 23.0078125, 23.9013671875, 24.794921875, 25.6884765625, 26.58203125, 27.4755859375, 28.369140625, 29.2626953125, 30.15625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 10.0, 7.0, 20.0, 22.0, 24.0, 21.0, 24.0, 32.0, 28.0, 37.0, 46.0, 50.0, 60.0, 99.0, 183.0, 564.0, 246.0, 121.0, 66.0, 53.0, 40.0, 46.0, 33.0, 29.0, 29.0, 17.0, 24.0, 15.0, 13.0, 14.0, 12.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.095947265625, -8.77783203125, -8.459716796875, -8.1416015625, -7.823486328125, -7.50537109375, -7.187255859375, -6.869140625, -6.551025390625, -6.23291015625, -5.914794921875, -5.5966796875, -5.278564453125, -4.96044921875, -4.642333984375, -4.32421875, -4.006103515625, -3.68798828125, -3.369873046875, -3.0517578125, -2.733642578125, -2.41552734375, -2.097412109375, -1.779296875, -1.461181640625, -1.14306640625, -0.824951171875, -0.5068359375, -0.188720703125, 0.12939453125, 0.447509765625, 0.765625, 1.083740234375, 1.40185546875, 1.719970703125, 2.0380859375, 2.356201171875, 2.67431640625, 2.992431640625, 3.310546875, 3.628662109375, 3.94677734375, 4.264892578125, 4.5830078125, 4.901123046875, 5.21923828125, 5.537353515625, 5.85546875, 6.173583984375, 6.49169921875, 6.809814453125, 7.1279296875, 7.446044921875, 7.76416015625, 8.082275390625, 8.400390625, 8.718505859375, 9.03662109375, 9.354736328125, 9.6728515625, 9.990966796875, 10.30908203125, 10.627197265625, 10.9453125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 11.0, 32.0, 54.0, 204.0, 475.0, 122.0, 57.0, 17.0, 17.0, 6.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.23688507080078, -42.493629455566406, -40.750370025634766, -39.00711441040039, -37.26385498046875, -35.520599365234375, -33.777339935302734, -32.03408432006836, -30.29082489013672, -28.54756736755371, -26.804309844970703, -25.061052322387695, -23.317794799804688, -21.574539184570312, -19.831279754638672, -18.088024139404297, -16.34476661682129, -14.601509094238281, -12.858251571655273, -11.114994049072266, -9.371736526489258, -7.628479957580566, -5.885222434997559, -4.141964912414551, -2.398707389831543, -0.6554499864578247, 1.0878074169158936, 2.8310647010803223, 4.57432222366333, 6.31757926940918, 8.060836791992188, 9.804094314575195, 11.547351837158203, 13.290609359741211, 15.033866882324219, 16.777124404907227, 18.520381927490234, 20.26363754272461, 22.00689697265625, 23.750152587890625, 25.493412017822266, 27.236669540405273, 28.97992706298828, 30.72318458557129, 32.4664421081543, 34.20969772338867, 35.95295715332031, 37.69621276855469, 39.43946838378906, 41.18272399902344, 42.92598342895508, 44.66923904418945, 46.412498474121094, 48.15575408935547, 49.89901351928711, 51.642269134521484, 53.385528564453125, 55.1287841796875, 56.87204360961914, 58.615299224853516, 60.358558654785156, 62.10181427001953, 63.84507369995117, 65.58833312988281, 67.33158874511719]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 7.0, 3.0, 8.0, 6.0, 12.0, 12.0, 13.0, 19.0, 20.0, 33.0, 25.0, 29.0, 42.0, 49.0, 56.0, 49.0, 56.0, 49.0, 54.0, 50.0, 59.0, 45.0, 56.0, 43.0, 42.0, 29.0, 23.0, 21.0, 22.0, 15.0, 13.0, 14.0, 8.0, 9.0, 9.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.537908554077148, -10.996195793151855, -10.454482078552246, -9.912769317626953, -9.37105655670166, -8.829343795776367, -8.287630081176758, -7.745917320251465, -7.204204082489014, -6.6624908447265625, -6.1207780838012695, -5.579064846038818, -5.037351608276367, -4.495638847351074, -3.953925609588623, -3.412212610244751, -2.870499610900879, -2.328786611557007, -1.7870734930038452, -1.2453603744506836, -0.7036473751068115, -0.16193437576293945, 0.3797788619995117, 0.9214918613433838, 1.4632048606872559, 2.004917860031128, 2.546630859375, 3.088344097137451, 3.6300570964813232, 4.171770095825195, 4.7134833335876465, 5.255196571350098, 5.796909332275391, 6.338622570037842, 6.880335330963135, 7.422048568725586, 7.963761329650879, 8.505474090576172, 9.047187805175781, 9.588900566101074, 10.130613327026367, 10.67232608795166, 11.21403980255127, 11.755752563476562, 12.297465324401855, 12.839178085327148, 13.380891799926758, 13.92260456085205, 14.46431827545166, 15.006031036376953, 15.547744750976562, 16.089458465576172, 16.63117027282715, 17.172883987426758, 17.714595794677734, 18.256309509277344, 18.798023223876953, 19.339736938476562, 19.88144874572754, 20.42316246032715, 20.964876174926758, 21.506587982177734, 22.048301696777344, 22.590015411376953, 23.13172721862793]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 10.0, 11.0, 10.0, 13.0, 28.0, 40.0, 55.0, 94.0, 164.0, 247.0, 519.0, 1094.0, 2890.0, 10453.0, 59782.0, 4004244.0, 87639.0, 16498.0, 5361.0, 2170.0, 1108.0, 644.0, 386.0, 245.0, 141.0, 130.0, 63.0, 52.0, 48.0, 34.0, 23.0, 12.0, 18.0, 7.0, 12.0, 6.0, 4.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.040435791015625, -0.038561344146728516, -0.03668689727783203, -0.03481245040893555, -0.03293800354003906, -0.031063556671142578, -0.029189109802246094, -0.02731466293334961, -0.025440216064453125, -0.02356576919555664, -0.021691322326660156, -0.019816875457763672, -0.017942428588867188, -0.016067981719970703, -0.014193534851074219, -0.012319087982177734, -0.01044464111328125, -0.008570194244384766, -0.006695747375488281, -0.004821300506591797, -0.0029468536376953125, -0.0010724067687988281, 0.0008020401000976562, 0.0026764869689941406, 0.004550933837890625, 0.006425380706787109, 0.008299827575683594, 0.010174274444580078, 0.012048721313476562, 0.013923168182373047, 0.01579761505126953, 0.017672061920166016, 0.0195465087890625, 0.021420955657958984, 0.02329540252685547, 0.025169849395751953, 0.027044296264648438, 0.028918743133544922, 0.030793190002441406, 0.03266763687133789, 0.034542083740234375, 0.03641653060913086, 0.038290977478027344, 0.04016542434692383, 0.04203987121582031, 0.0439143180847168, 0.04578876495361328, 0.047663211822509766, 0.04953765869140625, 0.051412105560302734, 0.05328655242919922, 0.0551609992980957, 0.05703544616699219, 0.05890989303588867, 0.060784339904785156, 0.06265878677368164, 0.06453323364257812, 0.06640768051147461, 0.0682821273803711, 0.07015657424926758, 0.07203102111816406, 0.07390546798706055, 0.07577991485595703, 0.07765436172485352, 0.07952880859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 4.0, 8.0, 5.0, 12.0, 19.0, 16.0, 26.0, 748.0, 72.0, 20.0, 15.0, 9.0, 8.0, 10.0, 6.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005268096923828125, -0.005038797855377197, -0.0048094987869262695, -0.004580199718475342, -0.004350900650024414, -0.004121601581573486, -0.0038923025131225586, -0.003663003444671631, -0.003433704376220703, -0.0032044053077697754, -0.0029751062393188477, -0.00274580717086792, -0.002516508102416992, -0.0022872090339660645, -0.0020579099655151367, -0.001828610897064209, -0.0015993118286132812, -0.0013700127601623535, -0.0011407136917114258, -0.000911414623260498, -0.0006821155548095703, -0.0004528164863586426, -0.00022351741790771484, 5.781650543212891e-06, 0.00023508071899414062, 0.00046437978744506836, 0.0006936788558959961, 0.0009229779243469238, 0.0011522769927978516, 0.0013815760612487793, 0.001610875129699707, 0.0018401741981506348, 0.0020694732666015625, 0.0022987723350524902, 0.002528071403503418, 0.0027573704719543457, 0.0029866695404052734, 0.003215968608856201, 0.003445267677307129, 0.0036745667457580566, 0.0039038658142089844, 0.004133164882659912, 0.00436246395111084, 0.004591763019561768, 0.004821062088012695, 0.005050361156463623, 0.005279660224914551, 0.0055089592933654785, 0.005738258361816406, 0.005967557430267334, 0.006196856498718262, 0.0064261555671691895, 0.006655454635620117, 0.006884753704071045, 0.007114052772521973, 0.0073433518409729, 0.007572650909423828, 0.007801949977874756, 0.008031249046325684, 0.008260548114776611, 0.008489847183227539, 0.008719146251678467, 0.008948445320129395, 0.009177744388580322, 0.00940704345703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 8.0, 8.0, 9.0, 7.0, 19.0, 26.0, 27.0, 42.0, 56.0, 93.0, 112.0, 202.0, 286.0, 586.0, 1179.0, 3096.0, 12451.0, 97428.0, 2902825.0, 1100666.0, 61135.0, 9154.0, 2475.0, 1001.0, 532.0, 296.0, 156.0, 133.0, 66.0, 57.0, 35.0, 25.0, 14.0, 24.0, 13.0, 8.0, 11.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053863525390625, -0.052175045013427734, -0.05048656463623047, -0.0487980842590332, -0.04710960388183594, -0.04542112350463867, -0.043732643127441406, -0.04204416275024414, -0.040355682373046875, -0.03866720199584961, -0.036978721618652344, -0.03529024124145508, -0.03360176086425781, -0.03191328048706055, -0.03022480010986328, -0.028536319732666016, -0.02684783935546875, -0.025159358978271484, -0.02347087860107422, -0.021782398223876953, -0.020093917846679688, -0.018405437469482422, -0.016716957092285156, -0.01502847671508789, -0.013339996337890625, -0.01165151596069336, -0.009963035583496094, -0.008274555206298828, -0.0065860748291015625, -0.004897594451904297, -0.0032091140747070312, -0.0015206336975097656, 0.0001678466796875, 0.0018563270568847656, 0.0035448074340820312, 0.005233287811279297, 0.0069217681884765625, 0.008610248565673828, 0.010298728942871094, 0.01198720932006836, 0.013675689697265625, 0.01536417007446289, 0.017052650451660156, 0.018741130828857422, 0.020429611206054688, 0.022118091583251953, 0.02380657196044922, 0.025495052337646484, 0.02718353271484375, 0.028872013092041016, 0.03056049346923828, 0.03224897384643555, 0.03393745422363281, 0.03562593460083008, 0.037314414978027344, 0.03900289535522461, 0.040691375732421875, 0.04237985610961914, 0.044068336486816406, 0.04575681686401367, 0.04744529724121094, 0.0491337776184082, 0.05082225799560547, 0.052510738372802734, 0.05419921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 10.0, 19.0, 19.0, 35.0, 42.0, 52.0, 63.0, 77.0, 90.0, 138.0, 164.0, 228.0, 317.0, 551.0, 791.0, 362.0, 237.0, 200.0, 138.0, 109.0, 105.0, 76.0, 68.0, 43.0, 25.0, 13.0, 19.0, 17.0, 12.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0060882568359375, -0.005864381790161133, -0.005640506744384766, -0.0054166316986083984, -0.005192756652832031, -0.004968881607055664, -0.004745006561279297, -0.00452113151550293, -0.0042972564697265625, -0.004073381423950195, -0.003849506378173828, -0.003625631332397461, -0.0034017562866210938, -0.0031778812408447266, -0.0029540061950683594, -0.002730131149291992, -0.002506256103515625, -0.002282381057739258, -0.0020585060119628906, -0.0018346309661865234, -0.0016107559204101562, -0.001386880874633789, -0.0011630058288574219, -0.0009391307830810547, -0.0007152557373046875, -0.0004913806915283203, -0.0002675056457519531, -4.363059997558594e-05, 0.00018024444580078125, 0.00040411949157714844, 0.0006279945373535156, 0.0008518695831298828, 0.00107574462890625, 0.0012996196746826172, 0.0015234947204589844, 0.0017473697662353516, 0.0019712448120117188, 0.002195119857788086, 0.002418994903564453, 0.0026428699493408203, 0.0028667449951171875, 0.0030906200408935547, 0.003314495086669922, 0.003538370132446289, 0.0037622451782226562, 0.0039861202239990234, 0.004209995269775391, 0.004433870315551758, 0.004657745361328125, 0.004881620407104492, 0.005105495452880859, 0.0053293704986572266, 0.005553245544433594, 0.005777120590209961, 0.006000995635986328, 0.006224870681762695, 0.0064487457275390625, 0.00667262077331543, 0.006896495819091797, 0.007120370864868164, 0.007344245910644531, 0.0075681209564208984, 0.007791996002197266, 0.008015871047973633, 0.00823974609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 8.0, 11.0, 18.0, 43.0, 111.0, 191.0, 287.0, 192.0, 81.0, 33.0, 18.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10753180831670761, -0.10386888682842255, -0.10020596534013748, -0.09654304385185242, -0.09288012981414795, -0.08921720832586288, -0.08555428683757782, -0.08189136534929276, -0.07822844386100769, -0.07456552237272263, -0.07090260088443756, -0.0672396868467331, -0.06357676535844803, -0.059913843870162964, -0.0562509223818779, -0.052588000893592834, -0.04892508685588837, -0.0452621653676033, -0.041599247604608536, -0.03793632611632347, -0.034273408353328705, -0.03061048686504364, -0.026947565376758575, -0.02328464575111866, -0.019621726125478745, -0.01595880649983883, -0.012295885942876339, -0.008632965385913849, -0.004970045760273933, -0.001307126134634018, 0.0023557953536510468, 0.006018714979290962, 0.00968162715435028, 0.013344546779990196, 0.01700746640563011, 0.020670387893915176, 0.024333307519555092, 0.027996227145195007, 0.03165914863348007, 0.03532207012176514, 0.0389849878847599, 0.04264790937304497, 0.046310827136039734, 0.0499737486243248, 0.05363667011260986, 0.05729958787560463, 0.060962509363889694, 0.06462542712688446, 0.06828834861516953, 0.07195127010345459, 0.07561419159173965, 0.07927711308002472, 0.08294002711772919, 0.08660294860601425, 0.09026587009429932, 0.09392879158258438, 0.09759171307086945, 0.10125463455915451, 0.10491755604743958, 0.10858047008514404, 0.11224339157342911, 0.11590631306171417, 0.11956923454999924, 0.1232321560382843, 0.12689507007598877]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 6.0, 2.0, 15.0, 8.0, 13.0, 13.0, 16.0, 24.0, 39.0, 35.0, 37.0, 48.0, 60.0, 60.0, 70.0, 65.0, 70.0, 59.0, 58.0, 39.0, 36.0, 42.0, 42.0, 27.0, 18.0, 22.0, 13.0, 11.0, 10.0, 11.0, 12.0, 11.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03702443838119507, -0.03586341440677643, -0.03470238670706749, -0.03354135900735855, -0.03238033503293991, -0.03121930919587612, -0.030058283358812332, -0.028897257521748543, -0.027736231684684753, -0.026575205847620964, -0.025414180010557175, -0.024253154173493385, -0.023092128336429596, -0.021931102499365807, -0.020770076662302017, -0.019609050825238228, -0.01844802498817444, -0.01728699915111065, -0.01612597331404686, -0.01496494747698307, -0.013803921639919281, -0.012642895802855492, -0.011481869965791702, -0.010320844128727913, -0.009159818291664124, -0.007998792454600334, -0.006837766617536545, -0.005676740780472755, -0.004515714943408966, -0.0033546891063451767, -0.0021936632692813873, -0.001032637432217598, 0.0001283884048461914, 0.0012894142419099808, 0.00245044007897377, 0.0036114659160375595, 0.004772491753101349, 0.005933517590165138, 0.007094543427228928, 0.008255569264292717, 0.009416595101356506, 0.010577620938420296, 0.011738646775484085, 0.012899672612547874, 0.014060698449611664, 0.015221724286675453, 0.016382750123739243, 0.017543775960803032, 0.01870480179786682, 0.01986582763493061, 0.0210268534719944, 0.02218787930905819, 0.02334890514612198, 0.024509930983185768, 0.025670956820249557, 0.026831982657313347, 0.027993008494377136, 0.029154034331440926, 0.030315060168504715, 0.031476087868213654, 0.032637111842632294, 0.033798135817050934, 0.03495916351675987, 0.03612019121646881, 0.03728121519088745]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 9.0, 15.0, 25.0, 29.0, 34.0, 58.0, 82.0, 125.0, 225.0, 378.0, 712.0, 1293.0, 2899.0, 7336.0, 23490.0, 889749.0, 98492.0, 13940.0, 5025.0, 2130.0, 1059.0, 559.0, 314.0, 202.0, 119.0, 61.0, 55.0, 35.0, 32.0, 11.0, 15.0, 8.0, 9.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0792236328125, -0.07656574249267578, -0.07390785217285156, -0.07124996185302734, -0.06859207153320312, -0.0659341812133789, -0.06327629089355469, -0.06061840057373047, -0.05796051025390625, -0.05530261993408203, -0.05264472961425781, -0.049986839294433594, -0.047328948974609375, -0.044671058654785156, -0.04201316833496094, -0.03935527801513672, -0.0366973876953125, -0.03403949737548828, -0.03138160705566406, -0.028723716735839844, -0.026065826416015625, -0.023407936096191406, -0.020750045776367188, -0.01809215545654297, -0.01543426513671875, -0.012776374816894531, -0.010118484497070312, -0.007460594177246094, -0.004802703857421875, -0.0021448135375976562, 0.0005130767822265625, 0.0031709671020507812, 0.005828857421875, 0.008486747741699219, 0.011144638061523438, 0.013802528381347656, 0.016460418701171875, 0.019118309020996094, 0.021776199340820312, 0.02443408966064453, 0.02709197998046875, 0.02974987030029297, 0.03240776062011719, 0.035065650939941406, 0.037723541259765625, 0.040381431579589844, 0.04303932189941406, 0.04569721221923828, 0.0483551025390625, 0.05101299285888672, 0.05367088317871094, 0.056328773498535156, 0.058986663818359375, 0.061644554138183594, 0.06430244445800781, 0.06696033477783203, 0.06961822509765625, 0.07227611541748047, 0.07493400573730469, 0.0775918960571289, 0.08024978637695312, 0.08290767669677734, 0.08556556701660156, 0.08822345733642578, 0.09088134765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 9.0, 10.0, 15.0, 16.0, 45.0, 320.0, 419.0, 82.0, 14.0, 13.0, 5.0, 6.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005199432373046875, -0.004976212978363037, -0.004752993583679199, -0.004529774188995361, -0.0043065547943115234, -0.0040833353996276855, -0.0038601160049438477, -0.0036368966102600098, -0.003413677215576172, -0.003190457820892334, -0.002967238426208496, -0.002744019031524658, -0.0025207996368408203, -0.0022975802421569824, -0.0020743608474731445, -0.0018511414527893066, -0.0016279220581054688, -0.0014047026634216309, -0.001181483268737793, -0.0009582638740539551, -0.0007350444793701172, -0.0005118250846862793, -0.0002886056900024414, -6.538629531860352e-05, 0.00015783309936523438, 0.00038105249404907227, 0.0006042718887329102, 0.000827491283416748, 0.001050710678100586, 0.0012739300727844238, 0.0014971494674682617, 0.0017203688621520996, 0.0019435882568359375, 0.0021668076515197754, 0.0023900270462036133, 0.002613246440887451, 0.002836465835571289, 0.003059685230255127, 0.003282904624938965, 0.0035061240196228027, 0.0037293434143066406, 0.0039525628089904785, 0.004175782203674316, 0.004399001598358154, 0.004622220993041992, 0.00484544038772583, 0.005068659782409668, 0.005291879177093506, 0.005515098571777344, 0.005738317966461182, 0.0059615373611450195, 0.006184756755828857, 0.006407976150512695, 0.006631195545196533, 0.006854414939880371, 0.007077634334564209, 0.007300853729248047, 0.007524073123931885, 0.007747292518615723, 0.00797051191329956, 0.008193731307983398, 0.008416950702667236, 0.008640170097351074, 0.008863389492034912, 0.00908660888671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 10.0, 17.0, 23.0, 27.0, 55.0, 56.0, 66.0, 103.0, 145.0, 231.0, 326.0, 501.0, 746.0, 1241.0, 1975.0, 3963.0, 9406.0, 41704.0, 783538.0, 173137.0, 18110.0, 5924.0, 2812.0, 1624.0, 891.0, 561.0, 381.0, 304.0, 190.0, 154.0, 90.0, 65.0, 46.0, 36.0, 21.0, 18.0, 16.0, 9.0, 8.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08258056640625, -0.08006000518798828, -0.07753944396972656, -0.07501888275146484, -0.07249832153320312, -0.0699777603149414, -0.06745719909667969, -0.06493663787841797, -0.06241607666015625, -0.05989551544189453, -0.05737495422363281, -0.054854393005371094, -0.052333831787109375, -0.049813270568847656, -0.04729270935058594, -0.04477214813232422, -0.0422515869140625, -0.03973102569580078, -0.03721046447753906, -0.034689903259277344, -0.032169342041015625, -0.029648780822753906, -0.027128219604492188, -0.02460765838623047, -0.02208709716796875, -0.01956653594970703, -0.017045974731445312, -0.014525413513183594, -0.012004852294921875, -0.009484291076660156, -0.0069637298583984375, -0.004443168640136719, -0.001922607421875, 0.0005979537963867188, 0.0031185150146484375, 0.005639076232910156, 0.008159637451171875, 0.010680198669433594, 0.013200759887695312, 0.01572132110595703, 0.01824188232421875, 0.02076244354248047, 0.023283004760742188, 0.025803565979003906, 0.028324127197265625, 0.030844688415527344, 0.03336524963378906, 0.03588581085205078, 0.0384063720703125, 0.04092693328857422, 0.04344749450683594, 0.045968055725097656, 0.048488616943359375, 0.051009178161621094, 0.05352973937988281, 0.05605030059814453, 0.05857086181640625, 0.06109142303466797, 0.06361198425292969, 0.0661325454711914, 0.06865310668945312, 0.07117366790771484, 0.07369422912597656, 0.07621479034423828, 0.0787353515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 6.0, 8.0, 3.0, 12.0, 9.0, 13.0, 16.0, 21.0, 11.0, 8.0, 15.0, 36.0, 26.0, 28.0, 30.0, 31.0, 27.0, 29.0, 31.0, 38.0, 29.0, 37.0, 54.0, 42.0, 35.0, 46.0, 33.0, 48.0, 28.0, 33.0, 28.0, 21.0, 25.0, 22.0, 17.0, 18.0, 24.0, 11.0, 13.0, 11.0, 7.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.02099609375, -0.0203704833984375, -0.019744873046875, -0.0191192626953125, -0.01849365234375, -0.0178680419921875, -0.017242431640625, -0.0166168212890625, -0.0159912109375, -0.0153656005859375, -0.014739990234375, -0.0141143798828125, -0.01348876953125, -0.0128631591796875, -0.012237548828125, -0.0116119384765625, -0.010986328125, -0.0103607177734375, -0.009735107421875, -0.0091094970703125, -0.00848388671875, -0.0078582763671875, -0.007232666015625, -0.0066070556640625, -0.0059814453125, -0.0053558349609375, -0.004730224609375, -0.0041046142578125, -0.00347900390625, -0.0028533935546875, -0.002227783203125, -0.0016021728515625, -0.0009765625, -0.0003509521484375, 0.000274658203125, 0.0009002685546875, 0.00152587890625, 0.0021514892578125, 0.002777099609375, 0.0034027099609375, 0.0040283203125, 0.0046539306640625, 0.005279541015625, 0.0059051513671875, 0.00653076171875, 0.0071563720703125, 0.007781982421875, 0.0084075927734375, 0.009033203125, 0.0096588134765625, 0.010284423828125, 0.0109100341796875, 0.01153564453125, 0.0121612548828125, 0.012786865234375, 0.0134124755859375, 0.0140380859375, 0.0146636962890625, 0.015289306640625, 0.0159149169921875, 0.01654052734375, 0.0171661376953125, 0.017791748046875, 0.0184173583984375, 0.01904296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 5.0, 9.0, 9.0, 9.0, 20.0, 26.0, 29.0, 61.0, 73.0, 150.0, 213.0, 449.0, 943.0, 2473.0, 9407.0, 190875.0, 822429.0, 15640.0, 3273.0, 1178.0, 528.0, 276.0, 162.0, 104.0, 55.0, 53.0, 23.0, 20.0, 19.0, 8.0, 5.0, 2.0, 3.0, 5.0, 5.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0732421875, -0.07081127166748047, -0.06838035583496094, -0.0659494400024414, -0.06351852416992188, -0.061087608337402344, -0.05865669250488281, -0.05622577667236328, -0.05379486083984375, -0.05136394500732422, -0.04893302917480469, -0.046502113342285156, -0.044071197509765625, -0.041640281677246094, -0.03920936584472656, -0.03677845001220703, -0.0343475341796875, -0.03191661834716797, -0.029485702514648438, -0.027054786682128906, -0.024623870849609375, -0.022192955017089844, -0.019762039184570312, -0.01733112335205078, -0.01490020751953125, -0.012469291687011719, -0.010038375854492188, -0.007607460021972656, -0.005176544189453125, -0.0027456283569335938, -0.0003147125244140625, 0.0021162033081054688, 0.004547119140625, 0.006978034973144531, 0.009408950805664062, 0.011839866638183594, 0.014270782470703125, 0.016701698303222656, 0.019132614135742188, 0.02156352996826172, 0.02399444580078125, 0.02642536163330078, 0.028856277465820312, 0.031287193298339844, 0.033718109130859375, 0.036149024963378906, 0.03857994079589844, 0.04101085662841797, 0.0434417724609375, 0.04587268829345703, 0.04830360412597656, 0.050734519958496094, 0.053165435791015625, 0.055596351623535156, 0.05802726745605469, 0.06045818328857422, 0.06288909912109375, 0.06532001495361328, 0.06775093078613281, 0.07018184661865234, 0.07261276245117188, 0.0750436782836914, 0.07747459411621094, 0.07990550994873047, 0.08233642578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 9.0, 3.0, 6.0, 6.0, 9.0, 18.0, 24.0, 20.0, 39.0, 39.0, 55.0, 78.0, 88.0, 132.0, 112.0, 85.0, 59.0, 52.0, 48.0, 27.0, 24.0, 12.0, 14.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.008676528930664e-05, -1.9313767552375793e-05, -1.8540769815444946e-05, -1.77677720785141e-05, -1.6994774341583252e-05, -1.6221776604652405e-05, -1.5448778867721558e-05, -1.467578113079071e-05, -1.3902783393859863e-05, -1.3129785656929016e-05, -1.2356787919998169e-05, -1.1583790183067322e-05, -1.0810792446136475e-05, -1.0037794709205627e-05, -9.26479697227478e-06, -8.491799235343933e-06, -7.718801498413086e-06, -6.945803761482239e-06, -6.172806024551392e-06, -5.3998082876205444e-06, -4.626810550689697e-06, -3.85381281375885e-06, -3.080815076828003e-06, -2.3078173398971558e-06, -1.5348196029663086e-06, -7.618218660354614e-07, 1.1175870895385742e-08, 7.841736078262329e-07, 1.55717134475708e-06, 2.3301690816879272e-06, 3.1031668186187744e-06, 3.876164555549622e-06, 4.649162292480469e-06, 5.422160029411316e-06, 6.195157766342163e-06, 6.96815550327301e-06, 7.741153240203857e-06, 8.514150977134705e-06, 9.287148714065552e-06, 1.0060146450996399e-05, 1.0833144187927246e-05, 1.1606141924858093e-05, 1.237913966178894e-05, 1.3152137398719788e-05, 1.3925135135650635e-05, 1.4698132872581482e-05, 1.547113060951233e-05, 1.6244128346443176e-05, 1.7017126083374023e-05, 1.779012382030487e-05, 1.8563121557235718e-05, 1.9336119294166565e-05, 2.0109117031097412e-05, 2.088211476802826e-05, 2.1655112504959106e-05, 2.2428110241889954e-05, 2.32011079788208e-05, 2.3974105715751648e-05, 2.4747103452682495e-05, 2.5520101189613342e-05, 2.629309892654419e-05, 2.7066096663475037e-05, 2.7839094400405884e-05, 2.861209213733673e-05, 2.9385089874267578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 26.0, 43.0, 51.0, 46.0, 79.0, 187.0, 333.0, 624.0, 1407.0, 4552.0, 32757.0, 953285.0, 46773.0, 5229.0, 1639.0, 655.0, 296.0, 195.0, 142.0, 65.0, 37.0, 20.0, 19.0, 10.0, 9.0, 16.0, 5.0, 7.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.11658191680908203, -0.11310768127441406, -0.1096334457397461, -0.10615921020507812, -0.10268497467041016, -0.09921073913574219, -0.09573650360107422, -0.09226226806640625, -0.08878803253173828, -0.08531379699707031, -0.08183956146240234, -0.07836532592773438, -0.0748910903930664, -0.07141685485839844, -0.06794261932373047, -0.0644683837890625, -0.06099414825439453, -0.05751991271972656, -0.054045677185058594, -0.050571441650390625, -0.047097206115722656, -0.04362297058105469, -0.04014873504638672, -0.03667449951171875, -0.03320026397705078, -0.029726028442382812, -0.026251792907714844, -0.022777557373046875, -0.019303321838378906, -0.015829086303710938, -0.012354850769042969, -0.008880615234375, -0.005406379699707031, -0.0019321441650390625, 0.0015420913696289062, 0.005016326904296875, 0.008490562438964844, 0.011964797973632812, 0.015439033508300781, 0.01891326904296875, 0.02238750457763672, 0.025861740112304688, 0.029335975646972656, 0.032810211181640625, 0.036284446716308594, 0.03975868225097656, 0.04323291778564453, 0.0467071533203125, 0.05018138885498047, 0.05365562438964844, 0.057129859924316406, 0.060604095458984375, 0.06407833099365234, 0.06755256652832031, 0.07102680206298828, 0.07450103759765625, 0.07797527313232422, 0.08144950866699219, 0.08492374420166016, 0.08839797973632812, 0.0918722152709961, 0.09534645080566406, 0.09882068634033203, 0.102294921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 6.0, 7.0, 11.0, 13.0, 18.0, 37.0, 38.0, 74.0, 108.0, 257.0, 192.0, 72.0, 38.0, 29.0, 22.0, 23.0, 8.0, 10.0, 6.0, 4.0, 5.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039306640625, -0.03783988952636719, -0.036373138427734375, -0.03490638732910156, -0.03343963623046875, -0.03197288513183594, -0.030506134033203125, -0.029039382934570312, -0.0275726318359375, -0.026105880737304688, -0.024639129638671875, -0.023172378540039062, -0.02170562744140625, -0.020238876342773438, -0.018772125244140625, -0.017305374145507812, -0.015838623046875, -0.014371871948242188, -0.012905120849609375, -0.011438369750976562, -0.00997161865234375, -0.008504867553710938, -0.007038116455078125, -0.0055713653564453125, -0.0041046142578125, -0.0026378631591796875, -0.001171112060546875, 0.0002956390380859375, 0.00176239013671875, 0.0032291412353515625, 0.004695892333984375, 0.0061626434326171875, 0.00762939453125, 0.009096145629882812, 0.010562896728515625, 0.012029647827148438, 0.01349639892578125, 0.014963150024414062, 0.016429901123046875, 0.017896652221679688, 0.0193634033203125, 0.020830154418945312, 0.022296905517578125, 0.023763656616210938, 0.02523040771484375, 0.026697158813476562, 0.028163909912109375, 0.029630661010742188, 0.031097412109375, 0.03256416320800781, 0.034030914306640625, 0.03549766540527344, 0.03696441650390625, 0.03843116760253906, 0.039897918701171875, 0.04136466979980469, 0.0428314208984375, 0.04429817199707031, 0.045764923095703125, 0.04723167419433594, 0.04869842529296875, 0.05016517639160156, 0.051631927490234375, 0.05309867858886719, 0.0545654296875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 12.0, 30.0, 103.0, 676.0, 125.0, 25.0, 11.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3106211423873901, -1.2715755701065063, -1.232529878616333, -1.1934843063354492, -1.1544386148452759, -1.115393042564392, -1.0763473510742188, -1.037301778793335, -0.9982561469078064, -0.9592105150222778, -0.9201648831367493, -0.8811192512512207, -0.8420736789703369, -0.8030279874801636, -0.7639824151992798, -0.7249367833137512, -0.6858911514282227, -0.6468455195426941, -0.6077998876571655, -0.568754255771637, -0.5297086238861084, -0.4906630218029022, -0.45161741971969604, -0.4125717878341675, -0.3735261559486389, -0.33448052406311035, -0.2954348921775818, -0.2563892900943756, -0.21734365820884705, -0.17829802632331848, -0.1392524093389511, -0.10020679235458374, -0.06116127967834473, -0.02211565524339676, 0.01692996919155121, 0.055975593626499176, 0.09502121806144714, 0.1340668499469757, 0.17311246693134308, 0.21215808391571045, 0.251203715801239, 0.2902493476867676, 0.32929497957229614, 0.3683405816555023, 0.4073862135410309, 0.44643184542655945, 0.4854774475097656, 0.5245230793952942, 0.5635687112808228, 0.6026143431663513, 0.6416599750518799, 0.6807056069374084, 0.719751238822937, 0.7587968111038208, 0.7978424429893494, 0.8368880748748779, 0.8759337067604065, 0.9149793386459351, 0.9540249705314636, 0.9930706024169922, 1.032116174697876, 1.0711618661880493, 1.110207438468933, 1.1492531299591064, 1.1882987022399902]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 0.0, 4.0, 5.0, 7.0, 8.0, 12.0, 22.0, 17.0, 38.0, 52.0, 81.0, 87.0, 150.0, 131.0, 99.0, 80.0, 67.0, 47.0, 15.0, 18.0, 15.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425875186920166, -0.41289544105529785, -0.3999156951904297, -0.3869359493255615, -0.37395623326301575, -0.3609764873981476, -0.3479967415332794, -0.33501699566841125, -0.3220372796058655, -0.3090575337409973, -0.29607778787612915, -0.283098042011261, -0.2701183259487152, -0.25713858008384705, -0.24415883421897888, -0.23117908835411072, -0.21819934248924255, -0.2052195966243744, -0.19223986566066742, -0.17926011979579926, -0.16628038883209229, -0.15330064296722412, -0.14032089710235596, -0.1273411512374878, -0.11436142027378082, -0.10138168185949326, -0.08840194344520569, -0.07542219758033752, -0.06244245916604996, -0.04946272075176239, -0.036482974886894226, -0.02350323647260666, -0.010523498058319092, 0.0024562422186136246, 0.015435982495546341, 0.028415724635124207, 0.041395463049411774, 0.05437520146369934, 0.0673549473285675, 0.08033468574285507, 0.09331442415714264, 0.1062941625714302, 0.11927390098571777, 0.13225364685058594, 0.1452333927154541, 0.15821312367916107, 0.17119286954402924, 0.1841726005077362, 0.19715234637260437, 0.21013209223747253, 0.2231118232011795, 0.23609156906604767, 0.24907130002975464, 0.2620510458946228, 0.27503079175949097, 0.28801053762435913, 0.3009902834892273, 0.31397002935409546, 0.3269497752189636, 0.3399295210838318, 0.35290923714637756, 0.3658889830112457, 0.3788687288761139, 0.39184847474098206, 0.40482819080352783]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 10.0, 11.0, 17.0, 25.0, 37.0, 92.0, 730.0, 4163539.0, 28941.0, 625.0, 113.0, 36.0, 24.0, 21.0, 11.0, 14.0, 5.0, 7.0, 4.0, 0.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.7183837890625, -3.530517578125, -3.3426513671875, -3.15478515625, -2.9669189453125, -2.779052734375, -2.5911865234375, -2.4033203125, -2.2154541015625, -2.027587890625, -1.8397216796875, -1.65185546875, -1.4639892578125, -1.276123046875, -1.0882568359375, -0.900390625, -0.7125244140625, -0.524658203125, -0.3367919921875, -0.14892578125, 0.0389404296875, 0.226806640625, 0.4146728515625, 0.6025390625, 0.7904052734375, 0.978271484375, 1.1661376953125, 1.35400390625, 1.5418701171875, 1.729736328125, 1.9176025390625, 2.10546875, 2.2933349609375, 2.481201171875, 2.6690673828125, 2.85693359375, 3.0447998046875, 3.232666015625, 3.4205322265625, 3.6083984375, 3.7962646484375, 3.984130859375, 4.1719970703125, 4.35986328125, 4.5477294921875, 4.735595703125, 4.9234619140625, 5.111328125, 5.2991943359375, 5.487060546875, 5.6749267578125, 5.86279296875, 6.0506591796875, 6.238525390625, 6.4263916015625, 6.6142578125, 6.8021240234375, 6.989990234375, 7.1778564453125, 7.36572265625, 7.5535888671875, 7.741455078125, 7.9293212890625, 8.1171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 9.0, 15.0, 11.0, 25.0, 92.0, 170.0, 334.0, 168.0, 72.0, 29.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 11.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029754638671875, -0.0028154850006103516, -0.002655506134033203, -0.0024955272674560547, -0.0023355484008789062, -0.002175569534301758, -0.0020155906677246094, -0.001855611801147461, -0.0016956329345703125, -0.001535654067993164, -0.0013756752014160156, -0.0012156963348388672, -0.0010557174682617188, -0.0008957386016845703, -0.0007357597351074219, -0.0005757808685302734, -0.000415802001953125, -0.00025582313537597656, -9.584426879882812e-05, 6.413459777832031e-05, 0.00022411346435546875, 0.0003840923309326172, 0.0005440711975097656, 0.0007040500640869141, 0.0008640289306640625, 0.001024007797241211, 0.0011839866638183594, 0.0013439655303955078, 0.0015039443969726562, 0.0016639232635498047, 0.0018239021301269531, 0.0019838809967041016, 0.00214385986328125, 0.0023038387298583984, 0.002463817596435547, 0.0026237964630126953, 0.0027837753295898438, 0.002943754196166992, 0.0031037330627441406, 0.003263711929321289, 0.0034236907958984375, 0.003583669662475586, 0.0037436485290527344, 0.003903627395629883, 0.004063606262207031, 0.00422358512878418, 0.004383563995361328, 0.0045435428619384766, 0.004703521728515625, 0.0048635005950927734, 0.005023479461669922, 0.00518345832824707, 0.005343437194824219, 0.005503416061401367, 0.005663394927978516, 0.005823373794555664, 0.0059833526611328125, 0.006143331527709961, 0.006303310394287109, 0.006463289260864258, 0.006623268127441406, 0.006783246994018555, 0.006943225860595703, 0.0071032047271728516, 0.00726318359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 11.0, 11.0, 16.0, 20.0, 34.0, 40.0, 54.0, 98.0, 107.0, 145.0, 170.0, 243.0, 557.0, 112665.0, 4079097.0, 538.0, 187.0, 111.0, 64.0, 39.0, 26.0, 18.0, 9.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.57489013671875, -1.5374755859375, -1.50006103515625, -1.462646484375, -1.42523193359375, -1.3878173828125, -1.35040283203125, -1.31298828125, -1.27557373046875, -1.2381591796875, -1.20074462890625, -1.163330078125, -1.12591552734375, -1.0885009765625, -1.05108642578125, -1.013671875, -0.97625732421875, -0.9388427734375, -0.90142822265625, -0.864013671875, -0.82659912109375, -0.7891845703125, -0.75177001953125, -0.71435546875, -0.67694091796875, -0.6395263671875, -0.60211181640625, -0.564697265625, -0.52728271484375, -0.4898681640625, -0.45245361328125, -0.4150390625, -0.37762451171875, -0.3402099609375, -0.30279541015625, -0.265380859375, -0.22796630859375, -0.1905517578125, -0.15313720703125, -0.11572265625, -0.07830810546875, -0.0408935546875, -0.00347900390625, 0.033935546875, 0.07135009765625, 0.1087646484375, 0.14617919921875, 0.18359375, 0.22100830078125, 0.2584228515625, 0.29583740234375, 0.333251953125, 0.37066650390625, 0.4080810546875, 0.44549560546875, 0.48291015625, 0.52032470703125, 0.5577392578125, 0.59515380859375, 0.632568359375, 0.66998291015625, 0.7073974609375, 0.74481201171875, 0.7822265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 15.0, 18.0, 21.0, 23.0, 34.0, 63.0, 74.0, 101.0, 121.0, 172.0, 202.0, 276.0, 335.0, 1045.0, 614.0, 334.0, 212.0, 120.0, 97.0, 60.0, 32.0, 31.0, 17.0, 14.0, 11.0, 9.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01212310791015625, -0.011834144592285156, -0.011545181274414062, -0.011256217956542969, -0.010967254638671875, -0.010678291320800781, -0.010389328002929688, -0.010100364685058594, -0.0098114013671875, -0.009522438049316406, -0.009233474731445312, -0.008944511413574219, -0.008655548095703125, -0.008366584777832031, -0.008077621459960938, -0.007788658142089844, -0.00749969482421875, -0.007210731506347656, -0.0069217681884765625, -0.006632804870605469, -0.006343841552734375, -0.006054878234863281, -0.0057659149169921875, -0.005476951599121094, -0.00518798828125, -0.004899024963378906, -0.0046100616455078125, -0.004321098327636719, -0.004032135009765625, -0.0037431716918945312, -0.0034542083740234375, -0.0031652450561523438, -0.00287628173828125, -0.0025873184204101562, -0.0022983551025390625, -0.0020093917846679688, -0.001720428466796875, -0.0014314651489257812, -0.0011425018310546875, -0.0008535385131835938, -0.0005645751953125, -0.00027561187744140625, 1.33514404296875e-05, 0.00030231475830078125, 0.000591278076171875, 0.0008802413940429688, 0.0011692047119140625, 0.0014581680297851562, 0.00174713134765625, 0.0020360946655273438, 0.0023250579833984375, 0.0026140213012695312, 0.002902984619140625, 0.0031919479370117188, 0.0034809112548828125, 0.0037698745727539062, 0.004058837890625, 0.004347801208496094, 0.0046367645263671875, 0.004925727844238281, 0.005214691162109375, 0.005503654479980469, 0.0057926177978515625, 0.006081581115722656, 0.00637054443359375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 10.0, 87.0, 921.0, 4.0], "bins": [-8.81961727142334, -8.678313255310059, -8.537010192871094, -8.395706176757812, -8.254403114318848, -8.113099098205566, -7.971795558929443, -7.83049201965332, -7.689188003540039, -7.547884464263916, -7.406580924987793, -7.265276908874512, -7.123973369598389, -6.982669830322266, -6.841366291046143, -6.7000627517700195, -6.5587592124938965, -6.417455673217773, -6.27615213394165, -6.134848117828369, -5.993544578552246, -5.852241039276123, -5.7109375, -5.569633960723877, -5.428330421447754, -5.287026882171631, -5.145723342895508, -5.004419326782227, -4.8631157875061035, -4.7218122482299805, -4.580508708953857, -4.439205169677734, -4.297901153564453, -4.15659761428833, -4.015294075012207, -3.873990297317505, -3.7326865196228027, -3.5913829803466797, -3.4500794410705566, -3.3087759017944336, -3.1674721240997314, -3.0261685848236084, -2.8848648071289062, -2.743561267852783, -2.60225772857666, -2.460953950881958, -2.319650411605835, -2.178346633911133, -2.0370430946350098, -1.8957394361495972, -1.7544357776641846, -1.6131322383880615, -1.471828579902649, -1.3305249214172363, -1.1892213821411133, -1.0479177236557007, -0.9066140651702881, -0.7653104066848755, -0.6240068078041077, -0.48270317912101746, -0.34139955043792725, -0.20009589195251465, -0.058792293071746826, 0.082511305809021, 0.22381499409675598]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 11.0, 17.0, 21.0, 41.0, 79.0, 104.0, 148.0, 131.0, 139.0, 118.0, 64.0, 46.0, 44.0, 21.0, 9.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5828588604927063, -0.5710079669952393, -0.5591570734977722, -0.54730623960495, -0.5354553461074829, -0.5236044526100159, -0.5117535591125488, -0.4999026656150818, -0.48805180191993713, -0.4762009084224701, -0.46435004472732544, -0.4524991512298584, -0.44064825773239136, -0.4287973940372467, -0.41694650053977966, -0.405095636844635, -0.39324474334716797, -0.3813938498497009, -0.3695429861545563, -0.35769209265708923, -0.3458412289619446, -0.33399033546447754, -0.3221394419670105, -0.31028854846954346, -0.2984376847743988, -0.28658679127693176, -0.2747359275817871, -0.26288503408432007, -0.251034140586853, -0.23918327689170837, -0.22733238339424133, -0.21548150479793549, -0.20363062620162964, -0.1917797476053238, -0.17992886900901794, -0.1680779755115509, -0.15622709691524506, -0.1443762183189392, -0.13252532482147217, -0.12067444622516632, -0.10882356762886047, -0.09697268903255463, -0.08512180298566818, -0.07327091693878174, -0.06142003834247589, -0.049569156020879745, -0.0377182736992836, -0.025867387652397156, -0.014016509056091309, -0.002165626734495163, 0.009685255587100983, 0.02153613790869713, 0.033387020230293274, 0.04523790255188942, 0.057088784873485565, 0.06893967092037201, 0.08079054951667786, 0.0926414281129837, 0.10449231415987015, 0.11634320020675659, 0.12819407880306244, 0.1400449573993683, 0.15189585089683533, 0.16374672949314117, 0.17559760808944702]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 7.0, 8.0, 6.0, 8.0, 12.0, 17.0, 9.0, 24.0, 39.0, 54.0, 54.0, 84.0, 97.0, 136.0, 184.0, 229.0, 313.0, 422.0, 583.0, 799.0, 1074.0, 1546.0, 2178.0, 3218.0, 4867.0, 7650.0, 13686.0, 31885.0, 145381.0, 624869.0, 140288.0, 31434.0, 13883.0, 7801.0, 4812.0, 3159.0, 2176.0, 1454.0, 1102.0, 813.0, 541.0, 415.0, 301.0, 234.0, 196.0, 135.0, 102.0, 81.0, 40.0, 49.0, 26.0, 29.0, 13.0, 9.0, 13.0, 5.0, 6.0, 5.0, 1.0, 3.0, 3.0], "bins": [-0.037353515625, -0.036203861236572266, -0.03505420684814453, -0.0339045524597168, -0.03275489807128906, -0.03160524368286133, -0.030455589294433594, -0.02930593490600586, -0.028156280517578125, -0.02700662612915039, -0.025856971740722656, -0.024707317352294922, -0.023557662963867188, -0.022408008575439453, -0.02125835418701172, -0.020108699798583984, -0.01895904541015625, -0.017809391021728516, -0.01665973663330078, -0.015510082244873047, -0.014360427856445312, -0.013210773468017578, -0.012061119079589844, -0.01091146469116211, -0.009761810302734375, -0.00861215591430664, -0.007462501525878906, -0.006312847137451172, -0.0051631927490234375, -0.004013538360595703, -0.0028638839721679688, -0.0017142295837402344, -0.0005645751953125, 0.0005850791931152344, 0.0017347335815429688, 0.002884387969970703, 0.0040340423583984375, 0.005183696746826172, 0.006333351135253906, 0.007483005523681641, 0.008632659912109375, 0.00978231430053711, 0.010931968688964844, 0.012081623077392578, 0.013231277465820312, 0.014380931854248047, 0.015530586242675781, 0.016680240631103516, 0.01782989501953125, 0.018979549407958984, 0.02012920379638672, 0.021278858184814453, 0.022428512573242188, 0.023578166961669922, 0.024727821350097656, 0.02587747573852539, 0.027027130126953125, 0.02817678451538086, 0.029326438903808594, 0.030476093292236328, 0.03162574768066406, 0.0327754020690918, 0.03392505645751953, 0.035074710845947266, 0.036224365234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 10.0, 8.0, 12.0, 15.0, 10.0, 23.0, 43.0, 69.0, 75.0, 110.0, 153.0, 123.0, 102.0, 57.0, 56.0, 33.0, 27.0, 13.0, 4.0, 7.0, 9.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.003570556640625, -0.003467947244644165, -0.00336533784866333, -0.003262728452682495, -0.00316011905670166, -0.003057509660720825, -0.0029549002647399902, -0.0028522908687591553, -0.0027496814727783203, -0.0026470720767974854, -0.0025444626808166504, -0.0024418532848358154, -0.0023392438888549805, -0.0022366344928741455, -0.0021340250968933105, -0.0020314157009124756, -0.0019288063049316406, -0.0018261969089508057, -0.0017235875129699707, -0.0016209781169891357, -0.0015183687210083008, -0.0014157593250274658, -0.0013131499290466309, -0.001210540533065796, -0.001107931137084961, -0.001005321741104126, -0.000902712345123291, -0.0008001029491424561, -0.0006974935531616211, -0.0005948841571807861, -0.0004922747611999512, -0.0003896653652191162, -0.00028705596923828125, -0.0001844465732574463, -8.183717727661133e-05, 2.0772218704223633e-05, 0.0001233816146850586, 0.00022599101066589355, 0.0003286004066467285, 0.0004312098026275635, 0.0005338191986083984, 0.0006364285945892334, 0.0007390379905700684, 0.0008416473865509033, 0.0009442567825317383, 0.0010468661785125732, 0.0011494755744934082, 0.0012520849704742432, 0.0013546943664550781, 0.001457303762435913, 0.001559913158416748, 0.001662522554397583, 0.001765131950378418, 0.001867741346359253, 0.001970350742340088, 0.002072960138320923, 0.002175569534301758, 0.0022781789302825928, 0.0023807883262634277, 0.0024833977222442627, 0.0025860071182250977, 0.0026886165142059326, 0.0027912259101867676, 0.0028938353061676025, 0.0029964447021484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 10.0, 7.0, 8.0, 9.0, 13.0, 13.0, 17.0, 6.0, 24.0, 20.0, 22.0, 21.0, 37.0, 51.0, 44.0, 107.0, 450.0, 3212.0, 81281.0, 945066.0, 16100.0, 1410.0, 215.0, 83.0, 40.0, 36.0, 31.0, 29.0, 25.0, 14.0, 21.0, 21.0, 17.0, 14.0, 9.0, 9.0, 6.0, 12.0, 6.0, 7.0, 10.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.13525390625, -0.13106727600097656, -0.12688064575195312, -0.12269401550292969, -0.11850738525390625, -0.11432075500488281, -0.11013412475585938, -0.10594749450683594, -0.1017608642578125, -0.09757423400878906, -0.09338760375976562, -0.08920097351074219, -0.08501434326171875, -0.08082771301269531, -0.07664108276367188, -0.07245445251464844, -0.068267822265625, -0.06408119201660156, -0.059894561767578125, -0.05570793151855469, -0.05152130126953125, -0.04733467102050781, -0.043148040771484375, -0.03896141052246094, -0.0347747802734375, -0.030588150024414062, -0.026401519775390625, -0.022214889526367188, -0.01802825927734375, -0.013841629028320312, -0.009654998779296875, -0.0054683685302734375, -0.00128173828125, 0.0029048919677734375, 0.007091522216796875, 0.011278152465820312, 0.01546478271484375, 0.019651412963867188, 0.023838043212890625, 0.028024673461914062, 0.0322113037109375, 0.03639793395996094, 0.040584564208984375, 0.04477119445800781, 0.04895782470703125, 0.05314445495605469, 0.057331085205078125, 0.06151771545410156, 0.065704345703125, 0.06989097595214844, 0.07407760620117188, 0.07826423645019531, 0.08245086669921875, 0.08663749694824219, 0.09082412719726562, 0.09501075744628906, 0.0991973876953125, 0.10338401794433594, 0.10757064819335938, 0.11175727844238281, 0.11594390869140625, 0.12013053894042969, 0.12431716918945312, 0.12850379943847656, 0.1326904296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 1.0, 5.0, 11.0, 7.0, 15.0, 12.0, 13.0, 20.0, 16.0, 18.0, 23.0, 25.0, 37.0, 35.0, 42.0, 38.0, 33.0, 29.0, 44.0, 45.0, 47.0, 38.0, 39.0, 37.0, 45.0, 46.0, 30.0, 43.0, 25.0, 23.0, 19.0, 20.0, 15.0, 21.0, 11.0, 13.0, 15.0, 12.0, 7.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01187896728515625, -0.011500358581542969, -0.011121749877929688, -0.010743141174316406, -0.010364532470703125, -0.009985923767089844, -0.009607315063476562, -0.009228706359863281, -0.00885009765625, -0.008471488952636719, -0.008092880249023438, -0.007714271545410156, -0.007335662841796875, -0.006957054138183594, -0.0065784454345703125, -0.006199836730957031, -0.00582122802734375, -0.005442619323730469, -0.0050640106201171875, -0.004685401916503906, -0.004306793212890625, -0.003928184509277344, -0.0035495758056640625, -0.0031709671020507812, -0.0027923583984375, -0.0024137496948242188, -0.0020351409912109375, -0.0016565322875976562, -0.001277923583984375, -0.0008993148803710938, -0.0005207061767578125, -0.00014209747314453125, 0.00023651123046875, 0.0006151199340820312, 0.0009937286376953125, 0.0013723373413085938, 0.001750946044921875, 0.0021295547485351562, 0.0025081634521484375, 0.0028867721557617188, 0.003265380859375, 0.0036439895629882812, 0.0040225982666015625, 0.004401206970214844, 0.004779815673828125, 0.005158424377441406, 0.0055370330810546875, 0.005915641784667969, 0.00629425048828125, 0.006672859191894531, 0.0070514678955078125, 0.007430076599121094, 0.007808685302734375, 0.008187294006347656, 0.008565902709960938, 0.008944511413574219, 0.0093231201171875, 0.009701728820800781, 0.010080337524414062, 0.010458946228027344, 0.010837554931640625, 0.011216163635253906, 0.011594772338867188, 0.011973381042480469, 0.01235198974609375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 10.0, 23.0, 36.0, 189.0, 1031.0, 45965.0, 999084.0, 1810.0, 261.0, 49.0, 23.0, 15.0, 7.0, 4.0, 1.0, 1.0, 2.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30224609375, -0.2918663024902344, -0.28148651123046875, -0.2711067199707031, -0.2607269287109375, -0.2503471374511719, -0.23996734619140625, -0.22958755493164062, -0.219207763671875, -0.20882797241210938, -0.19844818115234375, -0.18806838989257812, -0.1776885986328125, -0.16730880737304688, -0.15692901611328125, -0.14654922485351562, -0.13616943359375, -0.12578964233398438, -0.11540985107421875, -0.10503005981445312, -0.0946502685546875, -0.08427047729492188, -0.07389068603515625, -0.06351089477539062, -0.053131103515625, -0.042751312255859375, -0.03237152099609375, -0.021991729736328125, -0.0116119384765625, -0.001232147216796875, 0.00914764404296875, 0.019527435302734375, 0.0299072265625, 0.040287017822265625, 0.05066680908203125, 0.061046600341796875, 0.0714263916015625, 0.08180618286132812, 0.09218597412109375, 0.10256576538085938, 0.112945556640625, 0.12332534790039062, 0.13370513916015625, 0.14408493041992188, 0.1544647216796875, 0.16484451293945312, 0.17522430419921875, 0.18560409545898438, 0.19598388671875, 0.20636367797851562, 0.21674346923828125, 0.22712326049804688, 0.2375030517578125, 0.24788284301757812, 0.25826263427734375, 0.2686424255371094, 0.279022216796875, 0.2894020080566406, 0.29978179931640625, 0.3101615905761719, 0.3205413818359375, 0.3309211730957031, 0.34130096435546875, 0.3516807556152344, 0.362060546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 8.0, 12.0, 20.0, 41.0, 103.0, 264.0, 298.0, 123.0, 38.0, 26.0, 12.0, 13.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015807151794433594, -0.00015281513333320618, -0.00014755874872207642, -0.00014230236411094666, -0.0001370459794998169, -0.00013178959488868713, -0.00012653321027755737, -0.00012127682566642761, -0.00011602044105529785, -0.00011076405644416809, -0.00010550767183303833, -0.00010025128722190857, -9.499490261077881e-05, -8.973851799964905e-05, -8.448213338851929e-05, -7.922574877738953e-05, -7.396936416625977e-05, -6.871297955513e-05, -6.345659494400024e-05, -5.8200210332870483e-05, -5.294382572174072e-05, -4.768744111061096e-05, -4.24310564994812e-05, -3.717467188835144e-05, -3.191828727722168e-05, -2.666190266609192e-05, -2.1405518054962158e-05, -1.6149133443832397e-05, -1.0892748832702637e-05, -5.636364221572876e-06, -3.7997961044311523e-07, 4.8764050006866455e-06, 1.0132789611816406e-05, 1.5389174222946167e-05, 2.0645558834075928e-05, 2.590194344520569e-05, 3.115832805633545e-05, 3.641471266746521e-05, 4.167109727859497e-05, 4.692748188972473e-05, 5.218386650085449e-05, 5.744025111198425e-05, 6.269663572311401e-05, 6.795302033424377e-05, 7.320940494537354e-05, 7.84657895565033e-05, 8.372217416763306e-05, 8.897855877876282e-05, 9.423494338989258e-05, 9.949132800102234e-05, 0.0001047477126121521, 0.00011000409722328186, 0.00011526048183441162, 0.00012051686644554138, 0.00012577325105667114, 0.0001310296356678009, 0.00013628602027893066, 0.00014154240489006042, 0.00014679878950119019, 0.00015205517411231995, 0.0001573115587234497, 0.00016256794333457947, 0.00016782432794570923, 0.000173080712556839, 0.00017833709716796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 8.0, 14.0, 14.0, 46.0, 145.0, 649.0, 3768.0, 184671.0, 852902.0, 5283.0, 749.0, 184.0, 49.0, 19.0, 8.0, 10.0, 12.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2373046875, -0.231231689453125, -0.22515869140625, -0.219085693359375, -0.2130126953125, -0.206939697265625, -0.20086669921875, -0.194793701171875, -0.188720703125, -0.182647705078125, -0.17657470703125, -0.170501708984375, -0.1644287109375, -0.158355712890625, -0.15228271484375, -0.146209716796875, -0.14013671875, -0.134063720703125, -0.12799072265625, -0.121917724609375, -0.1158447265625, -0.109771728515625, -0.10369873046875, -0.097625732421875, -0.091552734375, -0.085479736328125, -0.07940673828125, -0.073333740234375, -0.0672607421875, -0.061187744140625, -0.05511474609375, -0.049041748046875, -0.04296875, -0.036895751953125, -0.03082275390625, -0.024749755859375, -0.0186767578125, -0.012603759765625, -0.00653076171875, -0.000457763671875, 0.005615234375, 0.011688232421875, 0.01776123046875, 0.023834228515625, 0.0299072265625, 0.035980224609375, 0.04205322265625, 0.048126220703125, 0.05419921875, 0.060272216796875, 0.06634521484375, 0.072418212890625, 0.0784912109375, 0.084564208984375, 0.09063720703125, 0.096710205078125, 0.102783203125, 0.108856201171875, 0.11492919921875, 0.121002197265625, 0.1270751953125, 0.133148193359375, 0.13922119140625, 0.145294189453125, 0.1513671875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 19.0, 27.0, 40.0, 81.0, 223.0, 301.0, 130.0, 68.0, 23.0, 26.0, 8.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0364990234375, -0.0352935791015625, -0.034088134765625, -0.0328826904296875, -0.03167724609375, -0.0304718017578125, -0.029266357421875, -0.0280609130859375, -0.02685546875, -0.0256500244140625, -0.024444580078125, -0.0232391357421875, -0.02203369140625, -0.0208282470703125, -0.019622802734375, -0.0184173583984375, -0.0172119140625, -0.0160064697265625, -0.014801025390625, -0.0135955810546875, -0.01239013671875, -0.0111846923828125, -0.009979248046875, -0.0087738037109375, -0.007568359375, -0.0063629150390625, -0.005157470703125, -0.0039520263671875, -0.00274658203125, -0.0015411376953125, -0.000335693359375, 0.0008697509765625, 0.0020751953125, 0.0032806396484375, 0.004486083984375, 0.0056915283203125, 0.00689697265625, 0.0081024169921875, 0.009307861328125, 0.0105133056640625, 0.01171875, 0.0129241943359375, 0.014129638671875, 0.0153350830078125, 0.01654052734375, 0.0177459716796875, 0.018951416015625, 0.0201568603515625, 0.0213623046875, 0.0225677490234375, 0.023773193359375, 0.0249786376953125, 0.02618408203125, 0.0273895263671875, 0.028594970703125, 0.0298004150390625, 0.031005859375, 0.0322113037109375, 0.033416748046875, 0.0346221923828125, 0.03582763671875, 0.0370330810546875, 0.038238525390625, 0.0394439697265625, 0.0406494140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 11.0, 38.0, 120.0, 376.0, 345.0, 76.0, 17.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5281555652618408, -0.5142734050750732, -0.5003912448883057, -0.4865091145038605, -0.4726269841194153, -0.4587448239326477, -0.4448626637458801, -0.43098050355911255, -0.41709837317466736, -0.4032162129878998, -0.3893340826034546, -0.375451922416687, -0.36156976222991943, -0.34768763184547424, -0.33380547165870667, -0.3199233412742615, -0.3060411810874939, -0.2921590209007263, -0.27827689051628113, -0.26439473032951355, -0.25051259994506836, -0.23663043975830078, -0.2227482795715332, -0.20886613428592682, -0.19498398900032043, -0.18110184371471405, -0.16721969842910767, -0.1533375382423401, -0.1394553929567337, -0.12557324767112732, -0.11169109493494034, -0.09780894219875336, -0.08392676711082458, -0.0700446218252182, -0.05616246908903122, -0.04228032007813454, -0.028398171067237854, -0.01451602578163147, -0.0006338730454444885, 0.013248279690742493, 0.027130424976348877, 0.04101257398724556, 0.05489472299814224, 0.06877687573432922, 0.08265902101993561, 0.09654116630554199, 0.11042331904172897, 0.12430547177791595, 0.13818761706352234, 0.15206976234912872, 0.1659519076347351, 0.17983406782150269, 0.19371621310710907, 0.20759835839271545, 0.22148051857948303, 0.23536266386508942, 0.2492448091506958, 0.2631269693374634, 0.27700909972190857, 0.29089125990867615, 0.30477339029312134, 0.3186555504798889, 0.3325377106666565, 0.3464198708534241, 0.36030200123786926]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 1.0, 3.0, 3.0, 7.0, 7.0, 6.0, 12.0, 12.0, 31.0, 41.0, 50.0, 71.0, 63.0, 59.0, 72.0, 99.0, 91.0, 71.0, 75.0, 67.0, 47.0, 33.0, 17.0, 20.0, 9.0, 4.0, 10.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.15782815217971802, -0.15318745374679565, -0.1485467404127121, -0.14390604197978973, -0.13926532864570618, -0.1346246302127838, -0.12998391687870026, -0.1253432184457779, -0.12070251256227493, -0.11606180667877197, -0.11142110079526901, -0.10678039491176605, -0.10213969647884369, -0.09749898314476013, -0.09285828471183777, -0.08821757882833481, -0.08357687294483185, -0.07893616706132889, -0.07429546117782593, -0.06965475529432297, -0.06501404941082001, -0.060373347252607346, -0.055732645094394684, -0.051091939210891724, -0.04645123332738876, -0.0418105274438858, -0.03716982156038284, -0.03252911940217018, -0.02788841351866722, -0.02324770763516426, -0.01860700361430645, -0.013966299593448639, -0.009325593709945679, -0.004684888757765293, -4.418380558490753e-05, 0.004596521146595478, 0.009237226098775864, 0.013877931982278824, 0.018518636003136635, 0.023159340023994446, 0.027800045907497406, 0.032440751791000366, 0.037081457674503326, 0.04172215983271599, 0.04636286571621895, 0.05100357159972191, 0.05564427375793457, 0.06028497964143753, 0.06492568552494049, 0.06956639140844345, 0.07420709729194641, 0.07884780317544937, 0.08348850905895233, 0.0881292074918747, 0.09276991337537766, 0.09741061925888062, 0.10205132514238358, 0.10669203102588654, 0.1113327369093895, 0.11597344279289246, 0.12061414122581482, 0.12525485455989838, 0.12989555299282074, 0.1345362663269043, 0.13917696475982666]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 8.0, 6.0, 6.0, 8.0, 8.0, 16.0, 6.0, 12.0, 16.0, 22.0, 28.0, 22.0, 48.0, 160.0, 1327.0, 4192126.0, 242.0, 45.0, 28.0, 22.0, 20.0, 8.0, 10.0, 12.0, 18.0, 6.0, 6.0, 8.0, 4.0, 10.0, 2.0, 4.0, 2.0, 2.0, 8.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8125, -1.743377685546875, -1.67425537109375, -1.605133056640625, -1.5360107421875, -1.466888427734375, -1.39776611328125, -1.328643798828125, -1.259521484375, -1.190399169921875, -1.12127685546875, -1.052154541015625, -0.9830322265625, -0.913909912109375, -0.84478759765625, -0.775665283203125, -0.70654296875, -0.637420654296875, -0.56829833984375, -0.499176025390625, -0.4300537109375, -0.360931396484375, -0.29180908203125, -0.222686767578125, -0.153564453125, -0.084442138671875, -0.01531982421875, 0.053802490234375, 0.1229248046875, 0.192047119140625, 0.26116943359375, 0.330291748046875, 0.3994140625, 0.468536376953125, 0.53765869140625, 0.606781005859375, 0.6759033203125, 0.745025634765625, 0.81414794921875, 0.883270263671875, 0.952392578125, 1.021514892578125, 1.09063720703125, 1.159759521484375, 1.2288818359375, 1.298004150390625, 1.36712646484375, 1.436248779296875, 1.50537109375, 1.574493408203125, 1.64361572265625, 1.712738037109375, 1.7818603515625, 1.850982666015625, 1.92010498046875, 1.989227294921875, 2.058349609375, 2.127471923828125, 2.19659423828125, 2.265716552734375, 2.3348388671875, 2.403961181640625, 2.47308349609375, 2.542205810546875, 2.611328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 10.0, 17.0, 19.0, 21.0, 28.0, 44.0, 68.0, 82.0, 116.0, 149.0, 105.0, 84.0, 81.0, 48.0, 39.0, 21.0, 15.0, 13.0, 7.0, 3.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029544830322265625, -0.0028477609157562256, -0.0027410387992858887, -0.0026343166828155518, -0.002527594566345215, -0.002420872449874878, -0.002314150333404541, -0.002207428216934204, -0.002100706100463867, -0.0019939839839935303, -0.0018872618675231934, -0.0017805397510528564, -0.0016738176345825195, -0.0015670955181121826, -0.0014603734016418457, -0.0013536512851715088, -0.0012469291687011719, -0.001140207052230835, -0.001033484935760498, -0.0009267628192901611, -0.0008200407028198242, -0.0007133185863494873, -0.0006065964698791504, -0.0004998743534088135, -0.00039315223693847656, -0.00028643012046813965, -0.00017970800399780273, -7.298588752746582e-05, 3.3736228942871094e-05, 0.000140458345413208, 0.0002471804618835449, 0.00035390257835388184, 0.00046062469482421875, 0.0005673468112945557, 0.0006740689277648926, 0.0007807910442352295, 0.0008875131607055664, 0.0009942352771759033, 0.0011009573936462402, 0.0012076795101165771, 0.001314401626586914, 0.001421123743057251, 0.0015278458595275879, 0.0016345679759979248, 0.0017412900924682617, 0.0018480122089385986, 0.0019547343254089355, 0.0020614564418792725, 0.0021681785583496094, 0.0022749006748199463, 0.002381622791290283, 0.00248834490776062, 0.002595067024230957, 0.002701789140701294, 0.002808511257171631, 0.0029152333736419678, 0.0030219554901123047, 0.0031286776065826416, 0.0032353997230529785, 0.0033421218395233154, 0.0034488439559936523, 0.0035555660724639893, 0.003662288188934326, 0.003769010305404663, 0.003875732421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 9.0, 56.0, 2227.0, 4191824.0, 146.0, 22.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.57177734375, -0.47837066650390625, -0.3849639892578125, -0.29155731201171875, -0.198150634765625, -0.10474395751953125, -0.0113372802734375, 0.08206939697265625, 0.17547607421875, 0.26888275146484375, 0.3622894287109375, 0.45569610595703125, 0.549102783203125, 0.6425094604492188, 0.7359161376953125, 0.8293228149414062, 0.9227294921875, 1.0161361694335938, 1.1095428466796875, 1.2029495239257812, 1.296356201171875, 1.3897628784179688, 1.4831695556640625, 1.5765762329101562, 1.66998291015625, 1.7633895874023438, 1.8567962646484375, 1.9502029418945312, 2.043609619140625, 2.1370162963867188, 2.2304229736328125, 2.3238296508789062, 2.417236328125, 2.5106430053710938, 2.6040496826171875, 2.6974563598632812, 2.790863037109375, 2.8842697143554688, 2.9776763916015625, 3.0710830688476562, 3.16448974609375, 3.2578964233398438, 3.3513031005859375, 3.4447097778320312, 3.538116455078125, 3.6315231323242188, 3.7249298095703125, 3.8183364868164062, 3.9117431640625, 4.005149841308594, 4.0985565185546875, 4.191963195800781, 4.285369873046875, 4.378776550292969, 4.4721832275390625, 4.565589904785156, 4.65899658203125, 4.752403259277344, 4.8458099365234375, 4.939216613769531, 5.032623291015625, 5.126029968261719, 5.2194366455078125, 5.312843322753906, 5.40625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 4.0, 7.0, 6.0, 41.0, 194.0, 1125.0, 2362.0, 241.0, 79.0, 18.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00786590576171875, -0.006895184516906738, -0.0059244632720947266, -0.004953742027282715, -0.003983020782470703, -0.0030122995376586914, -0.0020415782928466797, -0.001070857048034668, -0.00010013580322265625, 0.0008705854415893555, 0.0018413066864013672, 0.002812027931213379, 0.0037827491760253906, 0.004753470420837402, 0.005724191665649414, 0.006694912910461426, 0.0076656341552734375, 0.00863635540008545, 0.009607076644897461, 0.010577797889709473, 0.011548519134521484, 0.012519240379333496, 0.013489961624145508, 0.01446068286895752, 0.015431404113769531, 0.016402125358581543, 0.017372846603393555, 0.018343567848205566, 0.019314289093017578, 0.02028501033782959, 0.0212557315826416, 0.022226452827453613, 0.023197174072265625, 0.024167895317077637, 0.02513861656188965, 0.02610933780670166, 0.027080059051513672, 0.028050780296325684, 0.029021501541137695, 0.029992222785949707, 0.03096294403076172, 0.03193366527557373, 0.03290438652038574, 0.033875107765197754, 0.034845829010009766, 0.03581655025482178, 0.03678727149963379, 0.0377579927444458, 0.03872871398925781, 0.039699435234069824, 0.040670156478881836, 0.04164087772369385, 0.04261159896850586, 0.04358232021331787, 0.04455304145812988, 0.045523762702941895, 0.046494483947753906, 0.04746520519256592, 0.04843592643737793, 0.04940664768218994, 0.05037736892700195, 0.051348090171813965, 0.05231881141662598, 0.05328953266143799, 0.05426025390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1020.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11939653754234314, 0.08671316504478455, 0.29282286763191223, 0.4989325702190399, 0.7050422430038452, 0.9111520051956177, 1.1172616481781006, 1.3233712911605835, 1.529481053352356, 1.7355906963348389, 1.9417004585266113, 2.147810220718384, 2.3539199829101562, 2.5600295066833496, 2.766139268875122, 2.9722490310668945, 3.178358793258667, 3.3844685554504395, 3.590578079223633, 3.7966878414154053, 4.002797603607178, 4.208907127380371, 4.415017127990723, 4.621126651763916, 4.827236175537109, 5.033345699310303, 5.239455699920654, 5.445565223693848, 5.651675224304199, 5.857784748077393, 6.063894271850586, 6.2700042724609375, 6.476114273071289, 6.682223796844482, 6.888333797454834, 7.094443321228027, 7.300553321838379, 7.506662845611572, 7.712772369384766, 7.918882369995117, 8.124992370605469, 8.33110237121582, 8.537211418151855, 8.743321418762207, 8.949431419372559, 9.155540466308594, 9.361650466918945, 9.567760467529297, 9.773869514465332, 9.979979515075684, 10.186088562011719, 10.39219856262207, 10.598308563232422, 10.804418563842773, 11.010527610778809, 11.21663761138916, 11.422746658325195, 11.628856658935547, 11.834965705871582, 12.041075706481934, 12.247185707092285, 12.45329475402832, 12.659404754638672, 12.865514755249023, 13.071624755859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 14.0, 32.0, 79.0, 179.0, 263.0, 233.0, 141.0, 44.0, 18.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2908943295478821, -0.2686131000518799, -0.24633187055587769, -0.22405065596103668, -0.20176942646503448, -0.1794881969690323, -0.15720698237419128, -0.1349257528781891, -0.11264452338218689, -0.09036329388618469, -0.06808207184076309, -0.04580084979534149, -0.023519620299339294, -0.0012383908033370972, 0.021042823791503906, 0.043324053287506104, 0.0656052827835083, 0.0878865122795105, 0.1101677343249321, 0.1324489563703537, 0.1547301858663559, 0.1770114153623581, 0.1992926299571991, 0.2215738594532013, 0.2438550889492035, 0.2661363184452057, 0.2884175479412079, 0.3106987476348877, 0.3329799771308899, 0.3552612066268921, 0.3775424361228943, 0.3998236656188965, 0.42210495471954346, 0.44438618421554565, 0.46666741371154785, 0.48894864320755005, 0.5112298727035522, 0.5335111021995544, 0.5557923316955566, 0.5780735015869141, 0.600354790687561, 0.6226360201835632, 0.6449172496795654, 0.6671984791755676, 0.6894797086715698, 0.711760938167572, 0.7340421676635742, 0.7563233375549316, 0.7786045670509338, 0.800885796546936, 0.8231670260429382, 0.8454482555389404, 0.8677294850349426, 0.8900107145309448, 0.9122918844223022, 0.9345731735229492, 0.9568543434143066, 0.9791355729103088, 1.001416802406311, 1.0236979722976685, 1.0459792613983154, 1.0682604312896729, 1.0905417203903198, 1.1128228902816772, 1.1351041793823242]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 14.0, 13.0, 17.0, 29.0, 26.0, 29.0, 41.0, 55.0, 58.0, 57.0, 130.0, 1042005.0, 5629.0, 65.0, 60.0, 52.0, 48.0, 41.0, 31.0, 32.0, 24.0, 26.0, 19.0, 7.0, 5.0, 8.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.466796875, -1.4268798828125, -1.386962890625, -1.3470458984375, -1.30712890625, -1.2672119140625, -1.227294921875, -1.1873779296875, -1.1474609375, -1.1075439453125, -1.067626953125, -1.0277099609375, -0.98779296875, -0.9478759765625, -0.907958984375, -0.8680419921875, -0.828125, -0.7882080078125, -0.748291015625, -0.7083740234375, -0.66845703125, -0.6285400390625, -0.588623046875, -0.5487060546875, -0.5087890625, -0.4688720703125, -0.428955078125, -0.3890380859375, -0.34912109375, -0.3092041015625, -0.269287109375, -0.2293701171875, -0.189453125, -0.1495361328125, -0.109619140625, -0.0697021484375, -0.02978515625, 0.0101318359375, 0.050048828125, 0.0899658203125, 0.1298828125, 0.1697998046875, 0.209716796875, 0.2496337890625, 0.28955078125, 0.3294677734375, 0.369384765625, 0.4093017578125, 0.44921875, 0.4891357421875, 0.529052734375, 0.5689697265625, 0.60888671875, 0.6488037109375, 0.688720703125, 0.7286376953125, 0.7685546875, 0.8084716796875, 0.848388671875, 0.8883056640625, 0.92822265625, 0.9681396484375, 1.008056640625, 1.0479736328125, 1.087890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [21.0, 254.0, 648.0, 94.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01087188720703125, -0.006265521049499512, -0.0016591548919677734, 0.002947211265563965, 0.007553577423095703, 0.012159943580627441, 0.01676630973815918, 0.021372675895690918, 0.025979042053222656, 0.030585408210754395, 0.03519177436828613, 0.03979814052581787, 0.04440450668334961, 0.04901087284088135, 0.053617238998413086, 0.058223605155944824, 0.06282997131347656, 0.0674363374710083, 0.07204270362854004, 0.07664906978607178, 0.08125543594360352, 0.08586180210113525, 0.09046816825866699, 0.09507453441619873, 0.09968090057373047, 0.10428726673126221, 0.10889363288879395, 0.11349999904632568, 0.11810636520385742, 0.12271273136138916, 0.1273190975189209, 0.13192546367645264, 0.13653182983398438, 0.1411381959915161, 0.14574456214904785, 0.1503509283065796, 0.15495729446411133, 0.15956366062164307, 0.1641700267791748, 0.16877639293670654, 0.17338275909423828, 0.17798912525177002, 0.18259549140930176, 0.1872018575668335, 0.19180822372436523, 0.19641458988189697, 0.2010209560394287, 0.20562732219696045, 0.2102336883544922, 0.21484005451202393, 0.21944642066955566, 0.2240527868270874, 0.22865915298461914, 0.23326551914215088, 0.23787188529968262, 0.24247825145721436, 0.2470846176147461, 0.25169098377227783, 0.25629734992980957, 0.2609037160873413, 0.26551008224487305, 0.2701164484024048, 0.2747228145599365, 0.27932918071746826, 0.283935546875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 9.0, 14.0, 16.0, 28.0, 35.0, 27.0, 62.0, 83.0, 164.0, 353.0, 1259.0, 6760.0, 81211.0, 883671.0, 66603.0, 6222.0, 1235.0, 339.0, 158.0, 79.0, 52.0, 39.0, 29.0, 15.0, 17.0, 11.0, 2.0, 11.0, 4.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.44140625, -0.4286003112792969, -0.41579437255859375, -0.4029884338378906, -0.3901824951171875, -0.3773765563964844, -0.36457061767578125, -0.3517646789550781, -0.338958740234375, -0.3261528015136719, -0.31334686279296875, -0.3005409240722656, -0.2877349853515625, -0.2749290466308594, -0.26212310791015625, -0.24931716918945312, -0.23651123046875, -0.22370529174804688, -0.21089935302734375, -0.19809341430664062, -0.1852874755859375, -0.17248153686523438, -0.15967559814453125, -0.14686965942382812, -0.134063720703125, -0.12125778198242188, -0.10845184326171875, -0.09564590454101562, -0.0828399658203125, -0.07003402709960938, -0.05722808837890625, -0.044422149658203125, -0.0316162109375, -0.018810272216796875, -0.00600433349609375, 0.006801605224609375, 0.0196075439453125, 0.032413482666015625, 0.04521942138671875, 0.058025360107421875, 0.070831298828125, 0.08363723754882812, 0.09644317626953125, 0.10924911499023438, 0.1220550537109375, 0.13486099243164062, 0.14766693115234375, 0.16047286987304688, 0.17327880859375, 0.18608474731445312, 0.19889068603515625, 0.21169662475585938, 0.2245025634765625, 0.23730850219726562, 0.25011444091796875, 0.2629203796386719, 0.275726318359375, 0.2885322570800781, 0.30133819580078125, 0.3141441345214844, 0.3269500732421875, 0.3397560119628906, 0.35256195068359375, 0.3653678894042969, 0.378173828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 7.0, 7.0, 9.0, 25.0, 18.0, 19.0, 30.0, 38.0, 42.0, 48.0, 52.0, 65.0, 76.0, 62.0, 68.0, 75.0, 66.0, 44.0, 45.0, 48.0, 35.0, 20.0, 16.0, 17.0, 12.0, 11.0, 7.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.234619140625, -0.22789955139160156, -0.22117996215820312, -0.2144603729248047, -0.20774078369140625, -0.2010211944580078, -0.19430160522460938, -0.18758201599121094, -0.1808624267578125, -0.17414283752441406, -0.16742324829101562, -0.1607036590576172, -0.15398406982421875, -0.1472644805908203, -0.14054489135742188, -0.13382530212402344, -0.127105712890625, -0.12038612365722656, -0.11366653442382812, -0.10694694519042969, -0.10022735595703125, -0.09350776672363281, -0.08678817749023438, -0.08006858825683594, -0.0733489990234375, -0.06662940979003906, -0.059909820556640625, -0.05319023132324219, -0.04647064208984375, -0.03975105285644531, -0.033031463623046875, -0.026311874389648438, -0.01959228515625, -0.012872695922851562, -0.006153106689453125, 0.0005664825439453125, 0.00728607177734375, 0.014005661010742188, 0.020725250244140625, 0.027444839477539062, 0.0341644287109375, 0.04088401794433594, 0.047603607177734375, 0.05432319641113281, 0.06104278564453125, 0.06776237487792969, 0.07448196411132812, 0.08120155334472656, 0.087921142578125, 0.09464073181152344, 0.10136032104492188, 0.10807991027832031, 0.11479949951171875, 0.12151908874511719, 0.12823867797851562, 0.13495826721191406, 0.1416778564453125, 0.14839744567871094, 0.15511703491210938, 0.1618366241455078, 0.16855621337890625, 0.1752758026123047, 0.18199539184570312, 0.18871498107910156, 0.1954345703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 8.0, 10.0, 13.0, 14.0, 27.0, 25.0, 37.0, 57.0, 80.0, 160.0, 349.0, 1035.0, 4611.0, 66432.0, 958644.0, 13650.0, 2192.0, 584.0, 259.0, 102.0, 64.0, 35.0, 32.0, 29.0, 22.0, 11.0, 13.0, 10.0, 6.0, 11.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.75732421875, -0.7352218627929688, -0.7131195068359375, -0.6910171508789062, -0.668914794921875, -0.6468124389648438, -0.6247100830078125, -0.6026077270507812, -0.58050537109375, -0.5584030151367188, -0.5363006591796875, -0.5141983032226562, -0.492095947265625, -0.46999359130859375, -0.4478912353515625, -0.42578887939453125, -0.4036865234375, -0.38158416748046875, -0.3594818115234375, -0.33737945556640625, -0.315277099609375, -0.29317474365234375, -0.2710723876953125, -0.24897003173828125, -0.22686767578125, -0.20476531982421875, -0.1826629638671875, -0.16056060791015625, -0.138458251953125, -0.11635589599609375, -0.0942535400390625, -0.07215118408203125, -0.050048828125, -0.02794647216796875, -0.0058441162109375, 0.01625823974609375, 0.038360595703125, 0.06046295166015625, 0.0825653076171875, 0.10466766357421875, 0.12677001953125, 0.14887237548828125, 0.1709747314453125, 0.19307708740234375, 0.215179443359375, 0.23728179931640625, 0.2593841552734375, 0.28148651123046875, 0.3035888671875, 0.32569122314453125, 0.3477935791015625, 0.36989593505859375, 0.391998291015625, 0.41410064697265625, 0.4362030029296875, 0.45830535888671875, 0.48040771484375, 0.5025100708007812, 0.5246124267578125, 0.5467147827148438, 0.568817138671875, 0.5909194946289062, 0.6130218505859375, 0.6351242065429688, 0.6572265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 8.0, 19.0, 17.0, 25.0, 39.0, 53.0, 84.0, 131.0, 127.0, 144.0, 85.0, 64.0, 47.0, 29.0, 20.0, 24.0, 13.0, 9.0, 7.0, 12.0, 4.0, 5.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4378299713134766e-05, -2.342555671930313e-05, -2.2472813725471497e-05, -2.1520070731639862e-05, -2.0567327737808228e-05, -1.9614584743976593e-05, -1.866184175014496e-05, -1.7709098756313324e-05, -1.675635576248169e-05, -1.5803612768650055e-05, -1.485086977481842e-05, -1.3898126780986786e-05, -1.2945383787155151e-05, -1.1992640793323517e-05, -1.1039897799491882e-05, -1.0087154805660248e-05, -9.134411811828613e-06, -8.181668817996979e-06, -7.228925824165344e-06, -6.27618283033371e-06, -5.323439836502075e-06, -4.370696842670441e-06, -3.417953848838806e-06, -2.4652108550071716e-06, -1.5124678611755371e-06, -5.597248673439026e-07, 3.9301812648773193e-07, 1.3457611203193665e-06, 2.298504114151001e-06, 3.2512471079826355e-06, 4.20399010181427e-06, 5.1567330956459045e-06, 6.109476089477539e-06, 7.062219083309174e-06, 8.014962077140808e-06, 8.967705070972443e-06, 9.920448064804077e-06, 1.0873191058635712e-05, 1.1825934052467346e-05, 1.277867704629898e-05, 1.3731420040130615e-05, 1.468416303396225e-05, 1.5636906027793884e-05, 1.658964902162552e-05, 1.7542392015457153e-05, 1.8495135009288788e-05, 1.9447878003120422e-05, 2.0400620996952057e-05, 2.135336399078369e-05, 2.2306106984615326e-05, 2.325884997844696e-05, 2.4211592972278595e-05, 2.516433596611023e-05, 2.6117078959941864e-05, 2.70698219537735e-05, 2.8022564947605133e-05, 2.8975307941436768e-05, 2.9928050935268402e-05, 3.088079392910004e-05, 3.183353692293167e-05, 3.2786279916763306e-05, 3.373902291059494e-05, 3.4691765904426575e-05, 3.564450889825821e-05, 3.6597251892089844e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 6.0, 3.0, 5.0, 7.0, 12.0, 7.0, 22.0, 61.0, 130.0, 406.0, 2429.0, 67601.0, 971353.0, 5674.0, 569.0, 152.0, 51.0, 20.0, 14.0, 8.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.671875, -1.6340255737304688, -1.5961761474609375, -1.5583267211914062, -1.520477294921875, -1.4826278686523438, -1.4447784423828125, -1.4069290161132812, -1.36907958984375, -1.3312301635742188, -1.2933807373046875, -1.2555313110351562, -1.217681884765625, -1.1798324584960938, -1.1419830322265625, -1.1041336059570312, -1.0662841796875, -1.0284347534179688, -0.9905853271484375, -0.9527359008789062, -0.914886474609375, -0.8770370483398438, -0.8391876220703125, -0.8013381958007812, -0.76348876953125, -0.7256393432617188, -0.6877899169921875, -0.6499404907226562, -0.612091064453125, -0.5742416381835938, -0.5363922119140625, -0.49854278564453125, -0.460693359375, -0.42284393310546875, -0.3849945068359375, -0.34714508056640625, -0.309295654296875, -0.27144622802734375, -0.2335968017578125, -0.19574737548828125, -0.15789794921875, -0.12004852294921875, -0.0821990966796875, -0.04434967041015625, -0.006500244140625, 0.03134918212890625, 0.0691986083984375, 0.10704803466796875, 0.1448974609375, 0.18274688720703125, 0.2205963134765625, 0.25844573974609375, 0.296295166015625, 0.33414459228515625, 0.3719940185546875, 0.40984344482421875, 0.44769287109375, 0.48554229736328125, 0.5233917236328125, 0.5612411499023438, 0.599090576171875, 0.6369400024414062, 0.6747894287109375, 0.7126388549804688, 0.75048828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 4.0, 3.0, 7.0, 11.0, 22.0, 32.0, 63.0, 130.0, 408.0, 160.0, 50.0, 27.0, 18.0, 15.0, 8.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.640625, -0.6262321472167969, -0.6118392944335938, -0.5974464416503906, -0.5830535888671875, -0.5686607360839844, -0.5542678833007812, -0.5398750305175781, -0.525482177734375, -0.5110893249511719, -0.49669647216796875, -0.4823036193847656, -0.4679107666015625, -0.4535179138183594, -0.43912506103515625, -0.4247322082519531, -0.41033935546875, -0.3959465026855469, -0.38155364990234375, -0.3671607971191406, -0.3527679443359375, -0.3383750915527344, -0.32398223876953125, -0.3095893859863281, -0.295196533203125, -0.2808036804199219, -0.26641082763671875, -0.2520179748535156, -0.2376251220703125, -0.22323226928710938, -0.20883941650390625, -0.19444656372070312, -0.1800537109375, -0.16566085815429688, -0.15126800537109375, -0.13687515258789062, -0.1224822998046875, -0.10808944702148438, -0.09369659423828125, -0.07930374145507812, -0.064910888671875, -0.050518035888671875, -0.03612518310546875, -0.021732330322265625, -0.0073394775390625, 0.007053375244140625, 0.02144622802734375, 0.035839080810546875, 0.05023193359375, 0.06462478637695312, 0.07901763916015625, 0.09341049194335938, 0.1078033447265625, 0.12219619750976562, 0.13658905029296875, 0.15098190307617188, 0.165374755859375, 0.17976760864257812, 0.19416046142578125, 0.20855331420898438, 0.2229461669921875, 0.23733901977539062, 0.25173187255859375, 0.2661247253417969, 0.280517578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 29.0, 981.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.129974842071533, -4.764760494232178, -3.399545907974243, -2.0343313217163086, -0.6691169738769531, 0.6960973739624023, 2.061312198638916, 3.4265265464782715, 4.791740894317627, 6.156955242156982, 7.522170066833496, 8.887384414672852, 10.252598762512207, 11.617813110351562, 12.983028411865234, 14.348241806030273, 15.713457107543945, 17.078672409057617, 18.443885803222656, 19.809101104736328, 21.174314498901367, 22.53952980041504, 23.904743194580078, 25.26995849609375, 26.63517189025879, 28.00038719177246, 29.3656005859375, 30.730815887451172, 32.096031188964844, 33.46124267578125, 34.82645797729492, 36.191673278808594, 37.556888580322266, 38.92210388183594, 40.28731918334961, 41.652530670166016, 43.01774597167969, 44.38296127319336, 45.74817657470703, 47.11338806152344, 48.47860336303711, 49.84381866455078, 51.20903396606445, 52.57424545288086, 53.93946075439453, 55.3046760559082, 56.669891357421875, 58.03510284423828, 59.40032196044922, 60.76553726196289, 62.13075256347656, 63.49596405029297, 64.8611831665039, 66.22639465332031, 67.59160614013672, 68.95682525634766, 70.32203674316406, 71.68724822998047, 73.0524673461914, 74.41767883300781, 75.78289794921875, 77.14810943603516, 78.51332092285156, 79.8785400390625, 81.2437515258789]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 17.0, 26.0, 61.0, 74.0, 103.0, 150.0, 136.0, 119.0, 123.0, 81.0, 55.0, 35.0, 12.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2526531219482422, -1.1390981674194336, -1.0255430936813354, -0.9119881391525269, -0.7984331250190735, -0.6848781108856201, -0.5713231563568115, -0.45776814222335815, -0.3442131280899048, -0.2306581288576126, -0.11710312962532043, -0.003548145294189453, 0.11000686883926392, 0.22356188297271729, 0.3371168375015259, 0.45067185163497925, 0.5642268657684326, 0.677781879901886, 0.7913368940353394, 0.904891848564148, 1.018446922302246, 1.1320018768310547, 1.2455568313598633, 1.3591117858886719, 1.47266685962677, 1.5862218141555786, 1.6997768878936768, 1.8133318424224854, 1.926886796951294, 2.0404419898986816, 2.1539969444274902, 2.267551898956299, 2.3811068534851074, 2.494661808013916, 2.6082167625427246, 2.721771717071533, 2.835326910018921, 2.9488818645477295, 3.062436819076538, 3.1759917736053467, 3.2895469665527344, 3.403101921081543, 3.5166568756103516, 3.63021183013916, 3.743767023086548, 3.8573219776153564, 3.970876932144165, 4.084432125091553, 4.197986602783203, 4.311541557312012, 4.42509651184082, 4.538651466369629, 4.6522064208984375, 4.765761375427246, 4.879316329956055, 4.9928717613220215, 5.10642671585083, 5.219981670379639, 5.333536624908447, 5.447091579437256, 5.5606465339660645, 5.674201965332031, 5.78775691986084, 5.901311874389648, 6.014866828918457]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 19.0, 112.0, 1551.0, 4191286.0, 859.0, 234.0, 125.0, 64.0, 22.0, 13.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.7072525024414062, -0.4911651611328125, -0.27507781982421875, -0.058990478515625, 0.15709686279296875, 0.3731842041015625, 0.5892715454101562, 0.80535888671875, 1.0214462280273438, 1.2375335693359375, 1.4536209106445312, 1.669708251953125, 1.8857955932617188, 2.1018829345703125, 2.3179702758789062, 2.5340576171875, 2.7501449584960938, 2.9662322998046875, 3.1823196411132812, 3.398406982421875, 3.6144943237304688, 3.8305816650390625, 4.046669006347656, 4.26275634765625, 4.478843688964844, 4.6949310302734375, 4.911018371582031, 5.127105712890625, 5.343193054199219, 5.5592803955078125, 5.775367736816406, 5.991455078125, 6.207542419433594, 6.4236297607421875, 6.639717102050781, 6.855804443359375, 7.071891784667969, 7.2879791259765625, 7.504066467285156, 7.72015380859375, 7.936241149902344, 8.152328491210938, 8.368415832519531, 8.584503173828125, 8.800590515136719, 9.016677856445312, 9.232765197753906, 9.4488525390625, 9.664939880371094, 9.881027221679688, 10.097114562988281, 10.313201904296875, 10.529289245605469, 10.745376586914062, 10.961463928222656, 11.17755126953125, 11.393638610839844, 11.609725952148438, 11.825813293457031, 12.041900634765625, 12.257987976074219, 12.474075317382812, 12.690162658691406, 12.90625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 13.0, 84.0, 231.0, 398.0, 208.0, 65.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026702880859375, -0.02076578140258789, -0.014828681945800781, -0.008891582489013672, -0.0029544830322265625, 0.002982616424560547, 0.008919715881347656, 0.014856815338134766, 0.020793914794921875, 0.026731014251708984, 0.032668113708496094, 0.0386052131652832, 0.04454231262207031, 0.05047941207885742, 0.05641651153564453, 0.06235361099243164, 0.06829071044921875, 0.07422780990600586, 0.08016490936279297, 0.08610200881958008, 0.09203910827636719, 0.0979762077331543, 0.1039133071899414, 0.10985040664672852, 0.11578750610351562, 0.12172460556030273, 0.12766170501708984, 0.13359880447387695, 0.13953590393066406, 0.14547300338745117, 0.15141010284423828, 0.1573472023010254, 0.1632843017578125, 0.1692214012145996, 0.17515850067138672, 0.18109560012817383, 0.18703269958496094, 0.19296979904174805, 0.19890689849853516, 0.20484399795532227, 0.21078109741210938, 0.21671819686889648, 0.2226552963256836, 0.2285923957824707, 0.2345294952392578, 0.24046659469604492, 0.24640369415283203, 0.25234079360961914, 0.25827789306640625, 0.26421499252319336, 0.27015209197998047, 0.2760891914367676, 0.2820262908935547, 0.2879633903503418, 0.2939004898071289, 0.299837589263916, 0.3057746887207031, 0.31171178817749023, 0.31764888763427734, 0.32358598709106445, 0.32952308654785156, 0.33546018600463867, 0.3413972854614258, 0.3473343849182129, 0.353271484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 11.0, 38.0, 71.0, 188.0, 427.0, 4185729.0, 6981.0, 344.0, 260.0, 141.0, 67.0, 12.0, 13.0, 9.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.00390625, -5.62591552734375, -5.2479248046875, -4.86993408203125, -4.491943359375, -4.11395263671875, -3.7359619140625, -3.35797119140625, -2.97998046875, -2.60198974609375, -2.2239990234375, -1.84600830078125, -1.468017578125, -1.09002685546875, -0.7120361328125, -0.33404541015625, 0.0439453125, 0.42193603515625, 0.7999267578125, 1.17791748046875, 1.555908203125, 1.93389892578125, 2.3118896484375, 2.68988037109375, 3.06787109375, 3.44586181640625, 3.8238525390625, 4.20184326171875, 4.579833984375, 4.95782470703125, 5.3358154296875, 5.71380615234375, 6.091796875, 6.46978759765625, 6.8477783203125, 7.22576904296875, 7.603759765625, 7.98175048828125, 8.3597412109375, 8.73773193359375, 9.11572265625, 9.49371337890625, 9.8717041015625, 10.24969482421875, 10.627685546875, 11.00567626953125, 11.3836669921875, 11.76165771484375, 12.1396484375, 12.51763916015625, 12.8956298828125, 13.27362060546875, 13.651611328125, 14.02960205078125, 14.4075927734375, 14.78558349609375, 15.16357421875, 15.54156494140625, 15.9195556640625, 16.29754638671875, 16.675537109375, 17.05352783203125, 17.4315185546875, 17.80950927734375, 18.1875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 10.0, 29.0, 242.0, 3787.0, 17.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.51123046875, -0.47537994384765625, -0.4395294189453125, -0.40367889404296875, -0.367828369140625, -0.33197784423828125, -0.2961273193359375, -0.26027679443359375, -0.22442626953125, -0.18857574462890625, -0.1527252197265625, -0.11687469482421875, -0.081024169921875, -0.04517364501953125, -0.0093231201171875, 0.02652740478515625, 0.0623779296875, 0.09822845458984375, 0.1340789794921875, 0.16992950439453125, 0.205780029296875, 0.24163055419921875, 0.2774810791015625, 0.31333160400390625, 0.34918212890625, 0.38503265380859375, 0.4208831787109375, 0.45673370361328125, 0.492584228515625, 0.5284347534179688, 0.5642852783203125, 0.6001358032226562, 0.635986328125, 0.6718368530273438, 0.7076873779296875, 0.7435379028320312, 0.779388427734375, 0.8152389526367188, 0.8510894775390625, 0.8869400024414062, 0.92279052734375, 0.9586410522460938, 0.9944915771484375, 1.0303421020507812, 1.066192626953125, 1.1020431518554688, 1.1378936767578125, 1.1737442016601562, 1.2095947265625, 1.2454452514648438, 1.2812957763671875, 1.3171463012695312, 1.352996826171875, 1.3888473510742188, 1.4246978759765625, 1.4605484008789062, 1.49639892578125, 1.5322494506835938, 1.5680999755859375, 1.6039505004882812, 1.639801025390625, 1.6756515502929688, 1.7115020751953125, 1.7473526000976562, 1.783203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 30.0, 342.0, 611.0, 22.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4958527088165283, -3.11041259765625, -2.724972724914551, -2.3395326137542725, -1.9540926218032837, -1.568652629852295, -1.1832125186920166, -0.7977726459503174, -0.41233253479003906, -0.026892513036727905, 0.35854750871658325, 0.7439875602722168, 1.1294275522232056, 1.5148675441741943, 1.9003076553344727, 2.285747528076172, 2.67118763923645, 3.0566277503967285, 3.4420676231384277, 3.827507734298706, 4.212947845458984, 4.598387718200684, 4.983827590942383, 5.369267463684082, 5.7547078132629395, 6.140147686004639, 6.525588035583496, 6.911027908325195, 7.2964677810668945, 7.681907653808594, 8.06734848022461, 8.452787399291992, 8.838227272033691, 9.22366714477539, 9.60910701751709, 9.994546890258789, 10.379987716674805, 10.765427589416504, 11.150867462158203, 11.536307334899902, 11.921747207641602, 12.3071870803833, 12.692626953125, 13.078067779541016, 13.463507652282715, 13.848947525024414, 14.234387397766113, 14.619827270507812, 15.005268096923828, 15.390707969665527, 15.776147842407227, 16.161588668823242, 16.547027587890625, 16.93246841430664, 17.317909240722656, 17.70334815979004, 18.088787078857422, 18.474227905273438, 18.85966682434082, 19.245107650756836, 19.63054656982422, 20.015987396240234, 20.40142822265625, 20.786867141723633, 21.17230796813965]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 10.0, 30.0, 63.0, 81.0, 121.0, 169.0, 156.0, 141.0, 110.0, 52.0, 31.0, 20.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.499293327331543, -6.298373222351074, -6.097453594207764, -5.896533489227295, -5.695613384246826, -5.494693756103516, -5.293773651123047, -5.092853546142578, -4.891933441162109, -4.691013336181641, -4.49009370803833, -4.289173603057861, -4.088253498077393, -3.887333631515503, -3.6864137649536133, -3.4854936599731445, -3.284574031829834, -3.0836541652679443, -2.8827340602874756, -2.681814193725586, -2.480894088745117, -2.2799742221832275, -2.079054355621338, -1.8781343698501587, -1.6772143840789795, -1.4762943983078003, -1.275374412536621, -1.0744545459747314, -0.8735345602035522, -0.672614574432373, -0.4716947078704834, -0.2707747220993042, -0.069854736328125, 0.1310652196407318, 0.3319851756095886, 0.532905101776123, 0.7338250875473022, 0.9347450733184814, 1.135664939880371, 1.3365849256515503, 1.5375049114227295, 1.7384248971939087, 1.939344882965088, 2.1402647495269775, 2.341184616088867, 2.542104721069336, 2.7430245876312256, 2.9439444541931152, 3.144864559173584, 3.3457844257354736, 3.5467045307159424, 3.747624397277832, 3.948544502258301, 4.1494646072387695, 4.35038423538208, 4.551304340362549, 4.752223968505859, 4.953144073486328, 5.154063701629639, 5.354983806610107, 5.555903911590576, 5.756823539733887, 5.9577436447143555, 6.158663749694824, 6.359583854675293]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 6.0, 9.0, 10.0, 23.0, 29.0, 46.0, 79.0, 159.0, 291.0, 890.0, 3660.0, 54547.0, 959105.0, 25751.0, 2602.0, 751.0, 268.0, 104.0, 75.0, 52.0, 30.0, 22.0, 8.0, 9.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.451171875, -2.375518798828125, -2.29986572265625, -2.224212646484375, -2.1485595703125, -2.072906494140625, -1.99725341796875, -1.921600341796875, -1.845947265625, -1.770294189453125, -1.69464111328125, -1.618988037109375, -1.5433349609375, -1.467681884765625, -1.39202880859375, -1.316375732421875, -1.24072265625, -1.165069580078125, -1.08941650390625, -1.013763427734375, -0.9381103515625, -0.862457275390625, -0.78680419921875, -0.711151123046875, -0.635498046875, -0.559844970703125, -0.48419189453125, -0.408538818359375, -0.3328857421875, -0.257232666015625, -0.18157958984375, -0.105926513671875, -0.0302734375, 0.045379638671875, 0.12103271484375, 0.196685791015625, 0.2723388671875, 0.347991943359375, 0.42364501953125, 0.499298095703125, 0.574951171875, 0.650604248046875, 0.72625732421875, 0.801910400390625, 0.8775634765625, 0.953216552734375, 1.02886962890625, 1.104522705078125, 1.18017578125, 1.255828857421875, 1.33148193359375, 1.407135009765625, 1.4827880859375, 1.558441162109375, 1.63409423828125, 1.709747314453125, 1.785400390625, 1.861053466796875, 1.93670654296875, 2.012359619140625, 2.0880126953125, 2.163665771484375, 2.23931884765625, 2.314971923828125, 2.390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 20.0, 37.0, 81.0, 108.0, 172.0, 175.0, 158.0, 116.0, 57.0, 43.0, 20.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.2040729522705078, -0.19244766235351562, -0.18082237243652344, -0.16919708251953125, -0.15757179260253906, -0.14594650268554688, -0.1343212127685547, -0.1226959228515625, -0.11107063293457031, -0.09944534301757812, -0.08782005310058594, -0.07619476318359375, -0.06456947326660156, -0.052944183349609375, -0.04131889343261719, -0.029693603515625, -0.018068313598632812, -0.006443023681640625, 0.0051822662353515625, 0.01680755615234375, 0.028432846069335938, 0.040058135986328125, 0.05168342590332031, 0.0633087158203125, 0.07493400573730469, 0.08655929565429688, 0.09818458557128906, 0.10980987548828125, 0.12143516540527344, 0.13306045532226562, 0.1446857452392578, 0.15631103515625, 0.1679363250732422, 0.17956161499023438, 0.19118690490722656, 0.20281219482421875, 0.21443748474121094, 0.22606277465820312, 0.2376880645751953, 0.2493133544921875, 0.2609386444091797, 0.2725639343261719, 0.28418922424316406, 0.29581451416015625, 0.30743980407714844, 0.3190650939941406, 0.3306903839111328, 0.342315673828125, 0.3539409637451172, 0.3655662536621094, 0.37719154357910156, 0.38881683349609375, 0.40044212341308594, 0.4120674133300781, 0.4236927032470703, 0.4353179931640625, 0.4469432830810547, 0.4585685729980469, 0.47019386291503906, 0.48181915283203125, 0.49344444274902344, 0.5050697326660156, 0.5166950225830078, 0.5283203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 6.0, 10.0, 10.0, 11.0, 20.0, 16.0, 24.0, 32.0, 53.0, 69.0, 132.0, 327.0, 1675.0, 24329.0, 958739.0, 59195.0, 2915.0, 522.0, 160.0, 87.0, 46.0, 42.0, 22.0, 19.0, 18.0, 15.0, 10.0, 10.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.45703125, -1.4094390869140625, -1.361846923828125, -1.3142547607421875, -1.26666259765625, -1.2190704345703125, -1.171478271484375, -1.1238861083984375, -1.0762939453125, -1.0287017822265625, -0.981109619140625, -0.9335174560546875, -0.88592529296875, -0.8383331298828125, -0.790740966796875, -0.7431488037109375, -0.695556640625, -0.6479644775390625, -0.600372314453125, -0.5527801513671875, -0.50518798828125, -0.4575958251953125, -0.410003662109375, -0.3624114990234375, -0.3148193359375, -0.2672271728515625, -0.219635009765625, -0.1720428466796875, -0.12445068359375, -0.0768585205078125, -0.029266357421875, 0.0183258056640625, 0.06591796875, 0.1135101318359375, 0.161102294921875, 0.2086944580078125, 0.25628662109375, 0.3038787841796875, 0.351470947265625, 0.3990631103515625, 0.4466552734375, 0.4942474365234375, 0.541839599609375, 0.5894317626953125, 0.63702392578125, 0.6846160888671875, 0.732208251953125, 0.7798004150390625, 0.827392578125, 0.8749847412109375, 0.922576904296875, 0.9701690673828125, 1.01776123046875, 1.0653533935546875, 1.112945556640625, 1.1605377197265625, 1.2081298828125, 1.2557220458984375, 1.303314208984375, 1.3509063720703125, 1.39849853515625, 1.4460906982421875, 1.493682861328125, 1.5412750244140625, 1.5888671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 6.0, 5.0, 12.0, 12.0, 10.0, 20.0, 27.0, 15.0, 34.0, 38.0, 43.0, 48.0, 48.0, 56.0, 64.0, 69.0, 64.0, 57.0, 57.0, 48.0, 53.0, 39.0, 31.0, 27.0, 20.0, 24.0, 14.0, 11.0, 8.0, 10.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5706939697265625, -0.551544189453125, -0.5323944091796875, -0.51324462890625, -0.4940948486328125, -0.474945068359375, -0.4557952880859375, -0.4366455078125, -0.4174957275390625, -0.398345947265625, -0.3791961669921875, -0.36004638671875, -0.3408966064453125, -0.321746826171875, -0.3025970458984375, -0.283447265625, -0.2642974853515625, -0.245147705078125, -0.2259979248046875, -0.20684814453125, -0.1876983642578125, -0.168548583984375, -0.1493988037109375, -0.1302490234375, -0.1110992431640625, -0.091949462890625, -0.0727996826171875, -0.05364990234375, -0.0345001220703125, -0.015350341796875, 0.0037994384765625, 0.02294921875, 0.0420989990234375, 0.061248779296875, 0.0803985595703125, 0.09954833984375, 0.1186981201171875, 0.137847900390625, 0.1569976806640625, 0.1761474609375, 0.1952972412109375, 0.214447021484375, 0.2335968017578125, 0.25274658203125, 0.2718963623046875, 0.291046142578125, 0.3101959228515625, 0.329345703125, 0.3484954833984375, 0.367645263671875, 0.3867950439453125, 0.40594482421875, 0.4250946044921875, 0.444244384765625, 0.4633941650390625, 0.4825439453125, 0.5016937255859375, 0.520843505859375, 0.5399932861328125, 0.55914306640625, 0.5782928466796875, 0.597442626953125, 0.6165924072265625, 0.6357421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 15.0, 31.0, 61.0, 162.0, 413.0, 2031.0, 56682.0, 982031.0, 5890.0, 816.0, 226.0, 81.0, 48.0, 20.0, 13.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62939453125, -0.5948715209960938, -0.5603485107421875, -0.5258255004882812, -0.491302490234375, -0.45677947998046875, -0.4222564697265625, -0.38773345947265625, -0.35321044921875, -0.31868743896484375, -0.2841644287109375, -0.24964141845703125, -0.215118408203125, -0.18059539794921875, -0.1460723876953125, -0.11154937744140625, -0.0770263671875, -0.04250335693359375, -0.0079803466796875, 0.02654266357421875, 0.061065673828125, 0.09558868408203125, 0.1301116943359375, 0.16463470458984375, 0.19915771484375, 0.23368072509765625, 0.2682037353515625, 0.30272674560546875, 0.337249755859375, 0.37177276611328125, 0.4062957763671875, 0.44081878662109375, 0.475341796875, 0.5098648071289062, 0.5443878173828125, 0.5789108276367188, 0.613433837890625, 0.6479568481445312, 0.6824798583984375, 0.7170028686523438, 0.75152587890625, 0.7860488891601562, 0.8205718994140625, 0.8550949096679688, 0.889617919921875, 0.9241409301757812, 0.9586639404296875, 0.9931869506835938, 1.0277099609375, 1.0622329711914062, 1.0967559814453125, 1.1312789916992188, 1.165802001953125, 1.2003250122070312, 1.2348480224609375, 1.2693710327148438, 1.30389404296875, 1.3384170532226562, 1.3729400634765625, 1.4074630737304688, 1.441986083984375, 1.4765090942382812, 1.5110321044921875, 1.5455551147460938, 1.580078125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 7.0, 12.0, 11.0, 15.0, 17.0, 18.0, 23.0, 38.0, 52.0, 59.0, 64.0, 87.0, 94.0, 104.0, 84.0, 69.0, 52.0, 47.0, 32.0, 23.0, 21.0, 8.0, 11.0, 7.0, 4.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.658367156982422e-05, -2.5704503059387207e-05, -2.4825334548950195e-05, -2.3946166038513184e-05, -2.3066997528076172e-05, -2.218782901763916e-05, -2.130866050720215e-05, -2.0429491996765137e-05, -1.9550323486328125e-05, -1.8671154975891113e-05, -1.77919864654541e-05, -1.691281795501709e-05, -1.6033649444580078e-05, -1.5154480934143066e-05, -1.4275312423706055e-05, -1.3396143913269043e-05, -1.2516975402832031e-05, -1.163780689239502e-05, -1.0758638381958008e-05, -9.879469871520996e-06, -9.000301361083984e-06, -8.121132850646973e-06, -7.241964340209961e-06, -6.362795829772949e-06, -5.4836273193359375e-06, -4.604458808898926e-06, -3.725290298461914e-06, -2.8461217880249023e-06, -1.9669532775878906e-06, -1.087784767150879e-06, -2.086162567138672e-07, 6.705522537231445e-07, 1.5497207641601562e-06, 2.428889274597168e-06, 3.3080577850341797e-06, 4.187226295471191e-06, 5.066394805908203e-06, 5.945563316345215e-06, 6.8247318267822266e-06, 7.703900337219238e-06, 8.58306884765625e-06, 9.462237358093262e-06, 1.0341405868530273e-05, 1.1220574378967285e-05, 1.2099742889404297e-05, 1.2978911399841309e-05, 1.385807991027832e-05, 1.4737248420715332e-05, 1.5616416931152344e-05, 1.6495585441589355e-05, 1.7374753952026367e-05, 1.825392246246338e-05, 1.913309097290039e-05, 2.0012259483337402e-05, 2.0891427993774414e-05, 2.1770596504211426e-05, 2.2649765014648438e-05, 2.352893352508545e-05, 2.440810203552246e-05, 2.5287270545959473e-05, 2.6166439056396484e-05, 2.7045607566833496e-05, 2.7924776077270508e-05, 2.880394458770752e-05, 2.968311309814453e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 10.0, 16.0, 28.0, 56.0, 121.0, 506.0, 4044.0, 967391.0, 74213.0, 1577.0, 347.0, 115.0, 52.0, 25.0, 15.0, 9.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6640625, -0.6305389404296875, -0.597015380859375, -0.5634918212890625, -0.52996826171875, -0.4964447021484375, -0.462921142578125, -0.4293975830078125, -0.3958740234375, -0.3623504638671875, -0.328826904296875, -0.2953033447265625, -0.26177978515625, -0.2282562255859375, -0.194732666015625, -0.1612091064453125, -0.127685546875, -0.0941619873046875, -0.060638427734375, -0.0271148681640625, 0.00640869140625, 0.0399322509765625, 0.073455810546875, 0.1069793701171875, 0.1405029296875, 0.1740264892578125, 0.207550048828125, 0.2410736083984375, 0.27459716796875, 0.3081207275390625, 0.341644287109375, 0.3751678466796875, 0.40869140625, 0.4422149658203125, 0.475738525390625, 0.5092620849609375, 0.54278564453125, 0.5763092041015625, 0.609832763671875, 0.6433563232421875, 0.6768798828125, 0.7104034423828125, 0.743927001953125, 0.7774505615234375, 0.81097412109375, 0.8444976806640625, 0.878021240234375, 0.9115447998046875, 0.945068359375, 0.9785919189453125, 1.012115478515625, 1.0456390380859375, 1.07916259765625, 1.1126861572265625, 1.146209716796875, 1.1797332763671875, 1.2132568359375, 1.2467803955078125, 1.280303955078125, 1.3138275146484375, 1.34735107421875, 1.3808746337890625, 1.414398193359375, 1.4479217529296875, 1.4814453125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 13.0, 23.0, 34.0, 60.0, 111.0, 221.0, 227.0, 131.0, 49.0, 34.0, 33.0, 14.0, 10.0, 7.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265380859375, -0.2521171569824219, -0.23885345458984375, -0.22558975219726562, -0.2123260498046875, -0.19906234741210938, -0.18579864501953125, -0.17253494262695312, -0.159271240234375, -0.14600753784179688, -0.13274383544921875, -0.11948013305664062, -0.1062164306640625, -0.09295272827148438, -0.07968902587890625, -0.06642532348632812, -0.05316162109375, -0.039897918701171875, -0.02663421630859375, -0.013370513916015625, -0.0001068115234375, 0.013156890869140625, 0.02642059326171875, 0.039684295654296875, 0.052947998046875, 0.06621170043945312, 0.07947540283203125, 0.09273910522460938, 0.1060028076171875, 0.11926651000976562, 0.13253021240234375, 0.14579391479492188, 0.1590576171875, 0.17232131958007812, 0.18558502197265625, 0.19884872436523438, 0.2121124267578125, 0.22537612915039062, 0.23863983154296875, 0.2519035339355469, 0.265167236328125, 0.2784309387207031, 0.29169464111328125, 0.3049583435058594, 0.3182220458984375, 0.3314857482910156, 0.34474945068359375, 0.3580131530761719, 0.37127685546875, 0.3845405578613281, 0.39780426025390625, 0.4110679626464844, 0.4243316650390625, 0.4375953674316406, 0.45085906982421875, 0.4641227722167969, 0.477386474609375, 0.4906501770019531, 0.5039138793945312, 0.5171775817871094, 0.5304412841796875, 0.5437049865722656, 0.5569686889648438, 0.5702323913574219, 0.58349609375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 34.0, 533.0, 417.0, 15.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.94917106628418, -12.410395622253418, -11.871620178222656, -11.332844734191895, -10.794069290161133, -10.255293846130371, -9.71651840209961, -9.177742958068848, -8.638967514038086, -8.100192070007324, -7.5614166259765625, -7.022641181945801, -6.483865737915039, -5.945090293884277, -5.406314849853516, -4.867539405822754, -4.328763961791992, -3.7899885177612305, -3.2512130737304688, -2.712437629699707, -2.1736621856689453, -1.6348867416381836, -1.0961112976074219, -0.5573358535766602, -0.018560409545898438, 0.5202150344848633, 1.058990478515625, 1.5977659225463867, 2.1365413665771484, 2.67531681060791, 3.214092254638672, 3.7528676986694336, 4.291645050048828, 4.83042049407959, 5.369195938110352, 5.907971382141113, 6.446746826171875, 6.985522270202637, 7.524297714233398, 8.06307315826416, 8.601848602294922, 9.140624046325684, 9.679399490356445, 10.218174934387207, 10.756950378417969, 11.29572582244873, 11.834501266479492, 12.373276710510254, 12.912052154541016, 13.450827598571777, 13.989603042602539, 14.5283784866333, 15.067153930664062, 15.605929374694824, 16.144704818725586, 16.68347930908203, 17.22225570678711, 17.761032104492188, 18.299806594848633, 18.838581085205078, 19.377357482910156, 19.916133880615234, 20.45490837097168, 20.993682861328125, 21.532459259033203]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 8.0, 13.0, 11.0, 15.0, 23.0, 29.0, 30.0, 37.0, 43.0, 38.0, 50.0, 74.0, 66.0, 79.0, 67.0, 74.0, 47.0, 36.0, 53.0, 49.0, 45.0, 23.0, 23.0, 23.0, 9.0, 13.0, 4.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.90798282623291, -4.772911548614502, -4.637840270996094, -4.502769470214844, -4.3676981925964355, -4.232626914978027, -4.097555637359619, -3.962484359741211, -3.8274130821228027, -3.6923418045043945, -3.5572707653045654, -3.4221994876861572, -3.287128210067749, -3.15205717086792, -3.0169858932495117, -2.8819146156311035, -2.7468435764312744, -2.611772298812866, -2.476701259613037, -2.341629981994629, -2.2065587043762207, -2.0714874267578125, -1.9364163875579834, -1.8013451099395752, -1.6662739515304565, -1.531202793121338, -1.3961315155029297, -1.261060357093811, -1.1259891986846924, -0.9909179210662842, -0.8558467626571655, -0.7207755446434021, -0.5857043266296387, -0.45063310861587524, -0.3155619204044342, -0.18049073219299316, -0.045419514179229736, 0.08965170383453369, 0.22472286224365234, 0.35979408025741577, 0.4948652982711792, 0.6299365162849426, 0.765007734298706, 0.9000788927078247, 1.0351500511169434, 1.1702213287353516, 1.3052924871444702, 1.4403636455535889, 1.575434923171997, 1.7105060815811157, 1.845577359199524, 1.9806485176086426, 2.115719795227051, 2.250791072845459, 2.385862112045288, 2.5209333896636963, 2.6560044288635254, 2.7910757064819336, 2.9261467456817627, 3.061218023300171, 3.196289300918579, 3.331360340118408, 3.4664316177368164, 3.6015028953552246, 3.736574172973633]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 10.0, 21.0, 32.0, 100.0, 291.0, 701.0, 2907.0, 17730.0, 488714.0, 3650416.0, 26501.0, 4052.0, 1308.0, 566.0, 315.0, 178.0, 106.0, 70.0, 59.0, 38.0, 34.0, 28.0, 15.0, 18.0, 20.0, 7.0, 6.0, 10.0, 4.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8555526733398438, -0.7848358154296875, -0.7141189575195312, -0.643402099609375, -0.5726852416992188, -0.5019683837890625, -0.43125152587890625, -0.36053466796875, -0.28981781005859375, -0.2191009521484375, -0.14838409423828125, -0.077667236328125, -0.00695037841796875, 0.0637664794921875, 0.13448333740234375, 0.2052001953125, 0.27591705322265625, 0.3466339111328125, 0.41735076904296875, 0.488067626953125, 0.5587844848632812, 0.6295013427734375, 0.7002182006835938, 0.77093505859375, 0.8416519165039062, 0.9123687744140625, 0.9830856323242188, 1.053802490234375, 1.1245193481445312, 1.1952362060546875, 1.2659530639648438, 1.336669921875, 1.4073867797851562, 1.4781036376953125, 1.5488204956054688, 1.619537353515625, 1.6902542114257812, 1.7609710693359375, 1.8316879272460938, 1.90240478515625, 1.9731216430664062, 2.0438385009765625, 2.1145553588867188, 2.185272216796875, 2.2559890747070312, 2.3267059326171875, 2.3974227905273438, 2.4681396484375, 2.5388565063476562, 2.6095733642578125, 2.6802902221679688, 2.751007080078125, 2.8217239379882812, 2.8924407958984375, 2.9631576538085938, 3.03387451171875, 3.1045913696289062, 3.1753082275390625, 3.2460250854492188, 3.316741943359375, 3.3874588012695312, 3.4581756591796875, 3.5288925170898438, 3.599609375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 9.0, 17.0, 35.0, 51.0, 76.0, 123.0, 156.0, 162.0, 132.0, 93.0, 66.0, 51.0, 15.0, 9.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14111328125, -0.130462646484375, -0.11981201171875, -0.109161376953125, -0.0985107421875, -0.087860107421875, -0.07720947265625, -0.066558837890625, -0.055908203125, -0.045257568359375, -0.03460693359375, -0.023956298828125, -0.0133056640625, -0.002655029296875, 0.00799560546875, 0.018646240234375, 0.029296875, 0.039947509765625, 0.05059814453125, 0.061248779296875, 0.0718994140625, 0.082550048828125, 0.09320068359375, 0.103851318359375, 0.114501953125, 0.125152587890625, 0.13580322265625, 0.146453857421875, 0.1571044921875, 0.167755126953125, 0.17840576171875, 0.189056396484375, 0.19970703125, 0.210357666015625, 0.22100830078125, 0.231658935546875, 0.2423095703125, 0.252960205078125, 0.26361083984375, 0.274261474609375, 0.284912109375, 0.295562744140625, 0.30621337890625, 0.316864013671875, 0.3275146484375, 0.338165283203125, 0.34881591796875, 0.359466552734375, 0.3701171875, 0.380767822265625, 0.39141845703125, 0.402069091796875, 0.4127197265625, 0.423370361328125, 0.43402099609375, 0.444671630859375, 0.455322265625, 0.465972900390625, 0.47662353515625, 0.487274169921875, 0.4979248046875, 0.508575439453125, 0.51922607421875, 0.529876708984375, 0.54052734375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 26.0, 84.0, 420.0, 4178732.0, 14266.0, 515.0, 140.0, 62.0, 17.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.23394775390625, -5.7843017578125, -5.33465576171875, -4.885009765625, -4.43536376953125, -3.9857177734375, -3.53607177734375, -3.08642578125, -2.63677978515625, -2.1871337890625, -1.73748779296875, -1.287841796875, -0.83819580078125, -0.3885498046875, 0.06109619140625, 0.5107421875, 0.96038818359375, 1.4100341796875, 1.85968017578125, 2.309326171875, 2.75897216796875, 3.2086181640625, 3.65826416015625, 4.10791015625, 4.55755615234375, 5.0072021484375, 5.45684814453125, 5.906494140625, 6.35614013671875, 6.8057861328125, 7.25543212890625, 7.705078125, 8.15472412109375, 8.6043701171875, 9.05401611328125, 9.503662109375, 9.95330810546875, 10.4029541015625, 10.85260009765625, 11.30224609375, 11.75189208984375, 12.2015380859375, 12.65118408203125, 13.100830078125, 13.55047607421875, 14.0001220703125, 14.44976806640625, 14.8994140625, 15.34906005859375, 15.7987060546875, 16.24835205078125, 16.697998046875, 17.14764404296875, 17.5972900390625, 18.04693603515625, 18.49658203125, 18.94622802734375, 19.3958740234375, 19.84552001953125, 20.295166015625, 20.74481201171875, 21.1944580078125, 21.64410400390625, 22.09375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 9.0, 16.0, 50.0, 369.0, 3446.0, 144.0, 26.0, 11.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.321044921875, -0.2821235656738281, -0.24320220947265625, -0.20428085327148438, -0.1653594970703125, -0.12643814086914062, -0.08751678466796875, -0.048595428466796875, -0.009674072265625, 0.029247283935546875, 0.06816864013671875, 0.10708999633789062, 0.1460113525390625, 0.18493270874023438, 0.22385406494140625, 0.2627754211425781, 0.30169677734375, 0.3406181335449219, 0.37953948974609375, 0.4184608459472656, 0.4573822021484375, 0.4963035583496094, 0.5352249145507812, 0.5741462707519531, 0.613067626953125, 0.6519889831542969, 0.6909103393554688, 0.7298316955566406, 0.7687530517578125, 0.8076744079589844, 0.8465957641601562, 0.8855171203613281, 0.9244384765625, 0.9633598327636719, 1.0022811889648438, 1.0412025451660156, 1.0801239013671875, 1.1190452575683594, 1.1579666137695312, 1.1968879699707031, 1.235809326171875, 1.2747306823730469, 1.3136520385742188, 1.3525733947753906, 1.3914947509765625, 1.4304161071777344, 1.4693374633789062, 1.5082588195800781, 1.54718017578125, 1.5861015319824219, 1.6250228881835938, 1.6639442443847656, 1.7028656005859375, 1.7417869567871094, 1.7807083129882812, 1.8196296691894531, 1.858551025390625, 1.8974723815917969, 1.9363937377929688, 1.9753150939941406, 2.0142364501953125, 2.0531578063964844, 2.0920791625976562, 2.131000518798828, 2.169921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 12.0, 42.0, 514.0, 370.0, 42.0, 16.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.468570232391357, -6.208056449890137, -5.947543144226074, -5.6870293617248535, -5.426516056060791, -5.16600227355957, -4.905488967895508, -4.644975185394287, -4.384461402893066, -4.123947620391846, -3.863434314727783, -3.6029205322265625, -3.3424072265625, -3.0818934440612793, -2.8213798999786377, -2.560866355895996, -2.3003530502319336, -2.039839506149292, -1.7793259620666504, -1.5188122987747192, -1.2582987546920776, -0.997785210609436, -0.7372715473175049, -0.4767580032348633, -0.21624445915222168, 0.04426911473274231, 0.3047826886177063, 0.5652962923049927, 0.8258098363876343, 1.0863233804702759, 1.346837043762207, 1.6073505878448486, 1.867863655090332, 2.1283771991729736, 2.3888907432556152, 2.649404525756836, 2.9099178314208984, 3.170431613922119, 3.4309451580047607, 3.6914587020874023, 3.951972246170044, 4.2124857902526855, 4.472999572753906, 4.733512878417969, 4.9940266609191895, 5.254539966583252, 5.515053749084473, 5.775567054748535, 6.036080837249756, 6.296594619750977, 6.557107925415039, 6.81762170791626, 7.078135013580322, 7.338648796081543, 7.5991621017456055, 7.859675884246826, 8.120189666748047, 8.38070297241211, 8.641217231750488, 8.90173053741455, 9.162243843078613, 9.422757148742676, 9.683271408081055, 9.943784713745117, 10.20429801940918]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 6.0, 20.0, 23.0, 44.0, 69.0, 99.0, 88.0, 121.0, 126.0, 115.0, 87.0, 70.0, 49.0, 39.0, 20.0, 12.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5938639640808105, -4.434754848480225, -4.275645732879639, -4.116536617279053, -3.957427501678467, -3.798318386077881, -3.639209270477295, -3.480100154876709, -3.320991039276123, -3.161881923675537, -3.002772808074951, -2.8436636924743652, -2.6845545768737793, -2.5254454612731934, -2.3663363456726074, -2.2072272300720215, -2.0481183528900146, -1.8890092372894287, -1.7299001216888428, -1.5707910060882568, -1.411681890487671, -1.252572774887085, -1.0934637784957886, -0.9343546628952026, -0.7752455472946167, -0.6161364316940308, -0.4570273458957672, -0.29791826009750366, -0.13880914449691772, 0.020299971103668213, 0.17940902709960938, 0.3385181427001953, 0.49762725830078125, 0.6567363739013672, 0.8158454895019531, 0.9749545454978943, 1.134063720703125, 1.293172836303711, 1.4522818326950073, 1.6113909482955933, 1.7705000638961792, 1.9296091794967651, 2.0887181758880615, 2.2478272914886475, 2.4069364070892334, 2.5660455226898193, 2.7251546382904053, 2.884263753890991, 3.043372869491577, 3.202481985092163, 3.361591100692749, 3.520700216293335, 3.679809331893921, 3.838918447494507, 3.9980273246765137, 4.1571364402771, 4.3162455558776855, 4.4753546714782715, 4.634463787078857, 4.793572902679443, 4.952682018280029, 5.111791133880615, 5.270900249481201, 5.430009365081787, 5.589118480682373]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 6.0, 11.0, 10.0, 13.0, 16.0, 24.0, 36.0, 35.0, 68.0, 93.0, 136.0, 184.0, 321.0, 497.0, 932.0, 2201.0, 6660.0, 27247.0, 173226.0, 718571.0, 92728.0, 17234.0, 4663.0, 1669.0, 751.0, 371.0, 228.0, 154.0, 118.0, 85.0, 70.0, 45.0, 27.0, 37.0, 17.0, 20.0, 12.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.0140380859375, -0.978271484375, -0.9425048828125, -0.90673828125, -0.8709716796875, -0.835205078125, -0.7994384765625, -0.763671875, -0.7279052734375, -0.692138671875, -0.6563720703125, -0.62060546875, -0.5848388671875, -0.549072265625, -0.5133056640625, -0.4775390625, -0.4417724609375, -0.406005859375, -0.3702392578125, -0.33447265625, -0.2987060546875, -0.262939453125, -0.2271728515625, -0.19140625, -0.1556396484375, -0.119873046875, -0.0841064453125, -0.04833984375, -0.0125732421875, 0.023193359375, 0.0589599609375, 0.0947265625, 0.1304931640625, 0.166259765625, 0.2020263671875, 0.23779296875, 0.2735595703125, 0.309326171875, 0.3450927734375, 0.380859375, 0.4166259765625, 0.452392578125, 0.4881591796875, 0.52392578125, 0.5596923828125, 0.595458984375, 0.6312255859375, 0.6669921875, 0.7027587890625, 0.738525390625, 0.7742919921875, 0.81005859375, 0.8458251953125, 0.881591796875, 0.9173583984375, 0.953125, 0.9888916015625, 1.024658203125, 1.0604248046875, 1.09619140625, 1.1319580078125, 1.167724609375, 1.2034912109375, 1.2392578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 13.0, 26.0, 42.0, 47.0, 67.0, 90.0, 113.0, 101.0, 128.0, 76.0, 82.0, 72.0, 51.0, 29.0, 24.0, 15.0, 9.0, 7.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26318359375, -0.25064849853515625, -0.2381134033203125, -0.22557830810546875, -0.213043212890625, -0.20050811767578125, -0.1879730224609375, -0.17543792724609375, -0.16290283203125, -0.15036773681640625, -0.1378326416015625, -0.12529754638671875, -0.112762451171875, -0.10022735595703125, -0.0876922607421875, -0.07515716552734375, -0.0626220703125, -0.05008697509765625, -0.0375518798828125, -0.02501678466796875, -0.012481689453125, 5.340576171875e-05, 0.0125885009765625, 0.02512359619140625, 0.03765869140625, 0.05019378662109375, 0.0627288818359375, 0.07526397705078125, 0.087799072265625, 0.10033416748046875, 0.1128692626953125, 0.12540435791015625, 0.137939453125, 0.15047454833984375, 0.1630096435546875, 0.17554473876953125, 0.188079833984375, 0.20061492919921875, 0.2131500244140625, 0.22568511962890625, 0.23822021484375, 0.25075531005859375, 0.2632904052734375, 0.27582550048828125, 0.288360595703125, 0.30089569091796875, 0.3134307861328125, 0.32596588134765625, 0.3385009765625, 0.35103607177734375, 0.3635711669921875, 0.37610626220703125, 0.388641357421875, 0.40117645263671875, 0.4137115478515625, 0.42624664306640625, 0.43878173828125, 0.45131683349609375, 0.4638519287109375, 0.47638702392578125, 0.488922119140625, 0.5014572143554688, 0.5139923095703125, 0.5265274047851562, 0.5390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 9.0, 15.0, 16.0, 18.0, 31.0, 37.0, 56.0, 101.0, 185.0, 502.0, 1941.0, 11831.0, 197825.0, 800550.0, 30255.0, 3743.0, 804.0, 279.0, 122.0, 73.0, 35.0, 21.0, 17.0, 20.0, 12.0, 6.0, 13.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5166015625, -1.472259521484375, -1.42791748046875, -1.383575439453125, -1.3392333984375, -1.294891357421875, -1.25054931640625, -1.206207275390625, -1.161865234375, -1.117523193359375, -1.07318115234375, -1.028839111328125, -0.9844970703125, -0.940155029296875, -0.89581298828125, -0.851470947265625, -0.80712890625, -0.762786865234375, -0.71844482421875, -0.674102783203125, -0.6297607421875, -0.585418701171875, -0.54107666015625, -0.496734619140625, -0.452392578125, -0.408050537109375, -0.36370849609375, -0.319366455078125, -0.2750244140625, -0.230682373046875, -0.18634033203125, -0.141998291015625, -0.09765625, -0.053314208984375, -0.00897216796875, 0.035369873046875, 0.0797119140625, 0.124053955078125, 0.16839599609375, 0.212738037109375, 0.257080078125, 0.301422119140625, 0.34576416015625, 0.390106201171875, 0.4344482421875, 0.478790283203125, 0.52313232421875, 0.567474365234375, 0.61181640625, 0.656158447265625, 0.70050048828125, 0.744842529296875, 0.7891845703125, 0.833526611328125, 0.87786865234375, 0.922210693359375, 0.966552734375, 1.010894775390625, 1.05523681640625, 1.099578857421875, 1.1439208984375, 1.188262939453125, 1.23260498046875, 1.276947021484375, 1.3212890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 10.0, 16.0, 9.0, 19.0, 22.0, 24.0, 34.0, 38.0, 44.0, 47.0, 59.0, 65.0, 70.0, 53.0, 60.0, 53.0, 65.0, 60.0, 36.0, 41.0, 33.0, 29.0, 11.0, 18.0, 20.0, 11.0, 5.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0185546875, -0.9882659912109375, -0.957977294921875, -0.9276885986328125, -0.89739990234375, -0.8671112060546875, -0.836822509765625, -0.8065338134765625, -0.7762451171875, -0.7459564208984375, -0.715667724609375, -0.6853790283203125, -0.65509033203125, -0.6248016357421875, -0.594512939453125, -0.5642242431640625, -0.533935546875, -0.5036468505859375, -0.473358154296875, -0.4430694580078125, -0.41278076171875, -0.3824920654296875, -0.352203369140625, -0.3219146728515625, -0.2916259765625, -0.2613372802734375, -0.231048583984375, -0.2007598876953125, -0.17047119140625, -0.1401824951171875, -0.109893798828125, -0.0796051025390625, -0.04931640625, -0.0190277099609375, 0.011260986328125, 0.0415496826171875, 0.07183837890625, 0.1021270751953125, 0.132415771484375, 0.1627044677734375, 0.1929931640625, 0.2232818603515625, 0.253570556640625, 0.2838592529296875, 0.31414794921875, 0.3444366455078125, 0.374725341796875, 0.4050140380859375, 0.435302734375, 0.4655914306640625, 0.495880126953125, 0.5261688232421875, 0.55645751953125, 0.5867462158203125, 0.617034912109375, 0.6473236083984375, 0.6776123046875, 0.7079010009765625, 0.738189697265625, 0.7684783935546875, 0.79876708984375, 0.8290557861328125, 0.859344482421875, 0.8896331787109375, 0.919921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 12.0, 8.0, 10.0, 11.0, 25.0, 28.0, 50.0, 88.0, 156.0, 363.0, 945.0, 3093.0, 18833.0, 651371.0, 357076.0, 12580.0, 2442.0, 743.0, 309.0, 142.0, 79.0, 52.0, 34.0, 25.0, 17.0, 8.0, 8.0, 7.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.34375, -0.3326301574707031, -0.32151031494140625, -0.3103904724121094, -0.2992706298828125, -0.2881507873535156, -0.27703094482421875, -0.2659111022949219, -0.254791259765625, -0.24367141723632812, -0.23255157470703125, -0.22143173217773438, -0.2103118896484375, -0.19919204711914062, -0.18807220458984375, -0.17695236206054688, -0.16583251953125, -0.15471267700195312, -0.14359283447265625, -0.13247299194335938, -0.1213531494140625, -0.11023330688476562, -0.09911346435546875, -0.08799362182617188, -0.076873779296875, -0.06575393676757812, -0.05463409423828125, -0.043514251708984375, -0.0323944091796875, -0.021274566650390625, -0.01015472412109375, 0.000965118408203125, 0.0120849609375, 0.023204803466796875, 0.03432464599609375, 0.045444488525390625, 0.0565643310546875, 0.06768417358398438, 0.07880401611328125, 0.08992385864257812, 0.101043701171875, 0.11216354370117188, 0.12328338623046875, 0.13440322875976562, 0.1455230712890625, 0.15664291381835938, 0.16776275634765625, 0.17888259887695312, 0.19000244140625, 0.20112228393554688, 0.21224212646484375, 0.22336196899414062, 0.2344818115234375, 0.24560165405273438, 0.25672149658203125, 0.2678413391113281, 0.278961181640625, 0.2900810241699219, 0.30120086669921875, 0.3123207092285156, 0.3234405517578125, 0.3345603942871094, 0.34568023681640625, 0.3568000793457031, 0.367919921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 8.0, 5.0, 12.0, 12.0, 18.0, 22.0, 39.0, 45.0, 67.0, 77.0, 61.0, 75.0, 76.0, 76.0, 97.0, 60.0, 69.0, 38.0, 23.0, 25.0, 24.0, 18.0, 15.0, 8.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.7222948372364044e-05, -1.662410795688629e-05, -1.602526754140854e-05, -1.5426427125930786e-05, -1.4827586710453033e-05, -1.422874629497528e-05, -1.3629905879497528e-05, -1.3031065464019775e-05, -1.2432225048542023e-05, -1.183338463306427e-05, -1.1234544217586517e-05, -1.0635703802108765e-05, -1.0036863386631012e-05, -9.43802297115326e-06, -8.839182555675507e-06, -8.240342140197754e-06, -7.641501724720001e-06, -7.0426613092422485e-06, -6.443820893764496e-06, -5.844980478286743e-06, -5.2461400628089905e-06, -4.647299647331238e-06, -4.048459231853485e-06, -3.4496188163757324e-06, -2.8507784008979797e-06, -2.251937985420227e-06, -1.6530975699424744e-06, -1.0542571544647217e-06, -4.55416738986969e-07, 1.434236764907837e-07, 7.422640919685364e-07, 1.341104507446289e-06, 1.9399449229240417e-06, 2.5387853384017944e-06, 3.137625753879547e-06, 3.7364661693573e-06, 4.3353065848350525e-06, 4.934147000312805e-06, 5.532987415790558e-06, 6.1318278312683105e-06, 6.730668246746063e-06, 7.329508662223816e-06, 7.928349077701569e-06, 8.527189493179321e-06, 9.126029908657074e-06, 9.724870324134827e-06, 1.032371073961258e-05, 1.0922551155090332e-05, 1.1521391570568085e-05, 1.2120231986045837e-05, 1.271907240152359e-05, 1.3317912817001343e-05, 1.3916753232479095e-05, 1.4515593647956848e-05, 1.51144340634346e-05, 1.5713274478912354e-05, 1.6312114894390106e-05, 1.691095530986786e-05, 1.750979572534561e-05, 1.8108636140823364e-05, 1.8707476556301117e-05, 1.930631697177887e-05, 1.9905157387256622e-05, 2.0503997802734375e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 9.0, 10.0, 12.0, 38.0, 58.0, 113.0, 295.0, 807.0, 3151.0, 31545.0, 908156.0, 96904.0, 5496.0, 1204.0, 406.0, 165.0, 82.0, 38.0, 23.0, 11.0, 12.0, 5.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.349609375, -0.33820343017578125, -0.3267974853515625, -0.31539154052734375, -0.303985595703125, -0.29257965087890625, -0.2811737060546875, -0.26976776123046875, -0.25836181640625, -0.24695587158203125, -0.2355499267578125, -0.22414398193359375, -0.212738037109375, -0.20133209228515625, -0.1899261474609375, -0.17852020263671875, -0.1671142578125, -0.15570831298828125, -0.1443023681640625, -0.13289642333984375, -0.121490478515625, -0.11008453369140625, -0.0986785888671875, -0.08727264404296875, -0.07586669921875, -0.06446075439453125, -0.0530548095703125, -0.04164886474609375, -0.030242919921875, -0.01883697509765625, -0.0074310302734375, 0.00397491455078125, 0.015380859375, 0.02678680419921875, 0.0381927490234375, 0.04959869384765625, 0.061004638671875, 0.07241058349609375, 0.0838165283203125, 0.09522247314453125, 0.10662841796875, 0.11803436279296875, 0.1294403076171875, 0.14084625244140625, 0.152252197265625, 0.16365814208984375, 0.1750640869140625, 0.18647003173828125, 0.1978759765625, 0.20928192138671875, 0.2206878662109375, 0.23209381103515625, 0.243499755859375, 0.25490570068359375, 0.2663116455078125, 0.27771759033203125, 0.28912353515625, 0.30052947998046875, 0.3119354248046875, 0.32334136962890625, 0.334747314453125, 0.34615325927734375, 0.3575592041015625, 0.36896514892578125, 0.38037109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 9.0, 6.0, 7.0, 16.0, 25.0, 30.0, 56.0, 83.0, 140.0, 183.0, 149.0, 120.0, 69.0, 36.0, 18.0, 18.0, 7.0, 9.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.2351837158203125, -0.226959228515625, -0.2187347412109375, -0.21051025390625, -0.2022857666015625, -0.194061279296875, -0.1858367919921875, -0.1776123046875, -0.1693878173828125, -0.161163330078125, -0.1529388427734375, -0.14471435546875, -0.1364898681640625, -0.128265380859375, -0.1200408935546875, -0.11181640625, -0.1035919189453125, -0.095367431640625, -0.0871429443359375, -0.07891845703125, -0.0706939697265625, -0.062469482421875, -0.0542449951171875, -0.0460205078125, -0.0377960205078125, -0.029571533203125, -0.0213470458984375, -0.01312255859375, -0.0048980712890625, 0.003326416015625, 0.0115509033203125, 0.019775390625, 0.0279998779296875, 0.036224365234375, 0.0444488525390625, 0.05267333984375, 0.0608978271484375, 0.069122314453125, 0.0773468017578125, 0.0855712890625, 0.0937957763671875, 0.102020263671875, 0.1102447509765625, 0.11846923828125, 0.1266937255859375, 0.134918212890625, 0.1431427001953125, 0.1513671875, 0.1595916748046875, 0.167816162109375, 0.1760406494140625, 0.18426513671875, 0.1924896240234375, 0.200714111328125, 0.2089385986328125, 0.2171630859375, 0.2253875732421875, 0.233612060546875, 0.2418365478515625, 0.25006103515625, 0.2582855224609375, 0.266510009765625, 0.2747344970703125, 0.282958984375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 13.0, 15.0, 37.0, 62.0, 128.0, 331.0, 257.0, 84.0, 32.0, 17.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9143617153167725, -2.7317936420440674, -2.5492255687713623, -2.366657257080078, -2.184089183807373, -2.001521110534668, -1.818953037261963, -1.6363849639892578, -1.4538168907165527, -1.2712488174438477, -1.0886807441711426, -0.906112551689148, -0.7235444784164429, -0.5409764051437378, -0.35840821266174316, -0.17584013938903809, 0.006727933883666992, 0.18929603695869446, 0.3718641400337219, 0.5544322729110718, 0.7370003461837769, 0.9195684194564819, 1.1021366119384766, 1.2847046852111816, 1.4672727584838867, 1.6498408317565918, 1.8324089050292969, 2.014976978302002, 2.197545051574707, 2.380113124847412, 2.5626814365386963, 2.7452495098114014, 2.9278173446655273, 3.1103854179382324, 3.2929534912109375, 3.4755215644836426, 3.6580896377563477, 3.8406577110290527, 4.023225784301758, 4.205794334411621, 4.388361930847168, 4.570930004119873, 4.753498077392578, 4.936066150665283, 5.118634223937988, 5.301202297210693, 5.483770370483398, 5.666338920593262, 5.848906993865967, 6.031475067138672, 6.214043140411377, 6.396611213684082, 6.579179286956787, 6.761747360229492, 6.9443159103393555, 7.126883506774902, 7.309452056884766, 7.492020130157471, 7.674588203430176, 7.857156276702881, 8.039724349975586, 8.22229290008545, 8.404860496520996, 8.58742904663086, 8.769996643066406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 7.0, 2.0, 10.0, 7.0, 16.0, 21.0, 26.0, 24.0, 22.0, 23.0, 41.0, 30.0, 49.0, 50.0, 57.0, 58.0, 66.0, 51.0, 47.0, 49.0, 47.0, 49.0, 49.0, 37.0, 31.0, 27.0, 13.0, 20.0, 12.0, 17.0, 7.0, 7.0, 4.0, 6.0, 10.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.621009826660156, -4.4645256996154785, -4.308041572570801, -4.151557445526123, -3.9950733184814453, -3.8385891914367676, -3.68210506439209, -3.525620937347412, -3.3691368103027344, -3.2126526832580566, -3.056168556213379, -2.899684429168701, -2.7432003021240234, -2.5867161750793457, -2.430232048034668, -2.2737479209899902, -2.1172635555267334, -1.9607794284820557, -1.804295301437378, -1.6478111743927002, -1.4913270473480225, -1.3348429203033447, -1.1783586740493774, -1.0218745470046997, -0.865390419960022, -0.7089062929153442, -0.5524221658706665, -0.395937979221344, -0.23945385217666626, -0.08296972513198853, 0.07351446151733398, 0.22999858856201172, 0.38648271560668945, 0.5429668426513672, 0.6994509696960449, 0.8559351563453674, 1.0124192237854004, 1.1689033508300781, 1.3253875970840454, 1.4818717241287231, 1.6383558511734009, 1.7948399782180786, 1.9513241052627563, 2.1078083515167236, 2.2642924785614014, 2.420776605606079, 2.577260732650757, 2.7337448596954346, 2.8902289867401123, 3.04671311378479, 3.2031972408294678, 3.3596813678741455, 3.5161654949188232, 3.672649621963501, 3.829133987426758, 3.9856181144714355, 4.142102241516113, 4.298586368560791, 4.455070495605469, 4.6115546226501465, 4.768038749694824, 4.924522876739502, 5.08100700378418, 5.237491130828857, 5.393975257873535]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 8.0, 6.0, 20.0, 28.0, 37.0, 60.0, 101.0, 177.0, 315.0, 560.0, 1198.0, 2834.0, 7543.0, 26374.0, 190763.0, 3808742.0, 122035.0, 20810.0, 6495.0, 2726.0, 1335.0, 682.0, 412.0, 282.0, 170.0, 119.0, 101.0, 62.0, 58.0, 43.0, 32.0, 22.0, 25.0, 20.0, 15.0, 17.0, 10.0, 8.0, 12.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.6664657592773438, -0.6302947998046875, -0.5941238403320312, -0.557952880859375, -0.5217819213867188, -0.4856109619140625, -0.44944000244140625, -0.41326904296875, -0.37709808349609375, -0.3409271240234375, -0.30475616455078125, -0.268585205078125, -0.23241424560546875, -0.1962432861328125, -0.16007232666015625, -0.1239013671875, -0.08773040771484375, -0.0515594482421875, -0.01538848876953125, 0.020782470703125, 0.05695343017578125, 0.0931243896484375, 0.12929534912109375, 0.16546630859375, 0.20163726806640625, 0.2378082275390625, 0.27397918701171875, 0.310150146484375, 0.34632110595703125, 0.3824920654296875, 0.41866302490234375, 0.454833984375, 0.49100494384765625, 0.5271759033203125, 0.5633468627929688, 0.599517822265625, 0.6356887817382812, 0.6718597412109375, 0.7080307006835938, 0.74420166015625, 0.7803726196289062, 0.8165435791015625, 0.8527145385742188, 0.888885498046875, 0.9250564575195312, 0.9612274169921875, 0.9973983764648438, 1.0335693359375, 1.0697402954101562, 1.1059112548828125, 1.1420822143554688, 1.178253173828125, 1.2144241333007812, 1.2505950927734375, 1.2867660522460938, 1.32293701171875, 1.3591079711914062, 1.3952789306640625, 1.4314498901367188, 1.467620849609375, 1.5037918090820312, 1.5399627685546875, 1.5761337280273438, 1.6123046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 25.0, 33.0, 56.0, 71.0, 82.0, 93.0, 98.0, 108.0, 106.0, 78.0, 71.0, 50.0, 48.0, 17.0, 15.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271484375, -0.25862884521484375, -0.2457733154296875, -0.23291778564453125, -0.220062255859375, -0.20720672607421875, -0.1943511962890625, -0.18149566650390625, -0.16864013671875, -0.15578460693359375, -0.1429290771484375, -0.13007354736328125, -0.117218017578125, -0.10436248779296875, -0.0915069580078125, -0.07865142822265625, -0.0657958984375, -0.05294036865234375, -0.0400848388671875, -0.02722930908203125, -0.014373779296875, -0.00151824951171875, 0.0113372802734375, 0.02419281005859375, 0.03704833984375, 0.04990386962890625, 0.0627593994140625, 0.07561492919921875, 0.088470458984375, 0.10132598876953125, 0.1141815185546875, 0.12703704833984375, 0.139892578125, 0.15274810791015625, 0.1656036376953125, 0.17845916748046875, 0.191314697265625, 0.20417022705078125, 0.2170257568359375, 0.22988128662109375, 0.24273681640625, 0.25559234619140625, 0.2684478759765625, 0.28130340576171875, 0.294158935546875, 0.30701446533203125, 0.3198699951171875, 0.33272552490234375, 0.3455810546875, 0.35843658447265625, 0.3712921142578125, 0.38414764404296875, 0.397003173828125, 0.40985870361328125, 0.4227142333984375, 0.43556976318359375, 0.44842529296875, 0.46128082275390625, 0.4741363525390625, 0.48699188232421875, 0.499847412109375, 0.5127029418945312, 0.5255584716796875, 0.5384140014648438, 0.55126953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 12.0, 21.0, 46.0, 69.0, 136.0, 289.0, 1568.0, 4189570.0, 2103.0, 267.0, 109.0, 51.0, 17.0, 17.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.96734619140625, -11.6925048828125, -11.41766357421875, -11.142822265625, -10.86798095703125, -10.5931396484375, -10.31829833984375, -10.04345703125, -9.76861572265625, -9.4937744140625, -9.21893310546875, -8.944091796875, -8.66925048828125, -8.3944091796875, -8.11956787109375, -7.8447265625, -7.56988525390625, -7.2950439453125, -7.02020263671875, -6.745361328125, -6.47052001953125, -6.1956787109375, -5.92083740234375, -5.64599609375, -5.37115478515625, -5.0963134765625, -4.82147216796875, -4.546630859375, -4.27178955078125, -3.9969482421875, -3.72210693359375, -3.447265625, -3.17242431640625, -2.8975830078125, -2.62274169921875, -2.347900390625, -2.07305908203125, -1.7982177734375, -1.52337646484375, -1.24853515625, -0.97369384765625, -0.6988525390625, -0.42401123046875, -0.149169921875, 0.12567138671875, 0.4005126953125, 0.67535400390625, 0.9501953125, 1.22503662109375, 1.4998779296875, 1.77471923828125, 2.049560546875, 2.32440185546875, 2.5992431640625, 2.87408447265625, 3.14892578125, 3.42376708984375, 3.6986083984375, 3.97344970703125, 4.248291015625, 4.52313232421875, 4.7979736328125, 5.07281494140625, 5.34765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 18.0, 44.0, 2860.0, 1099.0, 49.0, 12.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.2476882934570312, -2.1965484619140625, -2.1454086303710938, -2.094268798828125, -2.0431289672851562, -1.9919891357421875, -1.9408493041992188, -1.88970947265625, -1.8385696411132812, -1.7874298095703125, -1.7362899780273438, -1.685150146484375, -1.6340103149414062, -1.5828704833984375, -1.5317306518554688, -1.4805908203125, -1.4294509887695312, -1.3783111572265625, -1.3271713256835938, -1.276031494140625, -1.2248916625976562, -1.1737518310546875, -1.1226119995117188, -1.07147216796875, -1.0203323364257812, -0.9691925048828125, -0.9180526733398438, -0.866912841796875, -0.8157730102539062, -0.7646331787109375, -0.7134933471679688, -0.662353515625, -0.6112136840820312, -0.5600738525390625, -0.5089340209960938, -0.457794189453125, -0.40665435791015625, -0.3555145263671875, -0.30437469482421875, -0.25323486328125, -0.20209503173828125, -0.1509552001953125, -0.09981536865234375, -0.048675537109375, 0.00246429443359375, 0.0536041259765625, 0.10474395751953125, 0.1558837890625, 0.20702362060546875, 0.2581634521484375, 0.30930328369140625, 0.360443115234375, 0.41158294677734375, 0.4627227783203125, 0.5138626098632812, 0.56500244140625, 0.6161422729492188, 0.6672821044921875, 0.7184219360351562, 0.769561767578125, 0.8207015991210938, 0.8718414306640625, 0.9229812622070312, 0.97412109375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 893.0, 108.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.087545394897461, -10.620718002319336, -10.153890609741211, -9.687063217163086, -9.220235824584961, -8.753408432006836, -8.286581039428711, -7.8197526931762695, -7.3529253005981445, -6.8860979080200195, -6.4192705154418945, -5.9524431228637695, -5.485615253448486, -5.018787860870361, -4.551960468292236, -4.085132598876953, -3.6183056831359863, -3.1514782905578613, -2.6846506595611572, -2.2178232669830322, -1.7509957551956177, -1.2841682434082031, -0.8173408508300781, -0.350513219833374, 0.11631417274475098, 0.5831416845321655, 1.04996919631958, 1.516796588897705, 1.9836241006851196, 2.450451612472534, 2.917279005050659, 3.3841066360473633, 3.8509340286254883, 4.317761421203613, 4.784588813781738, 5.251416206359863, 5.7182440757751465, 6.1850714683532715, 6.6518988609313965, 7.11872673034668, 7.585554122924805, 8.05238151550293, 8.519208908081055, 8.98603630065918, 9.452863693237305, 9.91969108581543, 10.386518478393555, 10.853346824645996, 11.320173263549805, 11.78700065612793, 12.253828048706055, 12.72065544128418, 13.187482833862305, 13.65431022644043, 14.121137619018555, 14.587965965270996, 15.054793357849121, 15.521620750427246, 15.988448143005371, 16.455276489257812, 16.922103881835938, 17.388931274414062, 17.855758666992188, 18.322586059570312, 18.789413452148438]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 4.0, 16.0, 27.0, 44.0, 70.0, 88.0, 129.0, 121.0, 125.0, 108.0, 95.0, 73.0, 41.0, 26.0, 21.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.228074073791504, -2.1390023231506348, -2.0499305725097656, -1.9608588218688965, -1.8717870712280273, -1.7827153205871582, -1.693643569946289, -1.60457181930542, -1.5155000686645508, -1.4264283180236816, -1.3373565673828125, -1.2482848167419434, -1.1592130661010742, -1.070141315460205, -0.9810695648193359, -0.8919978141784668, -0.8029260635375977, -0.7138543128967285, -0.6247825622558594, -0.5357108116149902, -0.4466390609741211, -0.35756731033325195, -0.2684955596923828, -0.17942380905151367, -0.09035205841064453, -0.0012803077697753906, 0.08779144287109375, 0.1768631935119629, 0.26593494415283203, 0.35500669479370117, 0.4440784454345703, 0.5331501960754395, 0.6222219467163086, 0.7112936973571777, 0.8003654479980469, 0.889437198638916, 0.9785089492797852, 1.0675806999206543, 1.1566524505615234, 1.2457242012023926, 1.3347959518432617, 1.4238677024841309, 1.512939453125, 1.6020112037658691, 1.6910829544067383, 1.7801547050476074, 1.8692264556884766, 1.9582982063293457, 2.047369956970215, 2.136441707611084, 2.225513458251953, 2.3145852088928223, 2.4036569595336914, 2.4927287101745605, 2.5818004608154297, 2.670872211456299, 2.759943962097168, 2.849015712738037, 2.9380874633789062, 3.0271592140197754, 3.1162309646606445, 3.2053027153015137, 3.294374465942383, 3.383446216583252, 3.472517967224121]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 19.0, 27.0, 41.0, 53.0, 76.0, 113.0, 221.0, 441.0, 853.0, 1978.0, 6274.0, 30174.0, 294511.0, 645111.0, 54181.0, 9519.0, 2578.0, 1086.0, 547.0, 268.0, 183.0, 94.0, 60.0, 38.0, 29.0, 13.0, 13.0, 15.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09375, -1.0586395263671875, -1.023529052734375, -0.9884185791015625, -0.95330810546875, -0.9181976318359375, -0.883087158203125, -0.8479766845703125, -0.8128662109375, -0.7777557373046875, -0.742645263671875, -0.7075347900390625, -0.67242431640625, -0.6373138427734375, -0.602203369140625, -0.5670928955078125, -0.531982421875, -0.4968719482421875, -0.461761474609375, -0.4266510009765625, -0.39154052734375, -0.3564300537109375, -0.321319580078125, -0.2862091064453125, -0.2510986328125, -0.2159881591796875, -0.180877685546875, -0.1457672119140625, -0.11065673828125, -0.0755462646484375, -0.040435791015625, -0.0053253173828125, 0.02978515625, 0.0648956298828125, 0.100006103515625, 0.1351165771484375, 0.17022705078125, 0.2053375244140625, 0.240447998046875, 0.2755584716796875, 0.3106689453125, 0.3457794189453125, 0.380889892578125, 0.4160003662109375, 0.45111083984375, 0.4862213134765625, 0.521331787109375, 0.5564422607421875, 0.591552734375, 0.6266632080078125, 0.661773681640625, 0.6968841552734375, 0.73199462890625, 0.7671051025390625, 0.802215576171875, 0.8373260498046875, 0.8724365234375, 0.9075469970703125, 0.942657470703125, 0.9777679443359375, 1.01287841796875, 1.0479888916015625, 1.083099365234375, 1.1182098388671875, 1.1533203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 14.0, 30.0, 38.0, 32.0, 61.0, 54.0, 84.0, 83.0, 101.0, 91.0, 85.0, 77.0, 57.0, 55.0, 39.0, 22.0, 33.0, 10.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.250244140625, -0.23934173583984375, -0.2284393310546875, -0.21753692626953125, -0.206634521484375, -0.19573211669921875, -0.1848297119140625, -0.17392730712890625, -0.16302490234375, -0.15212249755859375, -0.1412200927734375, -0.13031768798828125, -0.119415283203125, -0.10851287841796875, -0.0976104736328125, -0.08670806884765625, -0.0758056640625, -0.06490325927734375, -0.0540008544921875, -0.04309844970703125, -0.032196044921875, -0.02129364013671875, -0.0103912353515625, 0.00051116943359375, 0.01141357421875, 0.02231597900390625, 0.0332183837890625, 0.04412078857421875, 0.055023193359375, 0.06592559814453125, 0.0768280029296875, 0.08773040771484375, 0.0986328125, 0.10953521728515625, 0.1204376220703125, 0.13134002685546875, 0.142242431640625, 0.15314483642578125, 0.1640472412109375, 0.17494964599609375, 0.18585205078125, 0.19675445556640625, 0.2076568603515625, 0.21855926513671875, 0.229461669921875, 0.24036407470703125, 0.2512664794921875, 0.26216888427734375, 0.2730712890625, 0.28397369384765625, 0.2948760986328125, 0.30577850341796875, 0.316680908203125, 0.32758331298828125, 0.3384857177734375, 0.34938812255859375, 0.36029052734375, 0.37119293212890625, 0.3820953369140625, 0.39299774169921875, 0.403900146484375, 0.41480255126953125, 0.4257049560546875, 0.43660736083984375, 0.447509765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 9.0, 9.0, 10.0, 18.0, 17.0, 40.0, 49.0, 112.0, 228.0, 542.0, 1697.0, 7876.0, 76144.0, 883063.0, 68676.0, 7316.0, 1708.0, 524.0, 226.0, 91.0, 55.0, 39.0, 37.0, 16.0, 10.0, 7.0, 4.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.2197113037109375, -1.169891357421875, -1.1200714111328125, -1.07025146484375, -1.0204315185546875, -0.970611572265625, -0.9207916259765625, -0.8709716796875, -0.8211517333984375, -0.771331787109375, -0.7215118408203125, -0.67169189453125, -0.6218719482421875, -0.572052001953125, -0.5222320556640625, -0.472412109375, -0.4225921630859375, -0.372772216796875, -0.3229522705078125, -0.27313232421875, -0.2233123779296875, -0.173492431640625, -0.1236724853515625, -0.0738525390625, -0.0240325927734375, 0.025787353515625, 0.0756072998046875, 0.12542724609375, 0.1752471923828125, 0.225067138671875, 0.2748870849609375, 0.32470703125, 0.3745269775390625, 0.424346923828125, 0.4741668701171875, 0.52398681640625, 0.5738067626953125, 0.623626708984375, 0.6734466552734375, 0.7232666015625, 0.7730865478515625, 0.822906494140625, 0.8727264404296875, 0.92254638671875, 0.9723663330078125, 1.022186279296875, 1.0720062255859375, 1.121826171875, 1.1716461181640625, 1.221466064453125, 1.2712860107421875, 1.32110595703125, 1.3709259033203125, 1.420745849609375, 1.4705657958984375, 1.5203857421875, 1.5702056884765625, 1.620025634765625, 1.6698455810546875, 1.71966552734375, 1.7694854736328125, 1.819305419921875, 1.8691253662109375, 1.9189453125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 11.0, 13.0, 12.0, 26.0, 28.0, 55.0, 44.0, 53.0, 63.0, 74.0, 59.0, 83.0, 84.0, 70.0, 67.0, 54.0, 38.0, 27.0, 27.0, 23.0, 20.0, 10.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0537109375, -1.011962890625, -0.97021484375, -0.928466796875, -0.88671875, -0.844970703125, -0.80322265625, -0.761474609375, -0.7197265625, -0.677978515625, -0.63623046875, -0.594482421875, -0.552734375, -0.510986328125, -0.46923828125, -0.427490234375, -0.3857421875, -0.343994140625, -0.30224609375, -0.260498046875, -0.21875, -0.177001953125, -0.13525390625, -0.093505859375, -0.0517578125, -0.010009765625, 0.03173828125, 0.073486328125, 0.115234375, 0.156982421875, 0.19873046875, 0.240478515625, 0.2822265625, 0.323974609375, 0.36572265625, 0.407470703125, 0.44921875, 0.490966796875, 0.53271484375, 0.574462890625, 0.6162109375, 0.657958984375, 0.69970703125, 0.741455078125, 0.783203125, 0.824951171875, 0.86669921875, 0.908447265625, 0.9501953125, 0.991943359375, 1.03369140625, 1.075439453125, 1.1171875, 1.158935546875, 1.20068359375, 1.242431640625, 1.2841796875, 1.325927734375, 1.36767578125, 1.409423828125, 1.451171875, 1.492919921875, 1.53466796875, 1.576416015625, 1.6181640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 12.0, 12.0, 12.0, 31.0, 33.0, 62.0, 108.0, 180.0, 368.0, 843.0, 2345.0, 12426.0, 389794.0, 621302.0, 16272.0, 2862.0, 971.0, 388.0, 212.0, 114.0, 67.0, 34.0, 22.0, 28.0, 14.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.3858909606933594, -0.37261199951171875, -0.3593330383300781, -0.3460540771484375, -0.3327751159667969, -0.31949615478515625, -0.3062171936035156, -0.292938232421875, -0.2796592712402344, -0.26638031005859375, -0.2531013488769531, -0.2398223876953125, -0.22654342651367188, -0.21326446533203125, -0.19998550415039062, -0.18670654296875, -0.17342758178710938, -0.16014862060546875, -0.14686965942382812, -0.1335906982421875, -0.12031173706054688, -0.10703277587890625, -0.09375381469726562, -0.080474853515625, -0.06719589233398438, -0.05391693115234375, -0.040637969970703125, -0.0273590087890625, -0.014080047607421875, -0.00080108642578125, 0.012477874755859375, 0.0257568359375, 0.039035797119140625, 0.05231475830078125, 0.06559371948242188, 0.0788726806640625, 0.09215164184570312, 0.10543060302734375, 0.11870956420898438, 0.131988525390625, 0.14526748657226562, 0.15854644775390625, 0.17182540893554688, 0.1851043701171875, 0.19838333129882812, 0.21166229248046875, 0.22494125366210938, 0.23822021484375, 0.2514991760253906, 0.26477813720703125, 0.2780570983886719, 0.2913360595703125, 0.3046150207519531, 0.31789398193359375, 0.3311729431152344, 0.344451904296875, 0.3577308654785156, 0.37100982666015625, 0.3842887878417969, 0.3975677490234375, 0.4108467102050781, 0.42412567138671875, 0.4374046325683594, 0.45068359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 13.0, 33.0, 51.0, 109.0, 177.0, 224.0, 182.0, 98.0, 57.0, 23.0, 13.0, 8.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.295608520507812e-05, -7.131509482860565e-05, -6.967410445213318e-05, -6.80331140756607e-05, -6.639212369918823e-05, -6.475113332271576e-05, -6.311014294624329e-05, -6.146915256977081e-05, -5.982816219329834e-05, -5.818717181682587e-05, -5.6546181440353394e-05, -5.490519106388092e-05, -5.326420068740845e-05, -5.1623210310935974e-05, -4.99822199344635e-05, -4.834122955799103e-05, -4.6700239181518555e-05, -4.505924880504608e-05, -4.341825842857361e-05, -4.1777268052101135e-05, -4.013627767562866e-05, -3.849528729915619e-05, -3.6854296922683716e-05, -3.521330654621124e-05, -3.357231616973877e-05, -3.1931325793266296e-05, -3.0290335416793823e-05, -2.864934504032135e-05, -2.7008354663848877e-05, -2.5367364287376404e-05, -2.372637391090393e-05, -2.2085383534431458e-05, -2.0444393157958984e-05, -1.880340278148651e-05, -1.7162412405014038e-05, -1.5521422028541565e-05, -1.3880431652069092e-05, -1.2239441275596619e-05, -1.0598450899124146e-05, -8.957460522651672e-06, -7.316470146179199e-06, -5.675479769706726e-06, -4.034489393234253e-06, -2.3934990167617798e-06, -7.525086402893066e-07, 8.884817361831665e-07, 2.5294721126556396e-06, 4.170462489128113e-06, 5.811452865600586e-06, 7.452443242073059e-06, 9.093433618545532e-06, 1.0734423995018005e-05, 1.2375414371490479e-05, 1.4016404747962952e-05, 1.5657395124435425e-05, 1.7298385500907898e-05, 1.893937587738037e-05, 2.0580366253852844e-05, 2.2221356630325317e-05, 2.386234700679779e-05, 2.5503337383270264e-05, 2.7144327759742737e-05, 2.878531813621521e-05, 3.0426308512687683e-05, 3.2067298889160156e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 6.0, 9.0, 7.0, 23.0, 36.0, 61.0, 142.0, 238.0, 671.0, 2747.0, 25328.0, 914037.0, 98298.0, 5257.0, 1027.0, 327.0, 158.0, 93.0, 33.0, 21.0, 14.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.62841796875, -0.6143531799316406, -0.6002883911132812, -0.5862236022949219, -0.5721588134765625, -0.5580940246582031, -0.5440292358398438, -0.5299644470214844, -0.515899658203125, -0.5018348693847656, -0.48777008056640625, -0.4737052917480469, -0.4596405029296875, -0.4455757141113281, -0.43151092529296875, -0.4174461364746094, -0.40338134765625, -0.3893165588378906, -0.37525177001953125, -0.3611869812011719, -0.3471221923828125, -0.3330574035644531, -0.31899261474609375, -0.3049278259277344, -0.290863037109375, -0.2767982482910156, -0.26273345947265625, -0.24866867065429688, -0.2346038818359375, -0.22053909301757812, -0.20647430419921875, -0.19240951538085938, -0.1783447265625, -0.16427993774414062, -0.15021514892578125, -0.13615036010742188, -0.1220855712890625, -0.10802078247070312, -0.09395599365234375, -0.07989120483398438, -0.065826416015625, -0.051761627197265625, -0.03769683837890625, -0.023632049560546875, -0.0095672607421875, 0.004497528076171875, 0.01856231689453125, 0.032627105712890625, 0.04669189453125, 0.060756683349609375, 0.07482147216796875, 0.08888626098632812, 0.1029510498046875, 0.11701583862304688, 0.13108062744140625, 0.14514541625976562, 0.159210205078125, 0.17327499389648438, 0.18733978271484375, 0.20140457153320312, 0.2154693603515625, 0.22953414916992188, 0.24359893798828125, 0.2576637268066406, 0.271728515625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 11.0, 14.0, 19.0, 31.0, 63.0, 117.0, 202.0, 200.0, 151.0, 72.0, 46.0, 23.0, 20.0, 10.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.55908203125, -0.5475196838378906, -0.5359573364257812, -0.5243949890136719, -0.5128326416015625, -0.5012702941894531, -0.48970794677734375, -0.4781455993652344, -0.466583251953125, -0.4550209045410156, -0.44345855712890625, -0.4318962097167969, -0.4203338623046875, -0.4087715148925781, -0.39720916748046875, -0.3856468200683594, -0.37408447265625, -0.3625221252441406, -0.35095977783203125, -0.3393974304199219, -0.3278350830078125, -0.3162727355957031, -0.30471038818359375, -0.2931480407714844, -0.281585693359375, -0.2700233459472656, -0.25846099853515625, -0.24689865112304688, -0.2353363037109375, -0.22377395629882812, -0.21221160888671875, -0.20064926147460938, -0.1890869140625, -0.17752456665039062, -0.16596221923828125, -0.15439987182617188, -0.1428375244140625, -0.13127517700195312, -0.11971282958984375, -0.10815048217773438, -0.096588134765625, -0.08502578735351562, -0.07346343994140625, -0.061901092529296875, -0.0503387451171875, -0.038776397705078125, -0.02721405029296875, -0.015651702880859375, -0.00408935546875, 0.007472991943359375, 0.01903533935546875, 0.030597686767578125, 0.0421600341796875, 0.053722381591796875, 0.06528472900390625, 0.07684707641601562, 0.088409423828125, 0.09997177124023438, 0.11153411865234375, 0.12309646606445312, 0.1346588134765625, 0.14622116088867188, 0.15778350830078125, 0.16934585571289062, 0.180908203125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 11.0, 28.0, 90.0, 469.0, 313.0, 60.0, 24.0, 10.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07448673248291, -4.60782527923584, -4.1411638259887695, -3.67450213432312, -3.20784068107605, -2.7411792278289795, -2.27451753616333, -1.8078560829162598, -1.3411946296691895, -0.8745331168174744, -0.4078716039657593, 0.058789968490600586, 0.5254514217376709, 0.9921128749847412, 1.4587745666503906, 1.925436019897461, 2.3920974731445312, 2.8587589263916016, 3.325420379638672, 3.7920820713043213, 4.2587432861328125, 4.725404739379883, 5.192066669464111, 5.658728122711182, 6.125389575958252, 6.592051029205322, 7.058712482452393, 7.525374412536621, 7.992035865783691, 8.458697319030762, 8.925358772277832, 9.392020225524902, 9.858682632446289, 10.32534408569336, 10.79200553894043, 11.2586669921875, 11.72532844543457, 12.19198989868164, 12.658651351928711, 13.125312805175781, 13.591974258422852, 14.058635711669922, 14.525297164916992, 14.991958618164062, 15.458620071411133, 15.925281524658203, 16.391942977905273, 16.858604431152344, 17.325267791748047, 17.791929244995117, 18.258590698242188, 18.725252151489258, 19.191913604736328, 19.6585750579834, 20.12523651123047, 20.59189796447754, 21.05855941772461, 21.52522087097168, 21.99188232421875, 22.45854377746582, 22.92520523071289, 23.39186668395996, 23.85852813720703, 24.3251895904541, 24.791851043701172]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 8.0, 4.0, 4.0, 7.0, 11.0, 10.0, 7.0, 9.0, 15.0, 16.0, 16.0, 20.0, 25.0, 34.0, 32.0, 24.0, 37.0, 54.0, 52.0, 39.0, 38.0, 50.0, 43.0, 64.0, 38.0, 42.0, 44.0, 43.0, 31.0, 32.0, 25.0, 25.0, 18.0, 20.0, 13.0, 8.0, 9.0, 9.0, 5.0, 5.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.202214241027832, -5.026708126068115, -4.851202487945557, -4.67569637298584, -4.500190734863281, -4.3246846199035645, -4.149178504943848, -3.973672866821289, -3.7981669902801514, -3.6226611137390137, -3.447155237197876, -3.2716493606567383, -3.0961432456970215, -2.920637607574463, -2.745131492614746, -2.5696256160736084, -2.3941197395324707, -2.218613862991333, -2.0431079864501953, -1.867601990699768, -1.6920961141586304, -1.5165902376174927, -1.3410842418670654, -1.1655783653259277, -0.99007248878479, -0.8145666122436523, -0.6390606760978699, -0.4635547399520874, -0.2880488634109497, -0.11254298686981201, 0.06296300888061523, 0.23846888542175293, 0.41397523880004883, 0.5894811153411865, 0.764987051486969, 0.9404929876327515, 1.1159988641738892, 1.2915047407150269, 1.467010736465454, 1.6425166130065918, 1.8180224895477295, 1.9935283660888672, 2.169034242630005, 2.3445401191711426, 2.5200462341308594, 2.695551872253418, 2.8710579872131348, 3.0465638637542725, 3.22206974029541, 3.397575616836548, 3.5730814933776855, 3.7485876083374023, 3.924093246459961, 4.099599361419678, 4.2751054763793945, 4.450611114501953, 4.626116752624512, 4.8016228675842285, 4.977128505706787, 5.152634620666504, 5.3281402587890625, 5.503646373748779, 5.679152488708496, 5.854658126831055, 6.0301642417907715]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 17.0, 33.0, 32.0, 85.0, 98.0, 184.0, 387.0, 736.0, 1600.0, 3570.0, 10752.0, 53677.0, 3546001.0, 531050.0, 31822.0, 8038.0, 2992.0, 1441.0, 705.0, 390.0, 211.0, 127.0, 96.0, 52.0, 39.0, 26.0, 27.0, 14.0, 11.0, 9.0, 7.0, 10.0, 3.0, 5.0, 6.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.203125, -1.148101806640625, -1.09307861328125, -1.038055419921875, -0.9830322265625, -0.928009033203125, -0.87298583984375, -0.817962646484375, -0.762939453125, -0.707916259765625, -0.65289306640625, -0.597869873046875, -0.5428466796875, -0.487823486328125, -0.43280029296875, -0.377777099609375, -0.32275390625, -0.267730712890625, -0.21270751953125, -0.157684326171875, -0.1026611328125, -0.047637939453125, 0.00738525390625, 0.062408447265625, 0.117431640625, 0.172454833984375, 0.22747802734375, 0.282501220703125, 0.3375244140625, 0.392547607421875, 0.44757080078125, 0.502593994140625, 0.5576171875, 0.612640380859375, 0.66766357421875, 0.722686767578125, 0.7777099609375, 0.832733154296875, 0.88775634765625, 0.942779541015625, 0.997802734375, 1.052825927734375, 1.10784912109375, 1.162872314453125, 1.2178955078125, 1.272918701171875, 1.32794189453125, 1.382965087890625, 1.43798828125, 1.493011474609375, 1.54803466796875, 1.603057861328125, 1.6580810546875, 1.713104248046875, 1.76812744140625, 1.823150634765625, 1.878173828125, 1.933197021484375, 1.98822021484375, 2.043243408203125, 2.0982666015625, 2.153289794921875, 2.20831298828125, 2.263336181640625, 2.318359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 16.0, 20.0, 21.0, 38.0, 36.0, 55.0, 70.0, 68.0, 74.0, 97.0, 87.0, 72.0, 84.0, 59.0, 55.0, 29.0, 37.0, 26.0, 19.0, 16.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23234176635742188, -0.22127532958984375, -0.21020889282226562, -0.1991424560546875, -0.18807601928710938, -0.17700958251953125, -0.16594314575195312, -0.154876708984375, -0.14381027221679688, -0.13274383544921875, -0.12167739868164062, -0.1106109619140625, -0.09954452514648438, -0.08847808837890625, -0.07741165161132812, -0.06634521484375, -0.055278778076171875, -0.04421234130859375, -0.033145904541015625, -0.0220794677734375, -0.011013031005859375, 5.340576171875e-05, 0.011119842529296875, 0.022186279296875, 0.033252716064453125, 0.04431915283203125, 0.055385589599609375, 0.0664520263671875, 0.07751846313476562, 0.08858489990234375, 0.09965133666992188, 0.1107177734375, 0.12178421020507812, 0.13285064697265625, 0.14391708374023438, 0.1549835205078125, 0.16604995727539062, 0.17711639404296875, 0.18818283081054688, 0.199249267578125, 0.21031570434570312, 0.22138214111328125, 0.23244857788085938, 0.2435150146484375, 0.2545814514160156, 0.26564788818359375, 0.2767143249511719, 0.28778076171875, 0.2988471984863281, 0.30991363525390625, 0.3209800720214844, 0.3320465087890625, 0.3431129455566406, 0.35417938232421875, 0.3652458190917969, 0.376312255859375, 0.3873786926269531, 0.39844512939453125, 0.4095115661621094, 0.4205780029296875, 0.4316444396972656, 0.44271087646484375, 0.4537773132324219, 0.46484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 4.0, 11.0, 26.0, 39.0, 57.0, 121.0, 285.0, 1077.0, 5832.0, 454216.0, 3722656.0, 7762.0, 1345.0, 404.0, 178.0, 103.0, 52.0, 42.0, 27.0, 17.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.017578125, -2.906036376953125, -2.79449462890625, -2.682952880859375, -2.5714111328125, -2.459869384765625, -2.34832763671875, -2.236785888671875, -2.125244140625, -2.013702392578125, -1.90216064453125, -1.790618896484375, -1.6790771484375, -1.567535400390625, -1.45599365234375, -1.344451904296875, -1.23291015625, -1.121368408203125, -1.00982666015625, -0.898284912109375, -0.7867431640625, -0.675201416015625, -0.56365966796875, -0.452117919921875, -0.340576171875, -0.229034423828125, -0.11749267578125, -0.005950927734375, 0.1055908203125, 0.217132568359375, 0.32867431640625, 0.440216064453125, 0.5517578125, 0.663299560546875, 0.77484130859375, 0.886383056640625, 0.9979248046875, 1.109466552734375, 1.22100830078125, 1.332550048828125, 1.444091796875, 1.555633544921875, 1.66717529296875, 1.778717041015625, 1.8902587890625, 2.001800537109375, 2.11334228515625, 2.224884033203125, 2.33642578125, 2.447967529296875, 2.55950927734375, 2.671051025390625, 2.7825927734375, 2.894134521484375, 3.00567626953125, 3.117218017578125, 3.228759765625, 3.340301513671875, 3.45184326171875, 3.563385009765625, 3.6749267578125, 3.786468505859375, 3.89801025390625, 4.009552001953125, 4.12109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 11.0, 36.0, 70.0, 335.0, 3085.0, 363.0, 74.0, 37.0, 14.0, 10.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6875, -0.645843505859375, -0.60418701171875, -0.562530517578125, -0.5208740234375, -0.479217529296875, -0.43756103515625, -0.395904541015625, -0.354248046875, -0.312591552734375, -0.27093505859375, -0.229278564453125, -0.1876220703125, -0.145965576171875, -0.10430908203125, -0.062652587890625, -0.02099609375, 0.020660400390625, 0.06231689453125, 0.103973388671875, 0.1456298828125, 0.187286376953125, 0.22894287109375, 0.270599365234375, 0.312255859375, 0.353912353515625, 0.39556884765625, 0.437225341796875, 0.4788818359375, 0.520538330078125, 0.56219482421875, 0.603851318359375, 0.6455078125, 0.687164306640625, 0.72882080078125, 0.770477294921875, 0.8121337890625, 0.853790283203125, 0.89544677734375, 0.937103271484375, 0.978759765625, 1.020416259765625, 1.06207275390625, 1.103729248046875, 1.1453857421875, 1.187042236328125, 1.22869873046875, 1.270355224609375, 1.31201171875, 1.353668212890625, 1.39532470703125, 1.436981201171875, 1.4786376953125, 1.520294189453125, 1.56195068359375, 1.603607177734375, 1.645263671875, 1.686920166015625, 1.72857666015625, 1.770233154296875, 1.8118896484375, 1.853546142578125, 1.89520263671875, 1.936859130859375, 1.978515625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 17.0, 61.0, 459.0, 392.0, 49.0, 13.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302525758743286, -3.0660243034362793, -2.8295230865478516, -2.5930216312408447, -2.356520175933838, -2.12001895904541, -1.8835175037384033, -1.6470160484313965, -1.4105147123336792, -1.174013376235962, -0.9375119209289551, -0.7010105848312378, -0.46450918912887573, -0.22800779342651367, 0.008493542671203613, 0.24499499797821045, 0.48149633407592773, 0.7179977297782898, 0.9544991254806519, 1.1910004615783691, 1.427501916885376, 1.6640032529830933, 1.9005045890808105, 2.1370060443878174, 2.373507499694824, 2.610008955001831, 2.846510171890259, 3.0830116271972656, 3.3195130825042725, 3.5560145378112793, 3.792515754699707, 4.029017448425293, 4.265518665313721, 4.502019882202148, 4.738521575927734, 4.975022792816162, 5.21152400970459, 5.448025703430176, 5.6845269203186035, 5.921028137207031, 6.157529830932617, 6.394031047821045, 6.630532741546631, 6.867033958435059, 7.103535175323486, 7.340036869049072, 7.5765380859375, 7.813039779663086, 8.049540519714355, 8.286042213439941, 8.522542953491211, 8.759044647216797, 8.995546340942383, 9.232047080993652, 9.468548774719238, 9.705050468444824, 9.94155216217041, 10.178053855895996, 10.414554595947266, 10.651056289672852, 10.887557983398438, 11.124058723449707, 11.360560417175293, 11.597062110900879, 11.833562850952148]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 20.0, 20.0, 36.0, 54.0, 69.0, 103.0, 105.0, 119.0, 114.0, 111.0, 72.0, 69.0, 43.0, 20.0, 17.0, 9.0, 4.0, 9.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6013617515563965, -4.462551116943359, -4.323740482330322, -4.184929847717285, -4.046119213104248, -3.907308578491211, -3.768497943878174, -3.6296873092651367, -3.4908766746520996, -3.3520660400390625, -3.2132554054260254, -3.0744447708129883, -2.935634136199951, -2.796823501586914, -2.658012866973877, -2.51920223236084, -2.3803915977478027, -2.2415809631347656, -2.1027703285217285, -1.9639596939086914, -1.8251490592956543, -1.6863384246826172, -1.54752779006958, -1.408717155456543, -1.2699065208435059, -1.1310958862304688, -0.9922852516174316, -0.8534746170043945, -0.7146639823913574, -0.5758533477783203, -0.4370427131652832, -0.2982320785522461, -0.15942096710205078, -0.020610332489013672, 0.11820030212402344, 0.25701093673706055, 0.39582157135009766, 0.5346322059631348, 0.6734428405761719, 0.812253475189209, 0.9510641098022461, 1.0898747444152832, 1.2286853790283203, 1.3674960136413574, 1.5063066482543945, 1.6451172828674316, 1.7839279174804688, 1.9227385520935059, 2.061549186706543, 2.20035982131958, 2.339170455932617, 2.4779810905456543, 2.6167917251586914, 2.7556023597717285, 2.8944129943847656, 3.0332236289978027, 3.17203426361084, 3.310844898223877, 3.449655532836914, 3.588466167449951, 3.7272768020629883, 3.8660874366760254, 4.0048980712890625, 4.1437087059021, 4.282519340515137]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 6.0, 11.0, 16.0, 23.0, 33.0, 29.0, 69.0, 147.0, 186.0, 326.0, 716.0, 1527.0, 4669.0, 21242.0, 164089.0, 738297.0, 96677.0, 14370.0, 3491.0, 1255.0, 588.0, 288.0, 169.0, 101.0, 67.0, 48.0, 24.0, 25.0, 13.0, 13.0, 7.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.3429718017578125, -1.306060791015625, -1.2691497802734375, -1.23223876953125, -1.1953277587890625, -1.158416748046875, -1.1215057373046875, -1.0845947265625, -1.0476837158203125, -1.010772705078125, -0.9738616943359375, -0.93695068359375, -0.9000396728515625, -0.863128662109375, -0.8262176513671875, -0.789306640625, -0.7523956298828125, -0.715484619140625, -0.6785736083984375, -0.64166259765625, -0.6047515869140625, -0.567840576171875, -0.5309295654296875, -0.4940185546875, -0.4571075439453125, -0.420196533203125, -0.3832855224609375, -0.34637451171875, -0.3094635009765625, -0.272552490234375, -0.2356414794921875, -0.19873046875, -0.1618194580078125, -0.124908447265625, -0.0879974365234375, -0.05108642578125, -0.0141754150390625, 0.022735595703125, 0.0596466064453125, 0.0965576171875, 0.1334686279296875, 0.170379638671875, 0.2072906494140625, 0.24420166015625, 0.2811126708984375, 0.318023681640625, 0.3549346923828125, 0.391845703125, 0.4287567138671875, 0.465667724609375, 0.5025787353515625, 0.53948974609375, 0.5764007568359375, 0.613311767578125, 0.6502227783203125, 0.6871337890625, 0.7240447998046875, 0.760955810546875, 0.7978668212890625, 0.83477783203125, 0.8716888427734375, 0.908599853515625, 0.9455108642578125, 0.982421875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 7.0, 15.0, 28.0, 49.0, 53.0, 78.0, 85.0, 104.0, 104.0, 107.0, 81.0, 91.0, 54.0, 51.0, 46.0, 20.0, 11.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.2553863525390625, -0.241729736328125, -0.2280731201171875, -0.21441650390625, -0.2007598876953125, -0.187103271484375, -0.1734466552734375, -0.1597900390625, -0.1461334228515625, -0.132476806640625, -0.1188201904296875, -0.10516357421875, -0.0915069580078125, -0.077850341796875, -0.0641937255859375, -0.050537109375, -0.0368804931640625, -0.023223876953125, -0.0095672607421875, 0.00408935546875, 0.0177459716796875, 0.031402587890625, 0.0450592041015625, 0.0587158203125, 0.0723724365234375, 0.086029052734375, 0.0996856689453125, 0.11334228515625, 0.1269989013671875, 0.140655517578125, 0.1543121337890625, 0.16796875, 0.1816253662109375, 0.195281982421875, 0.2089385986328125, 0.22259521484375, 0.2362518310546875, 0.249908447265625, 0.2635650634765625, 0.2772216796875, 0.2908782958984375, 0.304534912109375, 0.3181915283203125, 0.33184814453125, 0.3455047607421875, 0.359161376953125, 0.3728179931640625, 0.386474609375, 0.4001312255859375, 0.413787841796875, 0.4274444580078125, 0.44110107421875, 0.4547576904296875, 0.468414306640625, 0.4820709228515625, 0.4957275390625, 0.5093841552734375, 0.523040771484375, 0.5366973876953125, 0.55035400390625, 0.5640106201171875, 0.577667236328125, 0.5913238525390625, 0.60498046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 12.0, 15.0, 13.0, 23.0, 39.0, 43.0, 78.0, 92.0, 167.0, 308.0, 578.0, 1303.0, 2723.0, 6785.0, 17111.0, 53224.0, 229626.0, 549186.0, 130186.0, 35697.0, 12325.0, 4807.0, 2063.0, 951.0, 488.0, 275.0, 156.0, 84.0, 60.0, 28.0, 31.0, 18.0, 16.0, 12.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61181640625, -0.59228515625, -0.57275390625, -0.55322265625, -0.53369140625, -0.51416015625, -0.49462890625, -0.47509765625, -0.45556640625, -0.43603515625, -0.41650390625, -0.39697265625, -0.37744140625, -0.35791015625, -0.33837890625, -0.31884765625, -0.29931640625, -0.27978515625, -0.26025390625, -0.24072265625, -0.22119140625, -0.20166015625, -0.18212890625, -0.16259765625, -0.14306640625, -0.12353515625, -0.10400390625, -0.08447265625, -0.06494140625, -0.04541015625, -0.02587890625, -0.00634765625, 0.01318359375, 0.03271484375, 0.05224609375, 0.07177734375, 0.09130859375, 0.11083984375, 0.13037109375, 0.14990234375, 0.16943359375, 0.18896484375, 0.20849609375, 0.22802734375, 0.24755859375, 0.26708984375, 0.28662109375, 0.30615234375, 0.32568359375, 0.34521484375, 0.36474609375, 0.38427734375, 0.40380859375, 0.42333984375, 0.44287109375, 0.46240234375, 0.48193359375, 0.50146484375, 0.52099609375, 0.54052734375, 0.56005859375, 0.57958984375, 0.59912109375, 0.61865234375, 0.63818359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 12.0, 11.0, 14.0, 18.0, 13.0, 16.0, 17.0, 31.0, 29.0, 29.0, 40.0, 42.0, 48.0, 36.0, 37.0, 54.0, 62.0, 50.0, 35.0, 51.0, 47.0, 43.0, 40.0, 29.0, 26.0, 27.0, 23.0, 30.0, 19.0, 13.0, 7.0, 7.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.908203125, -0.8798370361328125, -0.851470947265625, -0.8231048583984375, -0.79473876953125, -0.7663726806640625, -0.738006591796875, -0.7096405029296875, -0.6812744140625, -0.6529083251953125, -0.624542236328125, -0.5961761474609375, -0.56781005859375, -0.5394439697265625, -0.511077880859375, -0.4827117919921875, -0.454345703125, -0.4259796142578125, -0.397613525390625, -0.3692474365234375, -0.34088134765625, -0.3125152587890625, -0.284149169921875, -0.2557830810546875, -0.2274169921875, -0.1990509033203125, -0.170684814453125, -0.1423187255859375, -0.11395263671875, -0.0855865478515625, -0.057220458984375, -0.0288543701171875, -0.00048828125, 0.0278778076171875, 0.056243896484375, 0.0846099853515625, 0.11297607421875, 0.1413421630859375, 0.169708251953125, 0.1980743408203125, 0.2264404296875, 0.2548065185546875, 0.283172607421875, 0.3115386962890625, 0.33990478515625, 0.3682708740234375, 0.396636962890625, 0.4250030517578125, 0.453369140625, 0.4817352294921875, 0.510101318359375, 0.5384674072265625, 0.56683349609375, 0.5951995849609375, 0.623565673828125, 0.6519317626953125, 0.6802978515625, 0.7086639404296875, 0.737030029296875, 0.7653961181640625, 0.79376220703125, 0.8221282958984375, 0.850494384765625, 0.8788604736328125, 0.9072265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 9.0, 14.0, 26.0, 36.0, 54.0, 95.0, 190.0, 367.0, 721.0, 1694.0, 4482.0, 16183.0, 132473.0, 719342.0, 147358.0, 17523.0, 4618.0, 1795.0, 745.0, 338.0, 168.0, 118.0, 62.0, 30.0, 27.0, 16.0, 15.0, 11.0, 8.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.269287109375, -0.26125335693359375, -0.2532196044921875, -0.24518585205078125, -0.237152099609375, -0.22911834716796875, -0.2210845947265625, -0.21305084228515625, -0.20501708984375, -0.19698333740234375, -0.1889495849609375, -0.18091583251953125, -0.172882080078125, -0.16484832763671875, -0.1568145751953125, -0.14878082275390625, -0.1407470703125, -0.13271331787109375, -0.1246795654296875, -0.11664581298828125, -0.108612060546875, -0.10057830810546875, -0.0925445556640625, -0.08451080322265625, -0.07647705078125, -0.06844329833984375, -0.0604095458984375, -0.05237579345703125, -0.044342041015625, -0.03630828857421875, -0.0282745361328125, -0.02024078369140625, -0.01220703125, -0.00417327880859375, 0.0038604736328125, 0.01189422607421875, 0.019927978515625, 0.02796173095703125, 0.0359954833984375, 0.04402923583984375, 0.05206298828125, 0.06009674072265625, 0.0681304931640625, 0.07616424560546875, 0.084197998046875, 0.09223175048828125, 0.1002655029296875, 0.10829925537109375, 0.1163330078125, 0.12436676025390625, 0.1324005126953125, 0.14043426513671875, 0.148468017578125, 0.15650177001953125, 0.1645355224609375, 0.17256927490234375, 0.18060302734375, 0.18863677978515625, 0.1966705322265625, 0.20470428466796875, 0.212738037109375, 0.22077178955078125, 0.2288055419921875, 0.23683929443359375, 0.244873046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 13.0, 23.0, 17.0, 26.0, 34.0, 41.0, 56.0, 65.0, 59.0, 75.0, 80.0, 49.0, 66.0, 69.0, 61.0, 47.0, 44.0, 27.0, 23.0, 20.0, 16.0, 19.0, 12.0, 9.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.09808349609375e-05, -2.036523073911667e-05, -1.9749626517295837e-05, -1.9134022295475006e-05, -1.8518418073654175e-05, -1.7902813851833344e-05, -1.7287209630012512e-05, -1.667160540819168e-05, -1.605600118637085e-05, -1.544039696455002e-05, -1.4824792742729187e-05, -1.4209188520908356e-05, -1.3593584299087524e-05, -1.2977980077266693e-05, -1.2362375855445862e-05, -1.174677163362503e-05, -1.11311674118042e-05, -1.0515563189983368e-05, -9.899958968162537e-06, -9.284354746341705e-06, -8.668750524520874e-06, -8.053146302700043e-06, -7.4375420808792114e-06, -6.82193785905838e-06, -6.206333637237549e-06, -5.5907294154167175e-06, -4.975125193595886e-06, -4.359520971775055e-06, -3.7439167499542236e-06, -3.1283125281333923e-06, -2.512708306312561e-06, -1.8971040844917297e-06, -1.2814998626708984e-06, -6.658956408500671e-07, -5.029141902923584e-08, 5.653128027915955e-07, 1.1809170246124268e-06, 1.796521246433258e-06, 2.4121254682540894e-06, 3.0277296900749207e-06, 3.643333911895752e-06, 4.258938133716583e-06, 4.8745423555374146e-06, 5.490146577358246e-06, 6.105750799179077e-06, 6.7213550209999084e-06, 7.33695924282074e-06, 7.952563464641571e-06, 8.568167686462402e-06, 9.183771908283234e-06, 9.799376130104065e-06, 1.0414980351924896e-05, 1.1030584573745728e-05, 1.1646188795566559e-05, 1.226179301738739e-05, 1.2877397239208221e-05, 1.3493001461029053e-05, 1.4108605682849884e-05, 1.4724209904670715e-05, 1.5339814126491547e-05, 1.5955418348312378e-05, 1.657102257013321e-05, 1.718662679195404e-05, 1.7802231013774872e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 6.0, 6.0, 9.0, 6.0, 12.0, 20.0, 35.0, 47.0, 74.0, 153.0, 299.0, 705.0, 1912.0, 6939.0, 29587.0, 304340.0, 623530.0, 64446.0, 11516.0, 3041.0, 1048.0, 394.0, 179.0, 97.0, 53.0, 32.0, 23.0, 19.0, 15.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.297607421875, -0.28960609436035156, -0.2816047668457031, -0.2736034393310547, -0.26560211181640625, -0.2576007843017578, -0.24959945678710938, -0.24159812927246094, -0.2335968017578125, -0.22559547424316406, -0.21759414672851562, -0.2095928192138672, -0.20159149169921875, -0.1935901641845703, -0.18558883666992188, -0.17758750915527344, -0.169586181640625, -0.16158485412597656, -0.15358352661132812, -0.1455821990966797, -0.13758087158203125, -0.1295795440673828, -0.12157821655273438, -0.11357688903808594, -0.1055755615234375, -0.09757423400878906, -0.08957290649414062, -0.08157157897949219, -0.07357025146484375, -0.06556892395019531, -0.057567596435546875, -0.04956626892089844, -0.04156494140625, -0.03356361389160156, -0.025562286376953125, -0.017560958862304688, -0.00955963134765625, -0.0015583038330078125, 0.006443023681640625, 0.014444351196289062, 0.0224456787109375, 0.030447006225585938, 0.038448333740234375, 0.04644966125488281, 0.05445098876953125, 0.06245231628417969, 0.07045364379882812, 0.07845497131347656, 0.086456298828125, 0.09445762634277344, 0.10245895385742188, 0.11046028137207031, 0.11846160888671875, 0.1264629364013672, 0.13446426391601562, 0.14246559143066406, 0.1504669189453125, 0.15846824645996094, 0.16646957397460938, 0.1744709014892578, 0.18247222900390625, 0.1904735565185547, 0.19847488403320312, 0.20647621154785156, 0.2144775390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 9.0, 13.0, 16.0, 13.0, 16.0, 31.0, 52.0, 61.0, 84.0, 110.0, 138.0, 112.0, 114.0, 57.0, 54.0, 34.0, 18.0, 11.0, 10.0, 8.0, 10.0, 5.0, 7.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2127685546875, -0.20378684997558594, -0.19480514526367188, -0.1858234405517578, -0.17684173583984375, -0.1678600311279297, -0.15887832641601562, -0.14989662170410156, -0.1409149169921875, -0.13193321228027344, -0.12295150756835938, -0.11396980285644531, -0.10498809814453125, -0.09600639343261719, -0.08702468872070312, -0.07804298400878906, -0.069061279296875, -0.06007957458496094, -0.051097869873046875, -0.04211616516113281, -0.03313446044921875, -0.024152755737304688, -0.015171051025390625, -0.0061893463134765625, 0.0027923583984375, 0.011774063110351562, 0.020755767822265625, 0.029737472534179688, 0.03871917724609375, 0.04770088195800781, 0.056682586669921875, 0.06566429138183594, 0.07464599609375, 0.08362770080566406, 0.09260940551757812, 0.10159111022949219, 0.11057281494140625, 0.11955451965332031, 0.12853622436523438, 0.13751792907714844, 0.1464996337890625, 0.15548133850097656, 0.16446304321289062, 0.1734447479248047, 0.18242645263671875, 0.1914081573486328, 0.20038986206054688, 0.20937156677246094, 0.218353271484375, 0.22733497619628906, 0.23631668090820312, 0.2452983856201172, 0.25428009033203125, 0.2632617950439453, 0.2722434997558594, 0.28122520446777344, 0.2902069091796875, 0.29918861389160156, 0.3081703186035156, 0.3171520233154297, 0.32613372802734375, 0.3351154327392578, 0.3440971374511719, 0.35307884216308594, 0.362060546875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 10.0, 35.0, 78.0, 296.0, 408.0, 120.0, 41.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.297154426574707, -6.937311172485352, -6.577467918395996, -6.217624664306641, -5.857781410217285, -5.49793815612793, -5.138094902038574, -4.778251647949219, -4.418408393859863, -4.058565139770508, -3.6987218856811523, -3.338878631591797, -2.9790353775024414, -2.619192123413086, -2.2593491077423096, -1.899505853652954, -1.5396628379821777, -1.1798195838928223, -0.8199763894081116, -0.4601331949234009, -0.10028994083404541, 0.25955331325531006, 0.619396448135376, 0.9792397022247314, 1.339082956314087, 1.6989262104034424, 2.058769464492798, 2.418612480163574, 2.7784557342529297, 3.138298988342285, 3.4981422424316406, 3.857985496520996, 4.217828750610352, 4.577672004699707, 4.9375152587890625, 5.297358512878418, 5.657201766967773, 6.017045021057129, 6.376888275146484, 6.73673152923584, 7.096574783325195, 7.456418037414551, 7.816261291503906, 8.176104545593262, 8.535947799682617, 8.895791053771973, 9.255634307861328, 9.615477561950684, 9.975320816040039, 10.335164070129395, 10.69500732421875, 11.054850578308105, 11.414693832397461, 11.774537086486816, 12.134380340576172, 12.494223594665527, 12.854065895080566, 13.213909149169922, 13.573752403259277, 13.933595657348633, 14.293438911437988, 14.653282165527344, 15.0131254196167, 15.372968673706055, 15.73281192779541]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 10.0, 10.0, 7.0, 11.0, 15.0, 16.0, 22.0, 24.0, 39.0, 43.0, 62.0, 54.0, 44.0, 58.0, 55.0, 60.0, 41.0, 57.0, 48.0, 36.0, 42.0, 37.0, 30.0, 29.0, 31.0, 27.0, 16.0, 19.0, 15.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38321590423584, -5.181885719299316, -4.980555534362793, -4.779224872589111, -4.577894687652588, -4.3765645027160645, -4.175233840942383, -3.9739036560058594, -3.772573471069336, -3.5712432861328125, -3.36991286277771, -3.1685824394226074, -2.967252254486084, -2.7659220695495605, -2.564591646194458, -2.3632612228393555, -2.161931037902832, -1.960600733757019, -1.759270429611206, -1.557940125465393, -1.35660982131958, -1.155279517173767, -0.9539492130279541, -0.7526189088821411, -0.5512886047363281, -0.34995830059051514, -0.14862799644470215, 0.05270230770111084, 0.25403261184692383, 0.4553629159927368, 0.6566932201385498, 0.8580235242843628, 1.059354305267334, 1.260684609413147, 1.46201491355896, 1.663345217704773, 1.864675521850586, 2.0660057067871094, 2.267336130142212, 2.4686665534973145, 2.669996738433838, 2.8713269233703613, 3.072657346725464, 3.2739877700805664, 3.47531795501709, 3.6766481399536133, 3.877978563308716, 4.079308986663818, 4.280639171600342, 4.481969356536865, 4.683300018310547, 4.88463020324707, 5.085960388183594, 5.287290573120117, 5.488620758056641, 5.689951419830322, 5.891281604766846, 6.092611789703369, 6.293942451477051, 6.495272636413574, 6.696602821350098, 6.897933006286621, 7.0992631912231445, 7.300593852996826, 7.50192403793335]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 5.0, 9.0, 19.0, 22.0, 52.0, 98.0, 232.0, 480.0, 964.0, 2728.0, 10347.0, 66175.0, 3806763.0, 274725.0, 22894.0, 5197.0, 1727.0, 805.0, 407.0, 218.0, 135.0, 75.0, 52.0, 31.0, 26.0, 21.0, 15.0, 12.0, 11.0, 8.0, 4.0, 6.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5785064697265625, -0.547637939453125, -0.5167694091796875, -0.48590087890625, -0.4550323486328125, -0.424163818359375, -0.3932952880859375, -0.3624267578125, -0.3315582275390625, -0.300689697265625, -0.2698211669921875, -0.23895263671875, -0.2080841064453125, -0.177215576171875, -0.1463470458984375, -0.115478515625, -0.0846099853515625, -0.053741455078125, -0.0228729248046875, 0.00799560546875, 0.0388641357421875, 0.069732666015625, 0.1006011962890625, 0.1314697265625, 0.1623382568359375, 0.193206787109375, 0.2240753173828125, 0.25494384765625, 0.2858123779296875, 0.316680908203125, 0.3475494384765625, 0.37841796875, 0.4092864990234375, 0.440155029296875, 0.4710235595703125, 0.50189208984375, 0.5327606201171875, 0.563629150390625, 0.5944976806640625, 0.6253662109375, 0.6562347412109375, 0.687103271484375, 0.7179718017578125, 0.74884033203125, 0.7797088623046875, 0.810577392578125, 0.8414459228515625, 0.872314453125, 0.9031829833984375, 0.934051513671875, 0.9649200439453125, 0.99578857421875, 1.0266571044921875, 1.057525634765625, 1.0883941650390625, 1.1192626953125, 1.1501312255859375, 1.180999755859375, 1.2118682861328125, 1.24273681640625, 1.2736053466796875, 1.304473876953125, 1.3353424072265625, 1.3662109375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 6.0, 17.0, 36.0, 37.0, 53.0, 77.0, 100.0, 97.0, 89.0, 86.0, 82.0, 82.0, 72.0, 56.0, 44.0, 21.0, 15.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281005859375, -0.2669181823730469, -0.25283050537109375, -0.23874282836914062, -0.2246551513671875, -0.21056747436523438, -0.19647979736328125, -0.18239212036132812, -0.168304443359375, -0.15421676635742188, -0.14012908935546875, -0.12604141235351562, -0.1119537353515625, -0.09786605834960938, -0.08377838134765625, -0.06969070434570312, -0.05560302734375, -0.041515350341796875, -0.02742767333984375, -0.013339996337890625, 0.0007476806640625, 0.014835357666015625, 0.02892303466796875, 0.043010711669921875, 0.057098388671875, 0.07118606567382812, 0.08527374267578125, 0.09936141967773438, 0.1134490966796875, 0.12753677368164062, 0.14162445068359375, 0.15571212768554688, 0.1697998046875, 0.18388748168945312, 0.19797515869140625, 0.21206283569335938, 0.2261505126953125, 0.24023818969726562, 0.25432586669921875, 0.2684135437011719, 0.282501220703125, 0.2965888977050781, 0.31067657470703125, 0.3247642517089844, 0.3388519287109375, 0.3529396057128906, 0.36702728271484375, 0.3811149597167969, 0.39520263671875, 0.4092903137207031, 0.42337799072265625, 0.4374656677246094, 0.4515533447265625, 0.4656410217285156, 0.47972869873046875, 0.4938163757324219, 0.507904052734375, 0.5219917297363281, 0.5360794067382812, 0.5501670837402344, 0.5642547607421875, 0.5783424377441406, 0.5924301147460938, 0.6065177917480469, 0.62060546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 7.0, 6.0, 15.0, 30.0, 67.0, 71.0, 121.0, 292.0, 477.0, 1133.0, 3652.0, 26335.0, 3976993.0, 173430.0, 8557.0, 1729.0, 643.0, 296.0, 182.0, 95.0, 51.0, 34.0, 25.0, 16.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.9912109375, -0.951171875, -0.9111328125, -0.87109375, -0.8310546875, -0.791015625, -0.7509765625, -0.7109375, -0.6708984375, -0.630859375, -0.5908203125, -0.55078125, -0.5107421875, -0.470703125, -0.4306640625, -0.390625, -0.3505859375, -0.310546875, -0.2705078125, -0.23046875, -0.1904296875, -0.150390625, -0.1103515625, -0.0703125, -0.0302734375, 0.009765625, 0.0498046875, 0.08984375, 0.1298828125, 0.169921875, 0.2099609375, 0.25, 0.2900390625, 0.330078125, 0.3701171875, 0.41015625, 0.4501953125, 0.490234375, 0.5302734375, 0.5703125, 0.6103515625, 0.650390625, 0.6904296875, 0.73046875, 0.7705078125, 0.810546875, 0.8505859375, 0.890625, 0.9306640625, 0.970703125, 1.0107421875, 1.05078125, 1.0908203125, 1.130859375, 1.1708984375, 1.2109375, 1.2509765625, 1.291015625, 1.3310546875, 1.37109375, 1.4111328125, 1.451171875, 1.4912109375, 1.53125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 11.0, 20.0, 33.0, 54.0, 168.0, 885.0, 2542.0, 197.0, 70.0, 39.0, 13.0, 15.0, 11.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6300468444824219, -0.6126327514648438, -0.5952186584472656, -0.5778045654296875, -0.5603904724121094, -0.5429763793945312, -0.5255622863769531, -0.508148193359375, -0.4907341003417969, -0.47332000732421875, -0.4559059143066406, -0.4384918212890625, -0.4210777282714844, -0.40366363525390625, -0.3862495422363281, -0.36883544921875, -0.3514213562011719, -0.33400726318359375, -0.3165931701660156, -0.2991790771484375, -0.2817649841308594, -0.26435089111328125, -0.24693679809570312, -0.229522705078125, -0.21210861206054688, -0.19469451904296875, -0.17728042602539062, -0.1598663330078125, -0.14245223999023438, -0.12503814697265625, -0.10762405395507812, -0.0902099609375, -0.07279586791992188, -0.05538177490234375, -0.037967681884765625, -0.0205535888671875, -0.003139495849609375, 0.01427459716796875, 0.031688690185546875, 0.049102783203125, 0.06651687622070312, 0.08393096923828125, 0.10134506225585938, 0.1187591552734375, 0.13617324829101562, 0.15358734130859375, 0.17100143432617188, 0.18841552734375, 0.20582962036132812, 0.22324371337890625, 0.24065780639648438, 0.2580718994140625, 0.2754859924316406, 0.29290008544921875, 0.3103141784667969, 0.327728271484375, 0.3451423645019531, 0.36255645751953125, 0.3799705505371094, 0.3973846435546875, 0.4147987365722656, 0.43221282958984375, 0.4496269226074219, 0.467041015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 10.0, 14.0, 47.0, 183.0, 462.0, 211.0, 52.0, 8.0, 11.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.306103229522705, -4.197890281677246, -4.089677810668945, -3.9814648628234863, -3.8732519149780273, -3.7650389671325684, -3.6568262577056885, -3.5486135482788086, -3.4404006004333496, -3.3321876525878906, -3.2239749431610107, -3.115762233734131, -3.007549285888672, -2.899336338043213, -2.791123628616333, -2.682910919189453, -2.574697971343994, -2.466485023498535, -2.3582723140716553, -2.2500596046447754, -2.1418466567993164, -2.0336337089538574, -1.9254209995269775, -1.817208170890808, -1.7089953422546387, -1.6007825136184692, -1.4925696849822998, -1.3843568563461304, -1.276144027709961, -1.1679311990737915, -1.059718370437622, -0.9515055418014526, -0.8432927131652832, -0.7350798845291138, -0.6268670558929443, -0.5186542272567749, -0.41044139862060547, -0.30222856998443604, -0.1940157413482666, -0.08580291271209717, 0.022409915924072266, 0.1306227445602417, 0.23883557319641113, 0.34704840183258057, 0.45526123046875, 0.5634740591049194, 0.6716868877410889, 0.7798997163772583, 0.8881125450134277, 0.9963253736495972, 1.1045382022857666, 1.212751030921936, 1.3209638595581055, 1.429176688194275, 1.5373895168304443, 1.6456023454666138, 1.7538151741027832, 1.8620280027389526, 1.970240831375122, 2.078453540802002, 2.186666488647461, 2.29487943649292, 2.4030921459198, 2.5113048553466797, 2.6195178031921387]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 5.0, 9.0, 8.0, 19.0, 24.0, 26.0, 38.0, 48.0, 39.0, 59.0, 71.0, 63.0, 69.0, 64.0, 87.0, 70.0, 81.0, 56.0, 46.0, 35.0, 18.0, 16.0, 13.0, 12.0, 8.0, 2.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.142932176589966, -2.086277723312378, -2.029623508453369, -1.9729690551757812, -1.9163146018981934, -1.859660267829895, -1.8030059337615967, -1.7463514804840088, -1.689697027206421, -1.6330426931381226, -1.5763882398605347, -1.5197339057922363, -1.4630794525146484, -1.40642511844635, -1.3497707843780518, -1.2931163311004639, -1.2364619970321655, -1.1798076629638672, -1.1231532096862793, -1.066498875617981, -1.009844422340393, -0.9531900882720947, -0.8965356945991516, -0.8398813009262085, -0.7832269072532654, -0.7265725135803223, -0.6699181199073792, -0.613263726234436, -0.5566093921661377, -0.4999549686908722, -0.44330060482025146, -0.38664621114730835, -0.3299916982650757, -0.27333730459213257, -0.21668292582035065, -0.16002854704856873, -0.10337415337562561, -0.046719759702682495, 0.009934604167938232, 0.06658899784088135, 0.12324339151382446, 0.17989778518676758, 0.2365521639585495, 0.2932065427303314, 0.34986093640327454, 0.40651533007621765, 0.4631696939468384, 0.5198240876197815, 0.5764784812927246, 0.6331328749656677, 0.6897872686386108, 0.7464416027069092, 0.8030960559844971, 0.8597503900527954, 0.9164047837257385, 0.9730591773986816, 1.0297136306762695, 1.0863679647445679, 1.1430224180221558, 1.199676752090454, 1.256331205368042, 1.3129855394363403, 1.3696398735046387, 1.4262943267822266, 1.482948660850525]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 8.0, 17.0, 13.0, 29.0, 33.0, 53.0, 101.0, 170.0, 344.0, 711.0, 1672.0, 5034.0, 20558.0, 115693.0, 658715.0, 202439.0, 31665.0, 7248.0, 2261.0, 896.0, 388.0, 191.0, 94.0, 72.0, 45.0, 28.0, 25.0, 15.0, 11.0, 8.0, 8.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97607421875, -0.9461669921875, -0.916259765625, -0.8863525390625, -0.8564453125, -0.8265380859375, -0.796630859375, -0.7667236328125, -0.73681640625, -0.7069091796875, -0.677001953125, -0.6470947265625, -0.6171875, -0.5872802734375, -0.557373046875, -0.5274658203125, -0.49755859375, -0.4676513671875, -0.437744140625, -0.4078369140625, -0.3779296875, -0.3480224609375, -0.318115234375, -0.2882080078125, -0.25830078125, -0.2283935546875, -0.198486328125, -0.1685791015625, -0.138671875, -0.1087646484375, -0.078857421875, -0.0489501953125, -0.01904296875, 0.0108642578125, 0.040771484375, 0.0706787109375, 0.1005859375, 0.1304931640625, 0.160400390625, 0.1903076171875, 0.22021484375, 0.2501220703125, 0.280029296875, 0.3099365234375, 0.33984375, 0.3697509765625, 0.399658203125, 0.4295654296875, 0.45947265625, 0.4893798828125, 0.519287109375, 0.5491943359375, 0.5791015625, 0.6090087890625, 0.638916015625, 0.6688232421875, 0.69873046875, 0.7286376953125, 0.758544921875, 0.7884521484375, 0.818359375, 0.8482666015625, 0.878173828125, 0.9080810546875, 0.93798828125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 1.0, 5.0, 5.0, 14.0, 16.0, 32.0, 53.0, 61.0, 75.0, 78.0, 93.0, 85.0, 94.0, 67.0, 83.0, 65.0, 56.0, 38.0, 38.0, 10.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.29150390625, -0.2787628173828125, -0.266021728515625, -0.2532806396484375, -0.24053955078125, -0.2277984619140625, -0.215057373046875, -0.2023162841796875, -0.1895751953125, -0.1768341064453125, -0.164093017578125, -0.1513519287109375, -0.13861083984375, -0.1258697509765625, -0.113128662109375, -0.1003875732421875, -0.087646484375, -0.0749053955078125, -0.062164306640625, -0.0494232177734375, -0.03668212890625, -0.0239410400390625, -0.011199951171875, 0.0015411376953125, 0.0142822265625, 0.0270233154296875, 0.039764404296875, 0.0525054931640625, 0.06524658203125, 0.0779876708984375, 0.090728759765625, 0.1034698486328125, 0.1162109375, 0.1289520263671875, 0.141693115234375, 0.1544342041015625, 0.16717529296875, 0.1799163818359375, 0.192657470703125, 0.2053985595703125, 0.2181396484375, 0.2308807373046875, 0.243621826171875, 0.2563629150390625, 0.26910400390625, 0.2818450927734375, 0.294586181640625, 0.3073272705078125, 0.320068359375, 0.3328094482421875, 0.345550537109375, 0.3582916259765625, 0.37103271484375, 0.3837738037109375, 0.396514892578125, 0.4092559814453125, 0.4219970703125, 0.4347381591796875, 0.447479248046875, 0.4602203369140625, 0.47296142578125, 0.4857025146484375, 0.498443603515625, 0.5111846923828125, 0.52392578125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 11.0, 7.0, 15.0, 14.0, 18.0, 40.0, 31.0, 56.0, 89.0, 114.0, 198.0, 307.0, 611.0, 1154.0, 2209.0, 4683.0, 10624.0, 25327.0, 67825.0, 234110.0, 468840.0, 149476.0, 48374.0, 18639.0, 8089.0, 3681.0, 1782.0, 899.0, 513.0, 304.0, 179.0, 94.0, 82.0, 34.0, 29.0, 33.0, 19.0, 14.0, 7.0, 8.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.51953125, -0.5034637451171875, -0.487396240234375, -0.4713287353515625, -0.45526123046875, -0.4391937255859375, -0.423126220703125, -0.4070587158203125, -0.3909912109375, -0.3749237060546875, -0.358856201171875, -0.3427886962890625, -0.32672119140625, -0.3106536865234375, -0.294586181640625, -0.2785186767578125, -0.262451171875, -0.2463836669921875, -0.230316162109375, -0.2142486572265625, -0.19818115234375, -0.1821136474609375, -0.166046142578125, -0.1499786376953125, -0.1339111328125, -0.1178436279296875, -0.101776123046875, -0.0857086181640625, -0.06964111328125, -0.0535736083984375, -0.037506103515625, -0.0214385986328125, -0.00537109375, 0.0106964111328125, 0.026763916015625, 0.0428314208984375, 0.05889892578125, 0.0749664306640625, 0.091033935546875, 0.1071014404296875, 0.1231689453125, 0.1392364501953125, 0.155303955078125, 0.1713714599609375, 0.18743896484375, 0.2035064697265625, 0.219573974609375, 0.2356414794921875, 0.251708984375, 0.2677764892578125, 0.283843994140625, 0.2999114990234375, 0.31597900390625, 0.3320465087890625, 0.348114013671875, 0.3641815185546875, 0.3802490234375, 0.3963165283203125, 0.412384033203125, 0.4284515380859375, 0.44451904296875, 0.4605865478515625, 0.476654052734375, 0.4927215576171875, 0.5087890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 17.0, 10.0, 16.0, 16.0, 24.0, 22.0, 29.0, 32.0, 31.0, 40.0, 44.0, 40.0, 37.0, 49.0, 53.0, 53.0, 49.0, 39.0, 45.0, 39.0, 39.0, 45.0, 50.0, 31.0, 19.0, 22.0, 22.0, 15.0, 10.0, 10.0, 8.0, 13.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8682098388671875, -0.837982177734375, -0.8077545166015625, -0.77752685546875, -0.7472991943359375, -0.717071533203125, -0.6868438720703125, -0.6566162109375, -0.6263885498046875, -0.596160888671875, -0.5659332275390625, -0.53570556640625, -0.5054779052734375, -0.475250244140625, -0.4450225830078125, -0.414794921875, -0.3845672607421875, -0.354339599609375, -0.3241119384765625, -0.29388427734375, -0.2636566162109375, -0.233428955078125, -0.2032012939453125, -0.1729736328125, -0.1427459716796875, -0.112518310546875, -0.0822906494140625, -0.05206298828125, -0.0218353271484375, 0.008392333984375, 0.0386199951171875, 0.06884765625, 0.0990753173828125, 0.129302978515625, 0.1595306396484375, 0.18975830078125, 0.2199859619140625, 0.250213623046875, 0.2804412841796875, 0.3106689453125, 0.3408966064453125, 0.371124267578125, 0.4013519287109375, 0.43157958984375, 0.4618072509765625, 0.492034912109375, 0.5222625732421875, 0.552490234375, 0.5827178955078125, 0.612945556640625, 0.6431732177734375, 0.67340087890625, 0.7036285400390625, 0.733856201171875, 0.7640838623046875, 0.7943115234375, 0.8245391845703125, 0.854766845703125, 0.8849945068359375, 0.91522216796875, 0.9454498291015625, 0.975677490234375, 1.0059051513671875, 1.0361328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 7.0, 5.0, 5.0, 12.0, 11.0, 18.0, 42.0, 55.0, 84.0, 174.0, 310.0, 685.0, 1597.0, 6101.0, 48491.0, 640127.0, 324004.0, 20862.0, 3699.0, 1202.0, 506.0, 216.0, 128.0, 70.0, 44.0, 32.0, 28.0, 10.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.2579536437988281, -0.24930572509765625, -0.24065780639648438, -0.2320098876953125, -0.22336196899414062, -0.21471405029296875, -0.20606613159179688, -0.197418212890625, -0.18877029418945312, -0.18012237548828125, -0.17147445678710938, -0.1628265380859375, -0.15417861938476562, -0.14553070068359375, -0.13688278198242188, -0.12823486328125, -0.11958694458007812, -0.11093902587890625, -0.10229110717773438, -0.0936431884765625, -0.08499526977539062, -0.07634735107421875, -0.06769943237304688, -0.059051513671875, -0.050403594970703125, -0.04175567626953125, -0.033107757568359375, -0.0244598388671875, -0.015811920166015625, -0.00716400146484375, 0.001483917236328125, 0.0101318359375, 0.018779754638671875, 0.02742767333984375, 0.036075592041015625, 0.0447235107421875, 0.053371429443359375, 0.06201934814453125, 0.07066726684570312, 0.079315185546875, 0.08796310424804688, 0.09661102294921875, 0.10525894165039062, 0.1139068603515625, 0.12255477905273438, 0.13120269775390625, 0.13985061645507812, 0.14849853515625, 0.15714645385742188, 0.16579437255859375, 0.17444229125976562, 0.1830902099609375, 0.19173812866210938, 0.20038604736328125, 0.20903396606445312, 0.217681884765625, 0.22632980346679688, 0.23497772216796875, 0.24362564086914062, 0.2522735595703125, 0.2609214782714844, 0.26956939697265625, 0.2782173156738281, 0.286865234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 8.0, 13.0, 17.0, 19.0, 27.0, 34.0, 49.0, 50.0, 69.0, 86.0, 84.0, 76.0, 84.0, 85.0, 64.0, 53.0, 38.0, 30.0, 34.0, 21.0, 12.0, 11.0, 12.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7821788787841797e-05, -1.706741750240326e-05, -1.631304621696472e-05, -1.5558674931526184e-05, -1.4804303646087646e-05, -1.4049932360649109e-05, -1.3295561075210571e-05, -1.2541189789772034e-05, -1.1786818504333496e-05, -1.1032447218894958e-05, -1.0278075933456421e-05, -9.523704648017883e-06, -8.769333362579346e-06, -8.014962077140808e-06, -7.2605907917022705e-06, -6.506219506263733e-06, -5.751848220825195e-06, -4.997476935386658e-06, -4.24310564994812e-06, -3.4887343645095825e-06, -2.734363079071045e-06, -1.9799917936325073e-06, -1.2256205081939697e-06, -4.7124922275543213e-07, 2.8312206268310547e-07, 1.037493348121643e-06, 1.7918646335601807e-06, 2.5462359189987183e-06, 3.300607204437256e-06, 4.0549784898757935e-06, 4.809349775314331e-06, 5.563721060752869e-06, 6.318092346191406e-06, 7.072463631629944e-06, 7.826834917068481e-06, 8.581206202507019e-06, 9.335577487945557e-06, 1.0089948773384094e-05, 1.0844320058822632e-05, 1.159869134426117e-05, 1.2353062629699707e-05, 1.3107433915138245e-05, 1.3861805200576782e-05, 1.461617648601532e-05, 1.5370547771453857e-05, 1.6124919056892395e-05, 1.6879290342330933e-05, 1.763366162776947e-05, 1.8388032913208008e-05, 1.9142404198646545e-05, 1.9896775484085083e-05, 2.065114676952362e-05, 2.1405518054962158e-05, 2.2159889340400696e-05, 2.2914260625839233e-05, 2.366863191127777e-05, 2.442300319671631e-05, 2.5177374482154846e-05, 2.5931745767593384e-05, 2.668611705303192e-05, 2.744048833847046e-05, 2.8194859623908997e-05, 2.8949230909347534e-05, 2.9703602194786072e-05, 3.045797348022461e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 11.0, 16.0, 28.0, 33.0, 85.0, 192.0, 385.0, 815.0, 2608.0, 12058.0, 132429.0, 744042.0, 139152.0, 12499.0, 2545.0, 872.0, 386.0, 184.0, 91.0, 50.0, 22.0, 21.0, 10.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.230224609375, -0.22214889526367188, -0.21407318115234375, -0.20599746704101562, -0.1979217529296875, -0.18984603881835938, -0.18177032470703125, -0.17369461059570312, -0.165618896484375, -0.15754318237304688, -0.14946746826171875, -0.14139175415039062, -0.1333160400390625, -0.12524032592773438, -0.11716461181640625, -0.10908889770507812, -0.10101318359375, -0.09293746948242188, -0.08486175537109375, -0.07678604125976562, -0.0687103271484375, -0.060634613037109375, -0.05255889892578125, -0.044483184814453125, -0.036407470703125, -0.028331756591796875, -0.02025604248046875, -0.012180328369140625, -0.0041046142578125, 0.003971099853515625, 0.01204681396484375, 0.020122528076171875, 0.0281982421875, 0.036273956298828125, 0.04434967041015625, 0.052425384521484375, 0.0605010986328125, 0.06857681274414062, 0.07665252685546875, 0.08472824096679688, 0.092803955078125, 0.10087966918945312, 0.10895538330078125, 0.11703109741210938, 0.1251068115234375, 0.13318252563476562, 0.14125823974609375, 0.14933395385742188, 0.15740966796875, 0.16548538208007812, 0.17356109619140625, 0.18163681030273438, 0.1897125244140625, 0.19778823852539062, 0.20586395263671875, 0.21393966674804688, 0.222015380859375, 0.23009109497070312, 0.23816680908203125, 0.24624252319335938, 0.2543182373046875, 0.2623939514160156, 0.27046966552734375, 0.2785453796386719, 0.28662109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 11.0, 11.0, 21.0, 20.0, 41.0, 48.0, 77.0, 113.0, 136.0, 115.0, 129.0, 86.0, 74.0, 32.0, 35.0, 18.0, 9.0, 6.0, 8.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2880859375, -0.27854156494140625, -0.2689971923828125, -0.25945281982421875, -0.249908447265625, -0.24036407470703125, -0.2308197021484375, -0.22127532958984375, -0.21173095703125, -0.20218658447265625, -0.1926422119140625, -0.18309783935546875, -0.173553466796875, -0.16400909423828125, -0.1544647216796875, -0.14492034912109375, -0.1353759765625, -0.12583160400390625, -0.1162872314453125, -0.10674285888671875, -0.097198486328125, -0.08765411376953125, -0.0781097412109375, -0.06856536865234375, -0.05902099609375, -0.04947662353515625, -0.0399322509765625, -0.03038787841796875, -0.020843505859375, -0.01129913330078125, -0.0017547607421875, 0.00778961181640625, 0.017333984375, 0.02687835693359375, 0.0364227294921875, 0.04596710205078125, 0.055511474609375, 0.06505584716796875, 0.0746002197265625, 0.08414459228515625, 0.09368896484375, 0.10323333740234375, 0.1127777099609375, 0.12232208251953125, 0.131866455078125, 0.14141082763671875, 0.1509552001953125, 0.16049957275390625, 0.1700439453125, 0.17958831787109375, 0.1891326904296875, 0.19867706298828125, 0.208221435546875, 0.21776580810546875, 0.2273101806640625, 0.23685455322265625, 0.24639892578125, 0.25594329833984375, 0.2654876708984375, 0.27503204345703125, 0.284576416015625, 0.29412078857421875, 0.3036651611328125, 0.31320953369140625, 0.32275390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 9.0, 31.0, 186.0, 623.0, 137.0, 19.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.887975692749023, -12.259434700012207, -11.63089370727539, -11.002352714538574, -10.373811721801758, -9.745270729064941, -9.116729736328125, -8.488187789916992, -7.859647274017334, -7.231106281280518, -6.602565288543701, -5.974023818969727, -5.34548282623291, -4.716941833496094, -4.088400840759277, -3.459859848022461, -2.8313188552856445, -2.202777862548828, -1.5742367506027222, -0.9456956386566162, -0.3171546459197998, 0.3113863468170166, 0.9399275779724121, 1.5684685707092285, 2.197009563446045, 2.8255505561828613, 3.4540915489196777, 4.082633018493652, 4.711174011230469, 5.339715003967285, 5.968255996704102, 6.596796989440918, 7.225337982177734, 7.853878974914551, 8.482419967651367, 9.110960960388184, 9.739501953125, 10.368042945861816, 10.996583938598633, 11.625125885009766, 12.253665924072266, 12.882206916809082, 13.510747909545898, 14.139288902282715, 14.767829895019531, 15.396370887756348, 16.024911880493164, 16.653453826904297, 17.281993865966797, 17.91053581237793, 18.53907585144043, 19.167617797851562, 19.796157836914062, 20.424699783325195, 21.053239822387695, 21.681781768798828, 22.31032371520996, 22.938865661621094, 23.567405700683594, 24.195947647094727, 24.824487686157227, 25.45302963256836, 26.08156967163086, 26.710111618041992, 27.338651657104492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 0.0, 7.0, 8.0, 9.0, 10.0, 16.0, 12.0, 22.0, 20.0, 16.0, 28.0, 32.0, 23.0, 30.0, 36.0, 41.0, 49.0, 45.0, 44.0, 42.0, 52.0, 46.0, 44.0, 41.0, 36.0, 36.0, 35.0, 26.0, 37.0, 34.0, 17.0, 20.0, 7.0, 15.0, 15.0, 11.0, 13.0, 6.0, 5.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.777278900146484, -5.60857629776001, -5.439873218536377, -5.271170616149902, -5.102468013763428, -4.933765411376953, -4.76506233215332, -4.596359729766846, -4.427657127380371, -4.2589545249938965, -4.090251445770264, -3.921548843383789, -3.7528462409973145, -3.5841434001922607, -3.415440559387207, -3.2467379570007324, -3.0780351161956787, -2.909332275390625, -2.7406296730041504, -2.5719268321990967, -2.403224229812622, -2.2345213890075684, -2.0658187866210938, -1.89711594581604, -1.7284132242202759, -1.5597105026245117, -1.3910077810287476, -1.2223050594329834, -1.0536022186279297, -0.8848995566368103, -0.7161967754364014, -0.5474940538406372, -0.37879133224487305, -0.2100885957479477, -0.04138585925102234, 0.1273168921470642, 0.29601961374282837, 0.46472233533859253, 0.6334251165390015, 0.8021278381347656, 0.9708305597305298, 1.139533281326294, 1.308236002922058, 1.4769387245178223, 1.645641565322876, 1.8143441677093506, 1.9830470085144043, 2.151749610900879, 2.3204524517059326, 2.4891552925109863, 2.657857894897461, 2.8265607357025146, 2.9952633380889893, 3.163966178894043, 3.3326687812805176, 3.5013716220855713, 3.670074462890625, 3.8387773036956787, 4.007480144500732, 4.176182746887207, 4.344885349273682, 4.513587951660156, 4.682291030883789, 4.850993633270264, 5.019696235656738]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 11.0, 18.0, 26.0, 45.0, 63.0, 113.0, 201.0, 433.0, 928.0, 2409.0, 9800.0, 109979.0, 4005229.0, 53696.0, 7349.0, 2141.0, 829.0, 411.0, 218.0, 140.0, 89.0, 43.0, 31.0, 11.0, 20.0, 13.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23828125, -1.18951416015625, -1.1407470703125, -1.09197998046875, -1.043212890625, -0.99444580078125, -0.9456787109375, -0.89691162109375, -0.84814453125, -0.79937744140625, -0.7506103515625, -0.70184326171875, -0.653076171875, -0.60430908203125, -0.5555419921875, -0.50677490234375, -0.4580078125, -0.40924072265625, -0.3604736328125, -0.31170654296875, -0.262939453125, -0.21417236328125, -0.1654052734375, -0.11663818359375, -0.06787109375, -0.01910400390625, 0.0296630859375, 0.07843017578125, 0.127197265625, 0.17596435546875, 0.2247314453125, 0.27349853515625, 0.322265625, 0.37103271484375, 0.4197998046875, 0.46856689453125, 0.517333984375, 0.56610107421875, 0.6148681640625, 0.66363525390625, 0.71240234375, 0.76116943359375, 0.8099365234375, 0.85870361328125, 0.907470703125, 0.95623779296875, 1.0050048828125, 1.05377197265625, 1.1025390625, 1.15130615234375, 1.2000732421875, 1.24884033203125, 1.297607421875, 1.34637451171875, 1.3951416015625, 1.44390869140625, 1.49267578125, 1.54144287109375, 1.5902099609375, 1.63897705078125, 1.687744140625, 1.73651123046875, 1.7852783203125, 1.83404541015625, 1.8828125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 6.0, 11.0, 20.0, 25.0, 28.0, 38.0, 54.0, 61.0, 52.0, 65.0, 70.0, 70.0, 68.0, 63.0, 60.0, 65.0, 59.0, 36.0, 36.0, 25.0, 21.0, 19.0, 9.0, 11.0, 9.0, 2.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30078125, -0.2887229919433594, -0.27666473388671875, -0.2646064758300781, -0.2525482177734375, -0.24048995971679688, -0.22843170166015625, -0.21637344360351562, -0.204315185546875, -0.19225692749023438, -0.18019866943359375, -0.16814041137695312, -0.1560821533203125, -0.14402389526367188, -0.13196563720703125, -0.11990737915039062, -0.10784912109375, -0.09579086303710938, -0.08373260498046875, -0.07167434692382812, -0.0596160888671875, -0.047557830810546875, -0.03549957275390625, -0.023441314697265625, -0.011383056640625, 0.000675201416015625, 0.01273345947265625, 0.024791717529296875, 0.0368499755859375, 0.048908233642578125, 0.06096649169921875, 0.07302474975585938, 0.0850830078125, 0.09714126586914062, 0.10919952392578125, 0.12125778198242188, 0.1333160400390625, 0.14537429809570312, 0.15743255615234375, 0.16949081420898438, 0.181549072265625, 0.19360733032226562, 0.20566558837890625, 0.21772384643554688, 0.2297821044921875, 0.24184036254882812, 0.25389862060546875, 0.2659568786621094, 0.27801513671875, 0.2900733947753906, 0.30213165283203125, 0.3141899108886719, 0.3262481689453125, 0.3383064270019531, 0.35036468505859375, 0.3624229431152344, 0.374481201171875, 0.3865394592285156, 0.39859771728515625, 0.4106559753417969, 0.4227142333984375, 0.4347724914550781, 0.44683074951171875, 0.4588890075683594, 0.470947265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 4.0, 11.0, 12.0, 18.0, 34.0, 49.0, 85.0, 101.0, 179.0, 301.0, 532.0, 1006.0, 2071.0, 5502.0, 23508.0, 426061.0, 3669019.0, 51192.0, 9253.0, 2838.0, 1183.0, 555.0, 306.0, 155.0, 112.0, 73.0, 47.0, 33.0, 18.0, 11.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93212890625, -0.9040374755859375, -0.875946044921875, -0.8478546142578125, -0.81976318359375, -0.7916717529296875, -0.763580322265625, -0.7354888916015625, -0.7073974609375, -0.6793060302734375, -0.651214599609375, -0.6231231689453125, -0.59503173828125, -0.5669403076171875, -0.538848876953125, -0.5107574462890625, -0.482666015625, -0.4545745849609375, -0.426483154296875, -0.3983917236328125, -0.37030029296875, -0.3422088623046875, -0.314117431640625, -0.2860260009765625, -0.2579345703125, -0.2298431396484375, -0.201751708984375, -0.1736602783203125, -0.14556884765625, -0.1174774169921875, -0.089385986328125, -0.0612945556640625, -0.033203125, -0.0051116943359375, 0.022979736328125, 0.0510711669921875, 0.07916259765625, 0.1072540283203125, 0.135345458984375, 0.1634368896484375, 0.1915283203125, 0.2196197509765625, 0.247711181640625, 0.2758026123046875, 0.30389404296875, 0.3319854736328125, 0.360076904296875, 0.3881683349609375, 0.416259765625, 0.4443511962890625, 0.472442626953125, 0.5005340576171875, 0.52862548828125, 0.5567169189453125, 0.584808349609375, 0.6128997802734375, 0.6409912109375, 0.6690826416015625, 0.697174072265625, 0.7252655029296875, 0.75335693359375, 0.7814483642578125, 0.809539794921875, 0.8376312255859375, 0.86572265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 4.0, 12.0, 14.0, 29.0, 40.0, 106.0, 255.0, 2131.0, 1033.0, 200.0, 88.0, 49.0, 25.0, 23.0, 26.0, 8.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66455078125, -0.64788818359375, -0.6312255859375, -0.61456298828125, -0.597900390625, -0.58123779296875, -0.5645751953125, -0.54791259765625, -0.53125, -0.51458740234375, -0.4979248046875, -0.48126220703125, -0.464599609375, -0.44793701171875, -0.4312744140625, -0.41461181640625, -0.39794921875, -0.38128662109375, -0.3646240234375, -0.34796142578125, -0.331298828125, -0.31463623046875, -0.2979736328125, -0.28131103515625, -0.2646484375, -0.24798583984375, -0.2313232421875, -0.21466064453125, -0.197998046875, -0.18133544921875, -0.1646728515625, -0.14801025390625, -0.13134765625, -0.11468505859375, -0.0980224609375, -0.08135986328125, -0.064697265625, -0.04803466796875, -0.0313720703125, -0.01470947265625, 0.001953125, 0.01861572265625, 0.0352783203125, 0.05194091796875, 0.068603515625, 0.08526611328125, 0.1019287109375, 0.11859130859375, 0.13525390625, 0.15191650390625, 0.1685791015625, 0.18524169921875, 0.201904296875, 0.21856689453125, 0.2352294921875, 0.25189208984375, 0.2685546875, 0.28521728515625, 0.3018798828125, 0.31854248046875, 0.335205078125, 0.35186767578125, 0.3685302734375, 0.38519287109375, 0.40185546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 26.0, 49.0, 159.0, 351.0, 284.0, 91.0, 18.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46932053565979, -3.360344409942627, -3.2513680458068848, -3.1423919200897217, -3.0334157943725586, -2.9244394302368164, -2.8154633045196533, -2.7064871788024902, -2.597510814666748, -2.488534688949585, -2.3795583248138428, -2.2705821990966797, -2.1616060733795166, -2.0526299476623535, -1.9436535835266113, -1.8346774578094482, -1.7257013320922852, -1.6167250871658325, -1.5077489614486694, -1.3987727165222168, -1.2897965908050537, -1.180820345878601, -1.0718441009521484, -0.9628679156303406, -0.8538917303085327, -0.7449155449867249, -0.635939359664917, -0.5269631147384644, -0.4179869294166565, -0.30901074409484863, -0.200034499168396, -0.09105831384658813, 0.017917633056640625, 0.12689383327960968, 0.23587003350257874, 0.344846248626709, 0.45382243394851685, 0.5627986192703247, 0.6717748641967773, 0.7807510495185852, 0.8897272348403931, 0.9987034201622009, 1.1076796054840088, 1.2166558504104614, 1.325632095336914, 1.4346082210540771, 1.5435844659805298, 1.6525607109069824, 1.7615368366241455, 1.8705130815505981, 1.9794892072677612, 2.088465452194214, 2.197441577911377, 2.306417942047119, 2.4153940677642822, 2.5243701934814453, 2.6333465576171875, 2.7423226833343506, 2.8512990474700928, 2.960275173187256, 3.069251298904419, 3.178227424621582, 3.287203788757324, 3.3961799144744873, 3.5051560401916504]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 6.0, 18.0, 21.0, 23.0, 16.0, 41.0, 32.0, 38.0, 47.0, 44.0, 56.0, 47.0, 50.0, 50.0, 68.0, 59.0, 58.0, 47.0, 41.0, 40.0, 44.0, 25.0, 23.0, 20.0, 18.0, 11.0, 10.0, 12.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.013291120529175, -1.9637080430984497, -1.914124846458435, -1.86454176902771, -1.8149585723876953, -1.7653754949569702, -1.7157924175262451, -1.6662092208862305, -1.6166260242462158, -1.5670429468154907, -1.517459750175476, -1.467876672744751, -1.4182934761047363, -1.3687103986740112, -1.3191273212432861, -1.2695441246032715, -1.2199610471725464, -1.1703779697418213, -1.1207947731018066, -1.0712116956710815, -1.021628499031067, -0.9720454216003418, -0.9224622845649719, -0.872879147529602, -0.8232960104942322, -0.7737128734588623, -0.7241297364234924, -0.6745465993881226, -0.6249635219573975, -0.5753803253173828, -0.5257972478866577, -0.47621411085128784, -0.4266310930252075, -0.37704795598983765, -0.3274648189544678, -0.2778817117214203, -0.22829857468605042, -0.17871543765068054, -0.12913233041763306, -0.07954919338226318, -0.02996605634689331, 0.019617073237895966, 0.06920020282268524, 0.11878332495689392, 0.1683664619922638, 0.21794959902763367, 0.26753270626068115, 0.317115843296051, 0.3666989803314209, 0.41628211736679077, 0.46586525440216064, 0.5154483318328857, 0.5650315284729004, 0.6146146059036255, 0.6641977429389954, 0.7137808799743652, 0.7633640170097351, 0.812947154045105, 0.8625302910804749, 0.9121134281158447, 0.9616965055465698, 1.0112797021865845, 1.0608627796173096, 1.1104459762573242, 1.1600290536880493]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 17.0, 8.0, 19.0, 23.0, 40.0, 54.0, 93.0, 125.0, 244.0, 357.0, 610.0, 1063.0, 2045.0, 4419.0, 10831.0, 32316.0, 137457.0, 625477.0, 173103.0, 37952.0, 12172.0, 4992.0, 2262.0, 1224.0, 599.0, 374.0, 252.0, 133.0, 88.0, 57.0, 48.0, 23.0, 23.0, 14.0, 5.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7656784057617188, -0.7378997802734375, -0.7101211547851562, -0.682342529296875, -0.6545639038085938, -0.6267852783203125, -0.5990066528320312, -0.57122802734375, -0.5434494018554688, -0.5156707763671875, -0.48789215087890625, -0.460113525390625, -0.43233489990234375, -0.4045562744140625, -0.37677764892578125, -0.3489990234375, -0.32122039794921875, -0.2934417724609375, -0.26566314697265625, -0.237884521484375, -0.21010589599609375, -0.1823272705078125, -0.15454864501953125, -0.12677001953125, -0.09899139404296875, -0.0712127685546875, -0.04343414306640625, -0.015655517578125, 0.01212310791015625, 0.0399017333984375, 0.06768035888671875, 0.095458984375, 0.12323760986328125, 0.1510162353515625, 0.17879486083984375, 0.206573486328125, 0.23435211181640625, 0.2621307373046875, 0.28990936279296875, 0.31768798828125, 0.34546661376953125, 0.3732452392578125, 0.40102386474609375, 0.428802490234375, 0.45658111572265625, 0.4843597412109375, 0.5121383666992188, 0.5399169921875, 0.5676956176757812, 0.5954742431640625, 0.6232528686523438, 0.651031494140625, 0.6788101196289062, 0.7065887451171875, 0.7343673706054688, 0.76214599609375, 0.7899246215820312, 0.8177032470703125, 0.8454818725585938, 0.873260498046875, 0.9010391235351562, 0.9288177490234375, 0.9565963745117188, 0.984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 6.0, 23.0, 22.0, 12.0, 30.0, 41.0, 28.0, 53.0, 41.0, 54.0, 67.0, 66.0, 64.0, 56.0, 59.0, 56.0, 51.0, 57.0, 43.0, 41.0, 23.0, 23.0, 17.0, 13.0, 14.0, 9.0, 8.0, 6.0, 4.0, 1.0, 0.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30322265625, -0.2923164367675781, -0.28141021728515625, -0.2705039978027344, -0.2595977783203125, -0.24869155883789062, -0.23778533935546875, -0.22687911987304688, -0.215972900390625, -0.20506668090820312, -0.19416046142578125, -0.18325424194335938, -0.1723480224609375, -0.16144180297851562, -0.15053558349609375, -0.13962936401367188, -0.12872314453125, -0.11781692504882812, -0.10691070556640625, -0.09600448608398438, -0.0850982666015625, -0.07419204711914062, -0.06328582763671875, -0.052379608154296875, -0.041473388671875, -0.030567169189453125, -0.01966094970703125, -0.008754730224609375, 0.0021514892578125, 0.013057708740234375, 0.02396392822265625, 0.034870147705078125, 0.0457763671875, 0.056682586669921875, 0.06758880615234375, 0.07849502563476562, 0.0894012451171875, 0.10030746459960938, 0.11121368408203125, 0.12211990356445312, 0.133026123046875, 0.14393234252929688, 0.15483856201171875, 0.16574478149414062, 0.1766510009765625, 0.18755722045898438, 0.19846343994140625, 0.20936965942382812, 0.22027587890625, 0.23118209838867188, 0.24208831787109375, 0.2529945373535156, 0.2639007568359375, 0.2748069763183594, 0.28571319580078125, 0.2966194152832031, 0.307525634765625, 0.3184318542480469, 0.32933807373046875, 0.3402442932128906, 0.3511505126953125, 0.3620567321777344, 0.37296295166015625, 0.3838691711425781, 0.394775390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 11.0, 10.0, 9.0, 9.0, 13.0, 19.0, 25.0, 41.0, 72.0, 87.0, 151.0, 282.0, 554.0, 1382.0, 3947.0, 15801.0, 96957.0, 736038.0, 162294.0, 22547.0, 5187.0, 1599.0, 694.0, 341.0, 191.0, 104.0, 60.0, 39.0, 19.0, 17.0, 10.0, 11.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0303955078125, -0.994384765625, -0.9583740234375, -0.92236328125, -0.8863525390625, -0.850341796875, -0.8143310546875, -0.7783203125, -0.7423095703125, -0.706298828125, -0.6702880859375, -0.63427734375, -0.5982666015625, -0.562255859375, -0.5262451171875, -0.490234375, -0.4542236328125, -0.418212890625, -0.3822021484375, -0.34619140625, -0.3101806640625, -0.274169921875, -0.2381591796875, -0.2021484375, -0.1661376953125, -0.130126953125, -0.0941162109375, -0.05810546875, -0.0220947265625, 0.013916015625, 0.0499267578125, 0.0859375, 0.1219482421875, 0.157958984375, 0.1939697265625, 0.22998046875, 0.2659912109375, 0.302001953125, 0.3380126953125, 0.3740234375, 0.4100341796875, 0.446044921875, 0.4820556640625, 0.51806640625, 0.5540771484375, 0.590087890625, 0.6260986328125, 0.662109375, 0.6981201171875, 0.734130859375, 0.7701416015625, 0.80615234375, 0.8421630859375, 0.878173828125, 0.9141845703125, 0.9501953125, 0.9862060546875, 1.022216796875, 1.0582275390625, 1.09423828125, 1.1302490234375, 1.166259765625, 1.2022705078125, 1.23828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 8.0, 13.0, 9.0, 12.0, 13.0, 17.0, 26.0, 26.0, 34.0, 37.0, 33.0, 37.0, 51.0, 50.0, 49.0, 67.0, 56.0, 53.0, 52.0, 57.0, 37.0, 39.0, 39.0, 41.0, 30.0, 20.0, 13.0, 13.0, 19.0, 11.0, 8.0, 8.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.171539306640625, -1.13018798828125, -1.088836669921875, -1.0474853515625, -1.006134033203125, -0.96478271484375, -0.923431396484375, -0.882080078125, -0.840728759765625, -0.79937744140625, -0.758026123046875, -0.7166748046875, -0.675323486328125, -0.63397216796875, -0.592620849609375, -0.55126953125, -0.509918212890625, -0.46856689453125, -0.427215576171875, -0.3858642578125, -0.344512939453125, -0.30316162109375, -0.261810302734375, -0.220458984375, -0.179107666015625, -0.13775634765625, -0.096405029296875, -0.0550537109375, -0.013702392578125, 0.02764892578125, 0.069000244140625, 0.1103515625, 0.151702880859375, 0.19305419921875, 0.234405517578125, 0.2757568359375, 0.317108154296875, 0.35845947265625, 0.399810791015625, 0.441162109375, 0.482513427734375, 0.52386474609375, 0.565216064453125, 0.6065673828125, 0.647918701171875, 0.68927001953125, 0.730621337890625, 0.77197265625, 0.813323974609375, 0.85467529296875, 0.896026611328125, 0.9373779296875, 0.978729248046875, 1.02008056640625, 1.061431884765625, 1.102783203125, 1.144134521484375, 1.18548583984375, 1.226837158203125, 1.2681884765625, 1.309539794921875, 1.35089111328125, 1.392242431640625, 1.43359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 6.0, 5.0, 18.0, 32.0, 100.0, 322.0, 1781.0, 993598.0, 51452.0, 892.0, 236.0, 66.0, 24.0, 9.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9833984375, -1.9211273193359375, -1.858856201171875, -1.7965850830078125, -1.73431396484375, -1.6720428466796875, -1.609771728515625, -1.5475006103515625, -1.4852294921875, -1.4229583740234375, -1.360687255859375, -1.2984161376953125, -1.23614501953125, -1.1738739013671875, -1.111602783203125, -1.0493316650390625, -0.987060546875, -0.9247894287109375, -0.862518310546875, -0.8002471923828125, -0.73797607421875, -0.6757049560546875, -0.613433837890625, -0.5511627197265625, -0.4888916015625, -0.4266204833984375, -0.364349365234375, -0.3020782470703125, -0.23980712890625, -0.1775360107421875, -0.115264892578125, -0.0529937744140625, 0.00927734375, 0.0715484619140625, 0.133819580078125, 0.1960906982421875, 0.25836181640625, 0.3206329345703125, 0.382904052734375, 0.4451751708984375, 0.5074462890625, 0.5697174072265625, 0.631988525390625, 0.6942596435546875, 0.75653076171875, 0.8188018798828125, 0.881072998046875, 0.9433441162109375, 1.005615234375, 1.0678863525390625, 1.130157470703125, 1.1924285888671875, 1.25469970703125, 1.3169708251953125, 1.379241943359375, 1.4415130615234375, 1.5037841796875, 1.5660552978515625, 1.628326416015625, 1.6905975341796875, 1.75286865234375, 1.8151397705078125, 1.877410888671875, 1.9396820068359375, 2.001953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 14.0, 28.0, 46.0, 98.0, 152.0, 180.0, 168.0, 141.0, 74.0, 36.0, 16.0, 12.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.963180541992188e-05, -7.78520479798317e-05, -7.607229053974152e-05, -7.429253309965134e-05, -7.251277565956116e-05, -7.073301821947098e-05, -6.89532607793808e-05, -6.717350333929062e-05, -6.539374589920044e-05, -6.361398845911026e-05, -6.183423101902008e-05, -6.00544735789299e-05, -5.827471613883972e-05, -5.649495869874954e-05, -5.471520125865936e-05, -5.293544381856918e-05, -5.1155686378479004e-05, -4.9375928938388824e-05, -4.7596171498298645e-05, -4.5816414058208466e-05, -4.4036656618118286e-05, -4.225689917802811e-05, -4.047714173793793e-05, -3.869738429784775e-05, -3.691762685775757e-05, -3.513786941766739e-05, -3.335811197757721e-05, -3.157835453748703e-05, -2.979859709739685e-05, -2.801883965730667e-05, -2.6239082217216492e-05, -2.4459324777126312e-05, -2.2679567337036133e-05, -2.0899809896945953e-05, -1.9120052456855774e-05, -1.7340295016765594e-05, -1.5560537576675415e-05, -1.3780780136585236e-05, -1.2001022696495056e-05, -1.0221265256404877e-05, -8.441507816314697e-06, -6.661750376224518e-06, -4.881992936134338e-06, -3.102235496044159e-06, -1.3224780559539795e-06, 4.5727938413619995e-07, 2.2370368242263794e-06, 4.016794264316559e-06, 5.796551704406738e-06, 7.576309144496918e-06, 9.356066584587097e-06, 1.1135824024677277e-05, 1.2915581464767456e-05, 1.4695338904857635e-05, 1.6475096344947815e-05, 1.8254853785037994e-05, 2.0034611225128174e-05, 2.1814368665218353e-05, 2.3594126105308533e-05, 2.5373883545398712e-05, 2.715364098548889e-05, 2.893339842557907e-05, 3.071315586566925e-05, 3.249291330575943e-05, 3.427267074584961e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 12.0, 19.0, 42.0, 88.0, 191.0, 374.0, 3035.0, 1039154.0, 4831.0, 420.0, 196.0, 83.0, 56.0, 23.0, 14.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.91015625, -1.84552001953125, -1.7808837890625, -1.71624755859375, -1.651611328125, -1.58697509765625, -1.5223388671875, -1.45770263671875, -1.39306640625, -1.32843017578125, -1.2637939453125, -1.19915771484375, -1.134521484375, -1.06988525390625, -1.0052490234375, -0.94061279296875, -0.8759765625, -0.81134033203125, -0.7467041015625, -0.68206787109375, -0.617431640625, -0.55279541015625, -0.4881591796875, -0.42352294921875, -0.35888671875, -0.29425048828125, -0.2296142578125, -0.16497802734375, -0.100341796875, -0.03570556640625, 0.0289306640625, 0.09356689453125, 0.158203125, 0.22283935546875, 0.2874755859375, 0.35211181640625, 0.416748046875, 0.48138427734375, 0.5460205078125, 0.61065673828125, 0.67529296875, 0.73992919921875, 0.8045654296875, 0.86920166015625, 0.933837890625, 0.99847412109375, 1.0631103515625, 1.12774658203125, 1.1923828125, 1.25701904296875, 1.3216552734375, 1.38629150390625, 1.450927734375, 1.51556396484375, 1.5802001953125, 1.64483642578125, 1.70947265625, 1.77410888671875, 1.8387451171875, 1.90338134765625, 1.968017578125, 2.03265380859375, 2.0972900390625, 2.16192626953125, 2.2265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 20.0, 199.0, 637.0, 128.0, 11.0, 8.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.845703125, -1.77838134765625, -1.7110595703125, -1.64373779296875, -1.576416015625, -1.50909423828125, -1.4417724609375, -1.37445068359375, -1.30712890625, -1.23980712890625, -1.1724853515625, -1.10516357421875, -1.037841796875, -0.97052001953125, -0.9031982421875, -0.83587646484375, -0.7685546875, -0.70123291015625, -0.6339111328125, -0.56658935546875, -0.499267578125, -0.43194580078125, -0.3646240234375, -0.29730224609375, -0.22998046875, -0.16265869140625, -0.0953369140625, -0.02801513671875, 0.039306640625, 0.10662841796875, 0.1739501953125, 0.24127197265625, 0.30859375, 0.37591552734375, 0.4432373046875, 0.51055908203125, 0.577880859375, 0.64520263671875, 0.7125244140625, 0.77984619140625, 0.84716796875, 0.91448974609375, 0.9818115234375, 1.04913330078125, 1.116455078125, 1.18377685546875, 1.2510986328125, 1.31842041015625, 1.3857421875, 1.45306396484375, 1.5203857421875, 1.58770751953125, 1.655029296875, 1.72235107421875, 1.7896728515625, 1.85699462890625, 1.92431640625, 1.99163818359375, 2.0589599609375, 2.12628173828125, 2.193603515625, 2.26092529296875, 2.3282470703125, 2.39556884765625, 2.462890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 17.0, 52.0, 108.0, 326.0, 334.0, 122.0, 26.0, 9.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.279420852661133, -3.861116409301758, -3.442812204360962, -3.024507761001587, -2.606203556060791, -2.187899112701416, -1.769594669342041, -1.3512904644012451, -0.9329860210418701, -0.5146816968917847, -0.09637731313705444, 0.3219270706176758, 0.7402313947677612, 1.1585357189178467, 1.5768401622772217, 1.9951443672180176, 2.4134488105773926, 2.8317532539367676, 3.2500574588775635, 3.6683619022369385, 4.086666107177734, 4.504970550537109, 4.923274993896484, 5.341579437255859, 5.759883880615234, 6.178188323974609, 6.596492767333984, 7.014797210693359, 7.433101177215576, 7.851405620574951, 8.269710540771484, 8.688014030456543, 9.106318473815918, 9.524622917175293, 9.942927360534668, 10.361231803894043, 10.779536247253418, 11.197839736938477, 11.616144180297852, 12.034448623657227, 12.452753067016602, 12.871057510375977, 13.289361953735352, 13.707666397094727, 14.125970840454102, 14.544275283813477, 14.962579727172852, 15.38088321685791, 15.799188613891602, 16.217493057250977, 16.63579750061035, 17.054101943969727, 17.4724063873291, 17.890710830688477, 18.30901527404785, 18.727319717407227, 19.14562225341797, 19.563926696777344, 19.98223114013672, 20.400535583496094, 20.81884002685547, 21.237144470214844, 21.65544891357422, 22.073753356933594, 22.49205780029297]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 7.0, 5.0, 13.0, 19.0, 18.0, 20.0, 19.0, 26.0, 20.0, 31.0, 45.0, 28.0, 36.0, 49.0, 43.0, 46.0, 35.0, 42.0, 40.0, 41.0, 45.0, 37.0, 38.0, 29.0, 40.0, 28.0, 25.0, 28.0, 17.0, 20.0, 12.0, 9.0, 15.0, 14.0, 9.0, 6.0, 4.0, 8.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.7211198806762695, -5.543257713317871, -5.365395545959473, -5.187533378601074, -5.009671688079834, -4.8318095207214355, -4.653947353363037, -4.476085186004639, -4.29822301864624, -4.120360851287842, -3.9424989223480225, -3.764636754989624, -3.5867745876312256, -3.4089126586914062, -3.231050491333008, -3.0531883239746094, -2.87532639503479, -2.6974642276763916, -2.5196022987365723, -2.341740131378174, -2.1638779640197754, -1.9860159158706665, -1.8081538677215576, -1.6302917003631592, -1.4524296522140503, -1.2745676040649414, -1.096705436706543, -0.9188433885574341, -0.7409812808036804, -0.5631191730499268, -0.38525712490081787, -0.20739495754241943, -0.029532909393310547, 0.14832918345928192, 0.3261912763118744, 0.5040533542633057, 0.6819154620170593, 0.859777569770813, 1.0376396179199219, 1.2155017852783203, 1.3933638334274292, 1.571225881576538, 1.7490880489349365, 1.9269500970840454, 2.1048121452331543, 2.2826743125915527, 2.460536479949951, 2.6383986473083496, 2.816260576248169, 2.9941227436065674, 3.1719846725463867, 3.349846839904785, 3.5277090072631836, 3.705571174621582, 3.8834331035614014, 4.061295509338379, 4.239157199859619, 4.417019367218018, 4.594881534576416, 4.772743225097656, 4.950605392456055, 5.128467559814453, 5.306329727172852, 5.48419189453125, 5.662054061889648]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 12.0, 11.0, 7.0, 11.0, 17.0, 20.0, 33.0, 64.0, 72.0, 121.0, 155.0, 222.0, 370.0, 578.0, 1025.0, 1851.0, 3850.0, 8558.0, 24076.0, 118059.0, 3758479.0, 221112.0, 33970.0, 11089.0, 4711.0, 2370.0, 1339.0, 754.0, 433.0, 280.0, 182.0, 126.0, 93.0, 59.0, 57.0, 26.0, 27.0, 16.0, 15.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6069564819335938, -0.5864715576171875, -0.5659866333007812, -0.545501708984375, -0.5250167846679688, -0.5045318603515625, -0.48404693603515625, -0.46356201171875, -0.44307708740234375, -0.4225921630859375, -0.40210723876953125, -0.381622314453125, -0.36113739013671875, -0.3406524658203125, -0.32016754150390625, -0.2996826171875, -0.27919769287109375, -0.2587127685546875, -0.23822784423828125, -0.217742919921875, -0.19725799560546875, -0.1767730712890625, -0.15628814697265625, -0.13580322265625, -0.11531829833984375, -0.0948333740234375, -0.07434844970703125, -0.053863525390625, -0.03337860107421875, -0.0128936767578125, 0.00759124755859375, 0.028076171875, 0.04856109619140625, 0.0690460205078125, 0.08953094482421875, 0.110015869140625, 0.13050079345703125, 0.1509857177734375, 0.17147064208984375, 0.19195556640625, 0.21244049072265625, 0.2329254150390625, 0.25341033935546875, 0.273895263671875, 0.29438018798828125, 0.3148651123046875, 0.33535003662109375, 0.3558349609375, 0.37631988525390625, 0.3968048095703125, 0.41728973388671875, 0.437774658203125, 0.45825958251953125, 0.4787445068359375, 0.49922943115234375, 0.51971435546875, 0.5401992797851562, 0.5606842041015625, 0.5811691284179688, 0.601654052734375, 0.6221389770507812, 0.6426239013671875, 0.6631088256835938, 0.68359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 8.0, 6.0, 6.0, 10.0, 16.0, 24.0, 33.0, 26.0, 42.0, 54.0, 41.0, 60.0, 67.0, 52.0, 50.0, 66.0, 52.0, 58.0, 46.0, 47.0, 43.0, 32.0, 31.0, 36.0, 23.0, 10.0, 21.0, 12.0, 9.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31591796875, -0.30384063720703125, -0.2917633056640625, -0.27968597412109375, -0.267608642578125, -0.25553131103515625, -0.2434539794921875, -0.23137664794921875, -0.21929931640625, -0.20722198486328125, -0.1951446533203125, -0.18306732177734375, -0.170989990234375, -0.15891265869140625, -0.1468353271484375, -0.13475799560546875, -0.1226806640625, -0.11060333251953125, -0.0985260009765625, -0.08644866943359375, -0.074371337890625, -0.06229400634765625, -0.0502166748046875, -0.03813934326171875, -0.02606201171875, -0.01398468017578125, -0.0019073486328125, 0.01016998291015625, 0.022247314453125, 0.03432464599609375, 0.0464019775390625, 0.05847930908203125, 0.070556640625, 0.08263397216796875, 0.0947113037109375, 0.10678863525390625, 0.118865966796875, 0.13094329833984375, 0.1430206298828125, 0.15509796142578125, 0.16717529296875, 0.17925262451171875, 0.1913299560546875, 0.20340728759765625, 0.215484619140625, 0.22756195068359375, 0.2396392822265625, 0.25171661376953125, 0.2637939453125, 0.27587127685546875, 0.2879486083984375, 0.30002593994140625, 0.312103271484375, 0.32418060302734375, 0.3362579345703125, 0.34833526611328125, 0.36041259765625, 0.37248992919921875, 0.3845672607421875, 0.39664459228515625, 0.408721923828125, 0.42079925537109375, 0.4328765869140625, 0.44495391845703125, 0.45703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 13.0, 10.0, 12.0, 31.0, 42.0, 63.0, 93.0, 216.0, 412.0, 839.0, 2083.0, 8207.0, 209765.0, 3948213.0, 19040.0, 3112.0, 1119.0, 447.0, 250.0, 116.0, 82.0, 44.0, 30.0, 20.0, 9.0, 11.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.594024658203125, -1.54449462890625, -1.494964599609375, -1.4454345703125, -1.395904541015625, -1.34637451171875, -1.296844482421875, -1.247314453125, -1.197784423828125, -1.14825439453125, -1.098724365234375, -1.0491943359375, -0.999664306640625, -0.95013427734375, -0.900604248046875, -0.85107421875, -0.801544189453125, -0.75201416015625, -0.702484130859375, -0.6529541015625, -0.603424072265625, -0.55389404296875, -0.504364013671875, -0.454833984375, -0.405303955078125, -0.35577392578125, -0.306243896484375, -0.2567138671875, -0.207183837890625, -0.15765380859375, -0.108123779296875, -0.05859375, -0.009063720703125, 0.04046630859375, 0.089996337890625, 0.1395263671875, 0.189056396484375, 0.23858642578125, 0.288116455078125, 0.337646484375, 0.387176513671875, 0.43670654296875, 0.486236572265625, 0.5357666015625, 0.585296630859375, 0.63482666015625, 0.684356689453125, 0.73388671875, 0.783416748046875, 0.83294677734375, 0.882476806640625, 0.9320068359375, 0.981536865234375, 1.03106689453125, 1.080596923828125, 1.130126953125, 1.179656982421875, 1.22918701171875, 1.278717041015625, 1.3282470703125, 1.377777099609375, 1.42730712890625, 1.476837158203125, 1.5263671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 29.0, 54.0, 198.0, 3150.0, 442.0, 91.0, 40.0, 19.0, 9.0, 7.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5631027221679688, -0.5392913818359375, -0.5154800415039062, -0.491668701171875, -0.46785736083984375, -0.4440460205078125, -0.42023468017578125, -0.39642333984375, -0.37261199951171875, -0.3488006591796875, -0.32498931884765625, -0.301177978515625, -0.27736663818359375, -0.2535552978515625, -0.22974395751953125, -0.2059326171875, -0.18212127685546875, -0.1583099365234375, -0.13449859619140625, -0.110687255859375, -0.08687591552734375, -0.0630645751953125, -0.03925323486328125, -0.01544189453125, 0.00836944580078125, 0.0321807861328125, 0.05599212646484375, 0.079803466796875, 0.10361480712890625, 0.1274261474609375, 0.15123748779296875, 0.175048828125, 0.19886016845703125, 0.2226715087890625, 0.24648284912109375, 0.270294189453125, 0.29410552978515625, 0.3179168701171875, 0.34172821044921875, 0.36553955078125, 0.38935089111328125, 0.4131622314453125, 0.43697357177734375, 0.460784912109375, 0.48459625244140625, 0.5084075927734375, 0.5322189331054688, 0.5560302734375, 0.5798416137695312, 0.6036529541015625, 0.6274642944335938, 0.651275634765625, 0.6750869750976562, 0.6988983154296875, 0.7227096557617188, 0.74652099609375, 0.7703323364257812, 0.7941436767578125, 0.8179550170898438, 0.841766357421875, 0.8655776977539062, 0.8893890380859375, 0.9132003784179688, 0.93701171875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 20.0, 110.0, 261.0, 348.0, 151.0, 61.0, 15.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.62447452545166, -4.529904365539551, -4.435334205627441, -4.34076452255249, -4.246194362640381, -4.1516242027282715, -4.05705451965332, -3.962484359741211, -3.8679141998291016, -3.773344039916992, -3.678774118423462, -3.5842041969299316, -3.4896340370178223, -3.395063877105713, -3.3004939556121826, -3.2059240341186523, -3.111353874206543, -3.0167837142944336, -2.9222137928009033, -2.827643871307373, -2.7330737113952637, -2.6385035514831543, -2.543933629989624, -2.4493637084960938, -2.3547935485839844, -2.260223388671875, -2.1656534671783447, -2.0710835456848145, -1.976513385772705, -1.8819433450698853, -1.7873733043670654, -1.6928032636642456, -1.5982331037521362, -1.5036630630493164, -1.4090930223464966, -1.3145229816436768, -1.219952940940857, -1.125382900238037, -1.0308128595352173, -0.9362428188323975, -0.8416727781295776, -0.7471027374267578, -0.652532696723938, -0.5579626560211182, -0.46339261531829834, -0.3688225746154785, -0.2742525339126587, -0.17968249320983887, -0.08511245250701904, 0.009457588195800781, 0.1040276288986206, 0.19859766960144043, 0.29316771030426025, 0.3877377510070801, 0.4823077917098999, 0.5768778324127197, 0.6714478731155396, 0.7660179138183594, 0.8605879545211792, 0.955157995223999, 1.0497280359268188, 1.1442980766296387, 1.2388681173324585, 1.3334381580352783, 1.4280081987380981]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 8.0, 3.0, 2.0, 3.0, 5.0, 9.0, 12.0, 12.0, 24.0, 21.0, 24.0, 30.0, 38.0, 41.0, 54.0, 60.0, 56.0, 60.0, 57.0, 72.0, 61.0, 55.0, 62.0, 40.0, 30.0, 29.0, 26.0, 29.0, 22.0, 13.0, 11.0, 9.0, 7.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.449151873588562, -1.4070719480514526, -1.3649920225143433, -1.3229120969772339, -1.2808321714401245, -1.2387522459030151, -1.1966723203659058, -1.1545923948287964, -1.112512469291687, -1.0704325437545776, -1.0283526182174683, -0.9862726926803589, -0.9441927671432495, -0.9021128416061401, -0.8600329160690308, -0.8179529905319214, -0.775873064994812, -0.7337931394577026, -0.6917132139205933, -0.6496332883834839, -0.6075533628463745, -0.5654734373092651, -0.5233935117721558, -0.4813135862350464, -0.439233660697937, -0.39715373516082764, -0.35507380962371826, -0.3129938840866089, -0.2709139585494995, -0.22883403301239014, -0.18675410747528076, -0.1446741819381714, -0.10259437561035156, -0.06051445007324219, -0.018434524536132812, 0.023645401000976562, 0.06572532653808594, 0.10780525207519531, 0.1498851776123047, 0.19196510314941406, 0.23404502868652344, 0.2761249542236328, 0.3182048797607422, 0.36028480529785156, 0.40236473083496094, 0.4444446563720703, 0.4865245819091797, 0.5286045074462891, 0.5706844329833984, 0.6127643585205078, 0.6548442840576172, 0.6969242095947266, 0.7390041351318359, 0.7810840606689453, 0.8231639862060547, 0.8652439117431641, 0.9073238372802734, 0.9494037628173828, 0.9914836883544922, 1.0335636138916016, 1.075643539428711, 1.1177234649658203, 1.1598033905029297, 1.201883316040039, 1.2439632415771484]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 10.0, 17.0, 18.0, 34.0, 54.0, 93.0, 181.0, 268.0, 577.0, 1655.0, 5237.0, 22750.0, 142806.0, 689898.0, 152551.0, 23999.0, 5437.0, 1610.0, 656.0, 260.0, 149.0, 92.0, 59.0, 42.0, 19.0, 18.0, 12.0, 9.0, 8.0, 4.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.166839599609375, -1.12860107421875, -1.090362548828125, -1.0521240234375, -1.013885498046875, -0.97564697265625, -0.937408447265625, -0.899169921875, -0.860931396484375, -0.82269287109375, -0.784454345703125, -0.7462158203125, -0.707977294921875, -0.66973876953125, -0.631500244140625, -0.59326171875, -0.555023193359375, -0.51678466796875, -0.478546142578125, -0.4403076171875, -0.402069091796875, -0.36383056640625, -0.325592041015625, -0.287353515625, -0.249114990234375, -0.21087646484375, -0.172637939453125, -0.1343994140625, -0.096160888671875, -0.05792236328125, -0.019683837890625, 0.0185546875, 0.056793212890625, 0.09503173828125, 0.133270263671875, 0.1715087890625, 0.209747314453125, 0.24798583984375, 0.286224365234375, 0.324462890625, 0.362701416015625, 0.40093994140625, 0.439178466796875, 0.4774169921875, 0.515655517578125, 0.55389404296875, 0.592132568359375, 0.63037109375, 0.668609619140625, 0.70684814453125, 0.745086669921875, 0.7833251953125, 0.821563720703125, 0.85980224609375, 0.898040771484375, 0.936279296875, 0.974517822265625, 1.01275634765625, 1.050994873046875, 1.0892333984375, 1.127471923828125, 1.16571044921875, 1.203948974609375, 1.2421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 7.0, 15.0, 8.0, 18.0, 24.0, 21.0, 39.0, 49.0, 42.0, 48.0, 61.0, 63.0, 49.0, 52.0, 68.0, 75.0, 40.0, 44.0, 41.0, 45.0, 30.0, 36.0, 26.0, 23.0, 21.0, 12.0, 8.0, 8.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.329345703125, -0.3175239562988281, -0.30570220947265625, -0.2938804626464844, -0.2820587158203125, -0.2702369689941406, -0.25841522216796875, -0.24659347534179688, -0.234771728515625, -0.22294998168945312, -0.21112823486328125, -0.19930648803710938, -0.1874847412109375, -0.17566299438476562, -0.16384124755859375, -0.15201950073242188, -0.14019775390625, -0.12837600708007812, -0.11655426025390625, -0.10473251342773438, -0.0929107666015625, -0.08108901977539062, -0.06926727294921875, -0.057445526123046875, -0.045623779296875, -0.033802032470703125, -0.02198028564453125, -0.010158538818359375, 0.0016632080078125, 0.013484954833984375, 0.02530670166015625, 0.037128448486328125, 0.0489501953125, 0.060771942138671875, 0.07259368896484375, 0.08441543579101562, 0.0962371826171875, 0.10805892944335938, 0.11988067626953125, 0.13170242309570312, 0.143524169921875, 0.15534591674804688, 0.16716766357421875, 0.17898941040039062, 0.1908111572265625, 0.20263290405273438, 0.21445465087890625, 0.22627639770507812, 0.23809814453125, 0.24991989135742188, 0.26174163818359375, 0.2735633850097656, 0.2853851318359375, 0.2972068786621094, 0.30902862548828125, 0.3208503723144531, 0.332672119140625, 0.3444938659667969, 0.35631561279296875, 0.3681373596191406, 0.3799591064453125, 0.3917808532714844, 0.40360260009765625, 0.4154243469238281, 0.42724609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 5.0, 15.0, 15.0, 15.0, 12.0, 29.0, 21.0, 29.0, 41.0, 47.0, 68.0, 77.0, 138.0, 210.0, 400.0, 768.0, 1676.0, 4077.0, 11230.0, 36120.0, 145091.0, 565335.0, 210927.0, 48529.0, 14533.0, 5067.0, 2016.0, 858.0, 420.0, 249.0, 141.0, 105.0, 62.0, 52.0, 39.0, 25.0, 22.0, 14.0, 16.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.67333984375, -0.648956298828125, -0.62457275390625, -0.600189208984375, -0.5758056640625, -0.551422119140625, -0.52703857421875, -0.502655029296875, -0.478271484375, -0.453887939453125, -0.42950439453125, -0.405120849609375, -0.3807373046875, -0.356353759765625, -0.33197021484375, -0.307586669921875, -0.283203125, -0.258819580078125, -0.23443603515625, -0.210052490234375, -0.1856689453125, -0.161285400390625, -0.13690185546875, -0.112518310546875, -0.088134765625, -0.063751220703125, -0.03936767578125, -0.014984130859375, 0.0093994140625, 0.033782958984375, 0.05816650390625, 0.082550048828125, 0.10693359375, 0.131317138671875, 0.15570068359375, 0.180084228515625, 0.2044677734375, 0.228851318359375, 0.25323486328125, 0.277618408203125, 0.302001953125, 0.326385498046875, 0.35076904296875, 0.375152587890625, 0.3995361328125, 0.423919677734375, 0.44830322265625, 0.472686767578125, 0.4970703125, 0.521453857421875, 0.54583740234375, 0.570220947265625, 0.5946044921875, 0.618988037109375, 0.64337158203125, 0.667755126953125, 0.692138671875, 0.716522216796875, 0.74090576171875, 0.765289306640625, 0.7896728515625, 0.814056396484375, 0.83843994140625, 0.862823486328125, 0.88720703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 4.0, 5.0, 4.0, 11.0, 9.0, 11.0, 13.0, 11.0, 22.0, 24.0, 26.0, 43.0, 44.0, 33.0, 36.0, 43.0, 38.0, 47.0, 28.0, 50.0, 43.0, 42.0, 48.0, 27.0, 33.0, 44.0, 34.0, 37.0, 27.0, 37.0, 22.0, 11.0, 14.0, 18.0, 13.0, 8.0, 8.0, 8.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.03125, -0.994659423828125, -0.95806884765625, -0.921478271484375, -0.8848876953125, -0.848297119140625, -0.81170654296875, -0.775115966796875, -0.738525390625, -0.701934814453125, -0.66534423828125, -0.628753662109375, -0.5921630859375, -0.555572509765625, -0.51898193359375, -0.482391357421875, -0.44580078125, -0.409210205078125, -0.37261962890625, -0.336029052734375, -0.2994384765625, -0.262847900390625, -0.22625732421875, -0.189666748046875, -0.153076171875, -0.116485595703125, -0.07989501953125, -0.043304443359375, -0.0067138671875, 0.029876708984375, 0.06646728515625, 0.103057861328125, 0.1396484375, 0.176239013671875, 0.21282958984375, 0.249420166015625, 0.2860107421875, 0.322601318359375, 0.35919189453125, 0.395782470703125, 0.432373046875, 0.468963623046875, 0.50555419921875, 0.542144775390625, 0.5787353515625, 0.615325927734375, 0.65191650390625, 0.688507080078125, 0.72509765625, 0.761688232421875, 0.79827880859375, 0.834869384765625, 0.8714599609375, 0.908050537109375, 0.94464111328125, 0.981231689453125, 1.017822265625, 1.054412841796875, 1.09100341796875, 1.127593994140625, 1.1641845703125, 1.200775146484375, 1.23736572265625, 1.273956298828125, 1.310546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 4.0, 9.0, 22.0, 32.0, 45.0, 92.0, 128.0, 217.0, 408.0, 899.0, 2100.0, 7335.0, 59482.0, 626236.0, 319932.0, 24332.0, 4297.0, 1502.0, 640.0, 362.0, 187.0, 102.0, 67.0, 36.0, 19.0, 10.0, 17.0, 9.0, 4.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.317626953125, -0.30731964111328125, -0.2970123291015625, -0.28670501708984375, -0.276397705078125, -0.26609039306640625, -0.2557830810546875, -0.24547576904296875, -0.23516845703125, -0.22486114501953125, -0.2145538330078125, -0.20424652099609375, -0.193939208984375, -0.18363189697265625, -0.1733245849609375, -0.16301727294921875, -0.1527099609375, -0.14240264892578125, -0.1320953369140625, -0.12178802490234375, -0.111480712890625, -0.10117340087890625, -0.0908660888671875, -0.08055877685546875, -0.07025146484375, -0.05994415283203125, -0.0496368408203125, -0.03932952880859375, -0.029022216796875, -0.01871490478515625, -0.0084075927734375, 0.00189971923828125, 0.01220703125, 0.02251434326171875, 0.0328216552734375, 0.04312896728515625, 0.053436279296875, 0.06374359130859375, 0.0740509033203125, 0.08435821533203125, 0.09466552734375, 0.10497283935546875, 0.1152801513671875, 0.12558746337890625, 0.135894775390625, 0.14620208740234375, 0.1565093994140625, 0.16681671142578125, 0.1771240234375, 0.18743133544921875, 0.1977386474609375, 0.20804595947265625, 0.218353271484375, 0.22866058349609375, 0.2389678955078125, 0.24927520751953125, 0.25958251953125, 0.26988983154296875, 0.2801971435546875, 0.29050445556640625, 0.300811767578125, 0.31111907958984375, 0.3214263916015625, 0.33173370361328125, 0.342041015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 2.0, 7.0, 5.0, 13.0, 13.0, 22.0, 27.0, 35.0, 45.0, 48.0, 72.0, 79.0, 80.0, 96.0, 86.0, 77.0, 67.0, 54.0, 48.0, 35.0, 20.0, 14.0, 15.0, 8.0, 8.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.045797348022461e-05, -2.9489398002624512e-05, -2.8520822525024414e-05, -2.7552247047424316e-05, -2.658367156982422e-05, -2.561509609222412e-05, -2.4646520614624023e-05, -2.3677945137023926e-05, -2.2709369659423828e-05, -2.174079418182373e-05, -2.0772218704223633e-05, -1.9803643226623535e-05, -1.8835067749023438e-05, -1.786649227142334e-05, -1.6897916793823242e-05, -1.5929341316223145e-05, -1.4960765838623047e-05, -1.399219036102295e-05, -1.3023614883422852e-05, -1.2055039405822754e-05, -1.1086463928222656e-05, -1.0117888450622559e-05, -9.149312973022461e-06, -8.180737495422363e-06, -7.212162017822266e-06, -6.243586540222168e-06, -5.27501106262207e-06, -4.306435585021973e-06, -3.337860107421875e-06, -2.3692846298217773e-06, -1.4007091522216797e-06, -4.3213367462158203e-07, 5.364418029785156e-07, 1.5050172805786133e-06, 2.473592758178711e-06, 3.4421682357788086e-06, 4.410743713378906e-06, 5.379319190979004e-06, 6.3478946685791016e-06, 7.316470146179199e-06, 8.285045623779297e-06, 9.253621101379395e-06, 1.0222196578979492e-05, 1.119077205657959e-05, 1.2159347534179688e-05, 1.3127923011779785e-05, 1.4096498489379883e-05, 1.506507396697998e-05, 1.6033649444580078e-05, 1.7002224922180176e-05, 1.7970800399780273e-05, 1.893937587738037e-05, 1.990795135498047e-05, 2.0876526832580566e-05, 2.1845102310180664e-05, 2.2813677787780762e-05, 2.378225326538086e-05, 2.4750828742980957e-05, 2.5719404220581055e-05, 2.6687979698181152e-05, 2.765655517578125e-05, 2.8625130653381348e-05, 2.9593706130981445e-05, 3.056228160858154e-05, 3.153085708618164e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 16.0, 15.0, 47.0, 62.0, 131.0, 308.0, 790.0, 2456.0, 12506.0, 184893.0, 768984.0, 68794.0, 6858.0, 1675.0, 530.0, 203.0, 102.0, 66.0, 35.0, 17.0, 14.0, 13.0, 1.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39794921875, -0.3860130310058594, -0.37407684326171875, -0.3621406555175781, -0.3502044677734375, -0.3382682800292969, -0.32633209228515625, -0.3143959045410156, -0.302459716796875, -0.2905235290527344, -0.27858734130859375, -0.2666511535644531, -0.2547149658203125, -0.24277877807617188, -0.23084259033203125, -0.21890640258789062, -0.20697021484375, -0.19503402709960938, -0.18309783935546875, -0.17116165161132812, -0.1592254638671875, -0.14728927612304688, -0.13535308837890625, -0.12341690063476562, -0.111480712890625, -0.09954452514648438, -0.08760833740234375, -0.07567214965820312, -0.0637359619140625, -0.051799774169921875, -0.03986358642578125, -0.027927398681640625, -0.0159912109375, -0.004055023193359375, 0.00788116455078125, 0.019817352294921875, 0.0317535400390625, 0.043689727783203125, 0.05562591552734375, 0.06756210327148438, 0.079498291015625, 0.09143447875976562, 0.10337066650390625, 0.11530685424804688, 0.1272430419921875, 0.13917922973632812, 0.15111541748046875, 0.16305160522460938, 0.17498779296875, 0.18692398071289062, 0.19886016845703125, 0.21079635620117188, 0.2227325439453125, 0.23466873168945312, 0.24660491943359375, 0.2585411071777344, 0.270477294921875, 0.2824134826660156, 0.29434967041015625, 0.3062858581542969, 0.3182220458984375, 0.3301582336425781, 0.34209442138671875, 0.3540306091308594, 0.365966796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 14.0, 9.0, 31.0, 36.0, 62.0, 79.0, 74.0, 99.0, 111.0, 110.0, 94.0, 78.0, 54.0, 48.0, 25.0, 23.0, 12.0, 6.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2990837097167969, -0.28737640380859375, -0.2756690979003906, -0.2639617919921875, -0.2522544860839844, -0.24054718017578125, -0.22883987426757812, -0.217132568359375, -0.20542526245117188, -0.19371795654296875, -0.18201065063476562, -0.1703033447265625, -0.15859603881835938, -0.14688873291015625, -0.13518142700195312, -0.12347412109375, -0.11176681518554688, -0.10005950927734375, -0.08835220336914062, -0.0766448974609375, -0.06493759155273438, -0.05323028564453125, -0.041522979736328125, -0.029815673828125, -0.018108367919921875, -0.00640106201171875, 0.005306243896484375, 0.0170135498046875, 0.028720855712890625, 0.04042816162109375, 0.052135467529296875, 0.0638427734375, 0.07555007934570312, 0.08725738525390625, 0.09896469116210938, 0.1106719970703125, 0.12237930297851562, 0.13408660888671875, 0.14579391479492188, 0.157501220703125, 0.16920852661132812, 0.18091583251953125, 0.19262313842773438, 0.2043304443359375, 0.21603775024414062, 0.22774505615234375, 0.23945236206054688, 0.25115966796875, 0.2628669738769531, 0.27457427978515625, 0.2862815856933594, 0.2979888916015625, 0.3096961975097656, 0.32140350341796875, 0.3331108093261719, 0.344818115234375, 0.3565254211425781, 0.36823272705078125, 0.3799400329589844, 0.3916473388671875, 0.4033546447753906, 0.41506195068359375, 0.4267692565917969, 0.4384765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 22.0, 39.0, 130.0, 295.0, 310.0, 143.0, 26.0, 20.0, 8.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.023377418518066, -12.66304874420166, -12.302720069885254, -11.942390441894531, -11.582061767578125, -11.221733093261719, -10.861404418945312, -10.501075744628906, -10.1407470703125, -9.780418395996094, -9.420089721679688, -9.059761047363281, -8.699431419372559, -8.339102745056152, -7.978774070739746, -7.61844539642334, -7.258115768432617, -6.897787094116211, -6.5374579429626465, -6.17712926864624, -5.816800117492676, -5.4564714431762695, -5.096142768859863, -4.735814094543457, -4.375484943389893, -4.015156269073486, -3.654827117919922, -3.2944984436035156, -2.9341695308685303, -2.573840618133545, -2.2135119438171387, -1.8531830310821533, -1.4928531646728516, -1.1325242519378662, -0.7721954584121704, -0.4118666648864746, -0.05153775215148926, 0.3087911605834961, 0.6691198348999023, 1.0294487476348877, 1.389777660369873, 1.7501065731048584, 2.1104354858398438, 2.47076416015625, 2.8310930728912354, 3.1914219856262207, 3.551750659942627, 3.9120795726776123, 4.272408485412598, 4.632737159729004, 4.993066310882568, 5.353394985198975, 5.713724136352539, 6.074052810668945, 6.434381484985352, 6.794710159301758, 7.155039310455322, 7.5153679847717285, 7.875697135925293, 8.2360258102417, 8.596354484558105, 8.956684112548828, 9.317012786865234, 9.67734146118164, 10.037670135498047]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 1.0, 12.0, 7.0, 13.0, 13.0, 14.0, 11.0, 26.0, 22.0, 16.0, 22.0, 35.0, 44.0, 48.0, 53.0, 34.0, 48.0, 58.0, 50.0, 37.0, 52.0, 56.0, 43.0, 48.0, 38.0, 34.0, 31.0, 26.0, 24.0, 22.0, 14.0, 11.0, 8.0, 9.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.490626335144043, -7.286118030548096, -7.081609725952148, -6.877100944519043, -6.672592639923096, -6.468084335327148, -6.263576030731201, -6.059067726135254, -5.854558944702148, -5.650050640106201, -5.445542335510254, -5.241033554077148, -5.036525249481201, -4.832016944885254, -4.627508640289307, -4.423000335693359, -4.218492031097412, -4.013983726501465, -3.8094751834869385, -3.604966878890991, -3.400458335876465, -3.1959500312805176, -2.9914417266845703, -2.786933422088623, -2.5824248790740967, -2.3779165744781494, -2.173408031463623, -1.9688997268676758, -1.764391303062439, -1.5598828792572021, -1.3553745746612549, -1.150866150856018, -0.9463577270507812, -0.7418493032455444, -0.5373409390449524, -0.33283257484436035, -0.12832415103912354, 0.07618427276611328, 0.28069257736206055, 0.48520100116729736, 0.6897094249725342, 0.894217848777771, 1.0987262725830078, 1.303234577178955, 1.507743000984192, 1.7122514247894287, 1.916759729385376, 2.1212682723999023, 2.3257765769958496, 2.530284881591797, 2.7347934246063232, 2.9393017292022705, 3.143810272216797, 3.348318576812744, 3.5528268814086914, 3.7573351860046387, 3.961843729019165, 4.166352272033691, 4.370860576629639, 4.575368881225586, 4.779877185821533, 4.9843854904174805, 5.188894271850586, 5.393402576446533, 5.5979108810424805]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 3.0, 4.0, 12.0, 14.0, 21.0, 40.0, 52.0, 66.0, 100.0, 139.0, 166.0, 287.0, 417.0, 659.0, 1262.0, 2390.0, 5363.0, 13473.0, 58115.0, 3958945.0, 119520.0, 19528.0, 6876.0, 3083.0, 1493.0, 812.0, 459.0, 276.0, 191.0, 139.0, 108.0, 81.0, 57.0, 29.0, 28.0, 18.0, 12.0, 10.0, 10.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4267578125, -1.3855743408203125, -1.344390869140625, -1.3032073974609375, -1.26202392578125, -1.2208404541015625, -1.179656982421875, -1.1384735107421875, -1.0972900390625, -1.0561065673828125, -1.014923095703125, -0.9737396240234375, -0.93255615234375, -0.8913726806640625, -0.850189208984375, -0.8090057373046875, -0.767822265625, -0.7266387939453125, -0.685455322265625, -0.6442718505859375, -0.60308837890625, -0.5619049072265625, -0.520721435546875, -0.4795379638671875, -0.4383544921875, -0.3971710205078125, -0.355987548828125, -0.3148040771484375, -0.27362060546875, -0.2324371337890625, -0.191253662109375, -0.1500701904296875, -0.10888671875, -0.0677032470703125, -0.026519775390625, 0.0146636962890625, 0.05584716796875, 0.0970306396484375, 0.138214111328125, 0.1793975830078125, 0.2205810546875, 0.2617645263671875, 0.302947998046875, 0.3441314697265625, 0.38531494140625, 0.4264984130859375, 0.467681884765625, 0.5088653564453125, 0.550048828125, 0.5912322998046875, 0.632415771484375, 0.6735992431640625, 0.71478271484375, 0.7559661865234375, 0.797149658203125, 0.8383331298828125, 0.8795166015625, 0.9207000732421875, 0.961883544921875, 1.0030670166015625, 1.04425048828125, 1.0854339599609375, 1.126617431640625, 1.1678009033203125, 1.208984375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 16.0, 15.0, 22.0, 21.0, 21.0, 23.0, 32.0, 40.0, 47.0, 46.0, 67.0, 43.0, 53.0, 40.0, 54.0, 54.0, 42.0, 51.0, 44.0, 39.0, 35.0, 22.0, 35.0, 24.0, 16.0, 20.0, 15.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.381591796875, -0.3698997497558594, -0.35820770263671875, -0.3465156555175781, -0.3348236083984375, -0.3231315612792969, -0.31143951416015625, -0.2997474670410156, -0.288055419921875, -0.2763633728027344, -0.26467132568359375, -0.2529792785644531, -0.2412872314453125, -0.22959518432617188, -0.21790313720703125, -0.20621109008789062, -0.19451904296875, -0.18282699584960938, -0.17113494873046875, -0.15944290161132812, -0.1477508544921875, -0.13605880737304688, -0.12436676025390625, -0.11267471313476562, -0.100982666015625, -0.08929061889648438, -0.07759857177734375, -0.06590652465820312, -0.0542144775390625, -0.042522430419921875, -0.03083038330078125, -0.019138336181640625, -0.0074462890625, 0.004245758056640625, 0.01593780517578125, 0.027629852294921875, 0.0393218994140625, 0.051013946533203125, 0.06270599365234375, 0.07439804077148438, 0.086090087890625, 0.09778213500976562, 0.10947418212890625, 0.12116622924804688, 0.1328582763671875, 0.14455032348632812, 0.15624237060546875, 0.16793441772460938, 0.17962646484375, 0.19131851196289062, 0.20301055908203125, 0.21470260620117188, 0.2263946533203125, 0.23808670043945312, 0.24977874755859375, 0.2614707946777344, 0.273162841796875, 0.2848548889160156, 0.29654693603515625, 0.3082389831542969, 0.3199310302734375, 0.3316230773925781, 0.34331512451171875, 0.3550071716308594, 0.36669921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 5.0, 7.0, 6.0, 8.0, 14.0, 20.0, 24.0, 35.0, 45.0, 47.0, 65.0, 96.0, 256.0, 873.0, 5950.0, 3979477.0, 202966.0, 3291.0, 593.0, 204.0, 79.0, 54.0, 34.0, 32.0, 31.0, 15.0, 21.0, 17.0, 8.0, 10.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.333984375, -3.238433837890625, -3.14288330078125, -3.047332763671875, -2.9517822265625, -2.856231689453125, -2.76068115234375, -2.665130615234375, -2.569580078125, -2.474029541015625, -2.37847900390625, -2.282928466796875, -2.1873779296875, -2.091827392578125, -1.99627685546875, -1.900726318359375, -1.80517578125, -1.709625244140625, -1.61407470703125, -1.518524169921875, -1.4229736328125, -1.327423095703125, -1.23187255859375, -1.136322021484375, -1.040771484375, -0.945220947265625, -0.84967041015625, -0.754119873046875, -0.6585693359375, -0.563018798828125, -0.46746826171875, -0.371917724609375, -0.2763671875, -0.180816650390625, -0.08526611328125, 0.010284423828125, 0.1058349609375, 0.201385498046875, 0.29693603515625, 0.392486572265625, 0.488037109375, 0.583587646484375, 0.67913818359375, 0.774688720703125, 0.8702392578125, 0.965789794921875, 1.06134033203125, 1.156890869140625, 1.25244140625, 1.347991943359375, 1.44354248046875, 1.539093017578125, 1.6346435546875, 1.730194091796875, 1.82574462890625, 1.921295166015625, 2.016845703125, 2.112396240234375, 2.20794677734375, 2.303497314453125, 2.3990478515625, 2.494598388671875, 2.59014892578125, 2.685699462890625, 2.78125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 7.0, 15.0, 19.0, 58.0, 177.0, 3564.0, 169.0, 44.0, 14.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.166015625, -2.1239242553710938, -2.0818328857421875, -2.0397415161132812, -1.997650146484375, -1.9555587768554688, -1.9134674072265625, -1.8713760375976562, -1.82928466796875, -1.7871932983398438, -1.7451019287109375, -1.7030105590820312, -1.660919189453125, -1.6188278198242188, -1.5767364501953125, -1.5346450805664062, -1.4925537109375, -1.4504623413085938, -1.4083709716796875, -1.3662796020507812, -1.324188232421875, -1.2820968627929688, -1.2400054931640625, -1.1979141235351562, -1.15582275390625, -1.1137313842773438, -1.0716400146484375, -1.0295486450195312, -0.987457275390625, -0.9453659057617188, -0.9032745361328125, -0.8611831665039062, -0.819091796875, -0.7770004272460938, -0.7349090576171875, -0.6928176879882812, -0.650726318359375, -0.6086349487304688, -0.5665435791015625, -0.5244522094726562, -0.48236083984375, -0.44026947021484375, -0.3981781005859375, -0.35608673095703125, -0.313995361328125, -0.27190399169921875, -0.2298126220703125, -0.18772125244140625, -0.1456298828125, -0.10353851318359375, -0.0614471435546875, -0.01935577392578125, 0.022735595703125, 0.06482696533203125, 0.1069183349609375, 0.14900970458984375, 0.19110107421875, 0.23319244384765625, 0.2752838134765625, 0.31737518310546875, 0.359466552734375, 0.40155792236328125, 0.4436492919921875, 0.48574066162109375, 0.52783203125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 12.0, 48.0, 86.0, 318.0, 412.0, 87.0, 18.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.1212921142578125, -6.984578609466553, -6.847865104675293, -6.711151123046875, -6.574437618255615, -6.4377241134643555, -6.301010608673096, -6.164297103881836, -6.027583599090576, -5.890870094299316, -5.754156589508057, -5.617443084716797, -5.480729103088379, -5.344015598297119, -5.207302093505859, -5.0705885887146, -4.93387508392334, -4.79716157913208, -4.66044807434082, -4.523734092712402, -4.387020587921143, -4.250307083129883, -4.113593578338623, -3.9768800735473633, -3.8401660919189453, -3.7034525871276855, -3.5667388439178467, -3.430025339126587, -3.293311834335327, -3.1565980911254883, -3.0198845863342285, -2.8831710815429688, -2.746457815170288, -2.6097443103790283, -2.4730305671691895, -2.3363170623779297, -2.19960355758667, -2.06289005279541, -1.9261763095855713, -1.7894628047943115, -1.6527491807937622, -1.516035556793213, -1.3793220520019531, -1.2426084280014038, -1.1058948040008545, -0.9691812992095947, -0.8324676752090454, -0.6957541108131409, -0.5590405464172363, -0.4223269820213318, -0.28561338782310486, -0.14889979362487793, -0.012186229228973389, 0.12452733516693115, 0.26124095916748047, 0.397954523563385, 0.5346680879592896, 0.6713816523551941, 0.8080952167510986, 0.944808840751648, 1.0815224647521973, 1.218235969543457, 1.3549495935440063, 1.4916632175445557, 1.6283767223358154]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 16.0, 12.0, 22.0, 25.0, 31.0, 32.0, 33.0, 38.0, 49.0, 70.0, 75.0, 59.0, 74.0, 71.0, 75.0, 57.0, 51.0, 38.0, 31.0, 41.0, 23.0, 25.0, 15.0, 15.0, 5.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2456023693084717, -2.1779773235321045, -2.1103525161743164, -2.042727470397949, -1.9751026630401611, -1.907477617263794, -1.8398526906967163, -1.7722277641296387, -1.704602837562561, -1.6369779109954834, -1.5693529844284058, -1.5017280578613281, -1.434103012084961, -1.3664782047271729, -1.2988531589508057, -1.231228232383728, -1.1636033058166504, -1.0959783792495728, -1.0283534526824951, -0.9607284665107727, -0.8931035399436951, -0.8254786133766174, -0.757853627204895, -0.6902287006378174, -0.6226037740707397, -0.5549788475036621, -0.4873538911342621, -0.41972893476486206, -0.3521040081977844, -0.2844790816307068, -0.21685412526130676, -0.14922916889190674, -0.08160400390625, -0.01397906243801117, 0.05364587903022766, 0.12127082049846649, 0.18889576196670532, 0.25652068853378296, 0.324145644903183, 0.391770601272583, 0.45939552783966064, 0.5270204544067383, 0.5946453809738159, 0.6622703671455383, 0.729895293712616, 0.7975202202796936, 0.865145206451416, 0.9327701330184937, 1.0003950595855713, 1.068019986152649, 1.1356449127197266, 1.2032698392868042, 1.2708947658538818, 1.338519811630249, 1.4061447381973267, 1.4737696647644043, 1.541394591331482, 1.6090195178985596, 1.6766444444656372, 1.7442693710327148, 1.811894416809082, 1.8795192241668701, 1.9471442699432373, 2.0147690773010254, 2.0823941230773926]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 11.0, 12.0, 12.0, 21.0, 33.0, 39.0, 60.0, 83.0, 115.0, 135.0, 236.0, 323.0, 481.0, 703.0, 1055.0, 1758.0, 2894.0, 4621.0, 7672.0, 13701.0, 24787.0, 47617.0, 100501.0, 242044.0, 319016.0, 142755.0, 63292.0, 32208.0, 17434.0, 9789.0, 5609.0, 3434.0, 2133.0, 1259.0, 886.0, 565.0, 405.0, 254.0, 173.0, 137.0, 78.0, 53.0, 49.0, 30.0, 17.0, 16.0, 16.0, 11.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.48876953125, -0.47258758544921875, -0.4564056396484375, -0.44022369384765625, -0.424041748046875, -0.40785980224609375, -0.3916778564453125, -0.37549591064453125, -0.35931396484375, -0.34313201904296875, -0.3269500732421875, -0.31076812744140625, -0.294586181640625, -0.27840423583984375, -0.2622222900390625, -0.24604034423828125, -0.2298583984375, -0.21367645263671875, -0.1974945068359375, -0.18131256103515625, -0.165130615234375, -0.14894866943359375, -0.1327667236328125, -0.11658477783203125, -0.10040283203125, -0.08422088623046875, -0.0680389404296875, -0.05185699462890625, -0.035675048828125, -0.01949310302734375, -0.0033111572265625, 0.01287078857421875, 0.029052734375, 0.04523468017578125, 0.0614166259765625, 0.07759857177734375, 0.093780517578125, 0.10996246337890625, 0.1261444091796875, 0.14232635498046875, 0.15850830078125, 0.17469024658203125, 0.1908721923828125, 0.20705413818359375, 0.223236083984375, 0.23941802978515625, 0.2555999755859375, 0.27178192138671875, 0.2879638671875, 0.30414581298828125, 0.3203277587890625, 0.33650970458984375, 0.352691650390625, 0.36887359619140625, 0.3850555419921875, 0.40123748779296875, 0.41741943359375, 0.43360137939453125, 0.4497833251953125, 0.46596527099609375, 0.482147216796875, 0.49832916259765625, 0.5145111083984375, 0.5306930541992188, 0.546875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 4.0, 10.0, 8.0, 17.0, 8.0, 24.0, 22.0, 28.0, 23.0, 26.0, 44.0, 40.0, 47.0, 45.0, 76.0, 44.0, 54.0, 58.0, 46.0, 35.0, 39.0, 45.0, 46.0, 25.0, 34.0, 28.0, 23.0, 24.0, 14.0, 17.0, 6.0, 12.0, 4.0, 7.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.413330078125, -0.40139007568359375, -0.3894500732421875, -0.37751007080078125, -0.365570068359375, -0.35363006591796875, -0.3416900634765625, -0.32975006103515625, -0.31781005859375, -0.30587005615234375, -0.2939300537109375, -0.28199005126953125, -0.270050048828125, -0.25811004638671875, -0.2461700439453125, -0.23423004150390625, -0.2222900390625, -0.21035003662109375, -0.1984100341796875, -0.18647003173828125, -0.174530029296875, -0.16259002685546875, -0.1506500244140625, -0.13871002197265625, -0.12677001953125, -0.11483001708984375, -0.1028900146484375, -0.09095001220703125, -0.079010009765625, -0.06707000732421875, -0.0551300048828125, -0.04319000244140625, -0.03125, -0.01930999755859375, -0.0073699951171875, 0.00457000732421875, 0.016510009765625, 0.02845001220703125, 0.0403900146484375, 0.05233001708984375, 0.06427001953125, 0.07621002197265625, 0.0881500244140625, 0.10009002685546875, 0.112030029296875, 0.12397003173828125, 0.1359100341796875, 0.14785003662109375, 0.1597900390625, 0.17173004150390625, 0.1836700439453125, 0.19561004638671875, 0.207550048828125, 0.21949005126953125, 0.2314300537109375, 0.24337005615234375, 0.25531005859375, 0.26725006103515625, 0.2791900634765625, 0.29113006591796875, 0.303070068359375, 0.31501007080078125, 0.3269500732421875, 0.33889007568359375, 0.350830078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 11.0, 16.0, 15.0, 26.0, 30.0, 66.0, 87.0, 95.0, 139.0, 212.0, 370.0, 675.0, 1037.0, 2129.0, 4290.0, 9602.0, 24699.0, 74834.0, 314891.0, 447135.0, 111423.0, 33342.0, 12389.0, 5162.0, 2531.0, 1306.0, 750.0, 448.0, 295.0, 156.0, 113.0, 76.0, 57.0, 38.0, 20.0, 19.0, 21.0, 12.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.796875, -0.7728347778320312, -0.7487945556640625, -0.7247543334960938, -0.700714111328125, -0.6766738891601562, -0.6526336669921875, -0.6285934448242188, -0.60455322265625, -0.5805130004882812, -0.5564727783203125, -0.5324325561523438, -0.508392333984375, -0.48435211181640625, -0.4603118896484375, -0.43627166748046875, -0.4122314453125, -0.38819122314453125, -0.3641510009765625, -0.34011077880859375, -0.316070556640625, -0.29203033447265625, -0.2679901123046875, -0.24394989013671875, -0.21990966796875, -0.19586944580078125, -0.1718292236328125, -0.14778900146484375, -0.123748779296875, -0.09970855712890625, -0.0756683349609375, -0.05162811279296875, -0.027587890625, -0.00354766845703125, 0.0204925537109375, 0.04453277587890625, 0.068572998046875, 0.09261322021484375, 0.1166534423828125, 0.14069366455078125, 0.16473388671875, 0.18877410888671875, 0.2128143310546875, 0.23685455322265625, 0.260894775390625, 0.28493499755859375, 0.3089752197265625, 0.33301544189453125, 0.3570556640625, 0.38109588623046875, 0.4051361083984375, 0.42917633056640625, 0.453216552734375, 0.47725677490234375, 0.5012969970703125, 0.5253372192382812, 0.54937744140625, 0.5734176635742188, 0.5974578857421875, 0.6214981079101562, 0.645538330078125, 0.6695785522460938, 0.6936187744140625, 0.7176589965820312, 0.74169921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 7.0, 3.0, 9.0, 7.0, 8.0, 10.0, 11.0, 12.0, 19.0, 18.0, 21.0, 21.0, 24.0, 37.0, 35.0, 31.0, 52.0, 41.0, 40.0, 41.0, 46.0, 49.0, 54.0, 49.0, 46.0, 46.0, 49.0, 37.0, 25.0, 24.0, 23.0, 16.0, 19.0, 14.0, 12.0, 10.0, 6.0, 6.0, 6.0, 5.0, 8.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.564453125, -1.51544189453125, -1.4664306640625, -1.41741943359375, -1.368408203125, -1.31939697265625, -1.2703857421875, -1.22137451171875, -1.17236328125, -1.12335205078125, -1.0743408203125, -1.02532958984375, -0.976318359375, -0.92730712890625, -0.8782958984375, -0.82928466796875, -0.7802734375, -0.73126220703125, -0.6822509765625, -0.63323974609375, -0.584228515625, -0.53521728515625, -0.4862060546875, -0.43719482421875, -0.38818359375, -0.33917236328125, -0.2901611328125, -0.24114990234375, -0.192138671875, -0.14312744140625, -0.0941162109375, -0.04510498046875, 0.00390625, 0.05291748046875, 0.1019287109375, 0.15093994140625, 0.199951171875, 0.24896240234375, 0.2979736328125, 0.34698486328125, 0.39599609375, 0.44500732421875, 0.4940185546875, 0.54302978515625, 0.592041015625, 0.64105224609375, 0.6900634765625, 0.73907470703125, 0.7880859375, 0.83709716796875, 0.8861083984375, 0.93511962890625, 0.984130859375, 1.03314208984375, 1.0821533203125, 1.13116455078125, 1.18017578125, 1.22918701171875, 1.2781982421875, 1.32720947265625, 1.376220703125, 1.42523193359375, 1.4742431640625, 1.52325439453125, 1.572265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 8.0, 19.0, 22.0, 35.0, 77.0, 115.0, 222.0, 351.0, 669.0, 1623.0, 4888.0, 27787.0, 547411.0, 435221.0, 22832.0, 4294.0, 1504.0, 658.0, 324.0, 182.0, 120.0, 53.0, 36.0, 24.0, 17.0, 12.0, 11.0, 5.0, 2.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.4919090270996094, -0.47698211669921875, -0.4620552062988281, -0.4471282958984375, -0.4322013854980469, -0.41727447509765625, -0.4023475646972656, -0.387420654296875, -0.3724937438964844, -0.35756683349609375, -0.3426399230957031, -0.3277130126953125, -0.3127861022949219, -0.29785919189453125, -0.2829322814941406, -0.26800537109375, -0.2530784606933594, -0.23815155029296875, -0.22322463989257812, -0.2082977294921875, -0.19337081909179688, -0.17844390869140625, -0.16351699829101562, -0.148590087890625, -0.13366317749023438, -0.11873626708984375, -0.10380935668945312, -0.0888824462890625, -0.07395553588867188, -0.05902862548828125, -0.044101715087890625, -0.0291748046875, -0.014247894287109375, 0.00067901611328125, 0.015605926513671875, 0.0305328369140625, 0.045459747314453125, 0.06038665771484375, 0.07531356811523438, 0.090240478515625, 0.10516738891601562, 0.12009429931640625, 0.13502120971679688, 0.1499481201171875, 0.16487503051757812, 0.17980194091796875, 0.19472885131835938, 0.20965576171875, 0.22458267211914062, 0.23950958251953125, 0.2544364929199219, 0.2693634033203125, 0.2842903137207031, 0.29921722412109375, 0.3141441345214844, 0.329071044921875, 0.3439979553222656, 0.35892486572265625, 0.3738517761230469, 0.3887786865234375, 0.4037055969238281, 0.41863250732421875, 0.4335594177246094, 0.448486328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 9.0, 17.0, 24.0, 31.0, 39.0, 56.0, 90.0, 107.0, 120.0, 125.0, 104.0, 77.0, 59.0, 35.0, 36.0, 21.0, 13.0, 9.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2498111724853516e-05, -4.097074270248413e-05, -3.9443373680114746e-05, -3.791600465774536e-05, -3.6388635635375977e-05, -3.486126661300659e-05, -3.333389759063721e-05, -3.180652856826782e-05, -3.0279159545898438e-05, -2.8751790523529053e-05, -2.7224421501159668e-05, -2.5697052478790283e-05, -2.41696834564209e-05, -2.2642314434051514e-05, -2.111494541168213e-05, -1.9587576389312744e-05, -1.806020736694336e-05, -1.6532838344573975e-05, -1.500546932220459e-05, -1.3478100299835205e-05, -1.195073127746582e-05, -1.0423362255096436e-05, -8.89599323272705e-06, -7.368624210357666e-06, -5.841255187988281e-06, -4.3138861656188965e-06, -2.7865171432495117e-06, -1.259148120880127e-06, 2.682209014892578e-07, 1.7955899238586426e-06, 3.3229589462280273e-06, 4.850327968597412e-06, 6.377696990966797e-06, 7.905066013336182e-06, 9.432435035705566e-06, 1.0959804058074951e-05, 1.2487173080444336e-05, 1.401454210281372e-05, 1.5541911125183105e-05, 1.706928014755249e-05, 1.8596649169921875e-05, 2.012401819229126e-05, 2.1651387214660645e-05, 2.317875623703003e-05, 2.4706125259399414e-05, 2.62334942817688e-05, 2.7760863304138184e-05, 2.928823232650757e-05, 3.081560134887695e-05, 3.234297037124634e-05, 3.387033939361572e-05, 3.539770841598511e-05, 3.692507743835449e-05, 3.845244646072388e-05, 3.997981548309326e-05, 4.1507184505462646e-05, 4.303455352783203e-05, 4.4561922550201416e-05, 4.60892915725708e-05, 4.7616660594940186e-05, 4.914402961730957e-05, 5.0671398639678955e-05, 5.219876766204834e-05, 5.3726136684417725e-05, 5.525350570678711e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 10.0, 12.0, 29.0, 54.0, 104.0, 200.0, 502.0, 1391.0, 7067.0, 135008.0, 854737.0, 43937.0, 3878.0, 992.0, 344.0, 130.0, 74.0, 34.0, 24.0, 11.0, 8.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.370849609375, -0.3516807556152344, -0.33251190185546875, -0.3133430480957031, -0.2941741943359375, -0.2750053405761719, -0.25583648681640625, -0.23666763305664062, -0.217498779296875, -0.19832992553710938, -0.17916107177734375, -0.15999221801757812, -0.1408233642578125, -0.12165451049804688, -0.10248565673828125, -0.08331680297851562, -0.06414794921875, -0.044979095458984375, -0.02581024169921875, -0.006641387939453125, 0.0125274658203125, 0.031696319580078125, 0.05086517333984375, 0.07003402709960938, 0.089202880859375, 0.10837173461914062, 0.12754058837890625, 0.14670944213867188, 0.1658782958984375, 0.18504714965820312, 0.20421600341796875, 0.22338485717773438, 0.2425537109375, 0.2617225646972656, 0.28089141845703125, 0.3000602722167969, 0.3192291259765625, 0.3383979797363281, 0.35756683349609375, 0.3767356872558594, 0.395904541015625, 0.4150733947753906, 0.43424224853515625, 0.4534111022949219, 0.4725799560546875, 0.4917488098144531, 0.5109176635742188, 0.5300865173339844, 0.54925537109375, 0.5684242248535156, 0.5875930786132812, 0.6067619323730469, 0.6259307861328125, 0.6450996398925781, 0.6642684936523438, 0.6834373474121094, 0.702606201171875, 0.7217750549316406, 0.7409439086914062, 0.7601127624511719, 0.7792816162109375, 0.7984504699707031, 0.8176193237304688, 0.8367881774902344, 0.85595703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 4.0, 13.0, 10.0, 12.0, 13.0, 24.0, 31.0, 49.0, 86.0, 100.0, 107.0, 126.0, 115.0, 84.0, 57.0, 48.0, 28.0, 18.0, 23.0, 16.0, 7.0, 9.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5625, -0.5460891723632812, -0.5296783447265625, -0.5132675170898438, -0.496856689453125, -0.48044586181640625, -0.4640350341796875, -0.44762420654296875, -0.43121337890625, -0.41480255126953125, -0.3983917236328125, -0.38198089599609375, -0.365570068359375, -0.34915924072265625, -0.3327484130859375, -0.31633758544921875, -0.2999267578125, -0.28351593017578125, -0.2671051025390625, -0.25069427490234375, -0.234283447265625, -0.21787261962890625, -0.2014617919921875, -0.18505096435546875, -0.16864013671875, -0.15222930908203125, -0.1358184814453125, -0.11940765380859375, -0.102996826171875, -0.08658599853515625, -0.0701751708984375, -0.05376434326171875, -0.037353515625, -0.02094268798828125, -0.0045318603515625, 0.01187896728515625, 0.028289794921875, 0.04470062255859375, 0.0611114501953125, 0.07752227783203125, 0.09393310546875, 0.11034393310546875, 0.1267547607421875, 0.14316558837890625, 0.159576416015625, 0.17598724365234375, 0.1923980712890625, 0.20880889892578125, 0.2252197265625, 0.24163055419921875, 0.2580413818359375, 0.27445220947265625, 0.290863037109375, 0.30727386474609375, 0.3236846923828125, 0.34009552001953125, 0.35650634765625, 0.37291717529296875, 0.3893280029296875, 0.40573883056640625, 0.422149658203125, 0.43856048583984375, 0.4549713134765625, 0.47138214111328125, 0.48779296875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 8.0, 4.0, 13.0, 11.0, 24.0, 37.0, 51.0, 78.0, 119.0, 170.0, 165.0, 117.0, 74.0, 56.0, 25.0, 17.0, 14.0, 8.0, 11.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.226987838745117, -7.000500202178955, -6.774013042449951, -6.547525405883789, -6.321038246154785, -6.094550609588623, -5.868062973022461, -5.641575813293457, -5.415088653564453, -5.188601016998291, -4.962113857269287, -4.735626220703125, -4.509139060974121, -4.282651424407959, -4.056163787841797, -3.829676628112793, -3.603188991546631, -3.376701593399048, -3.150214195251465, -2.9237265586853027, -2.697239398956299, -2.4707517623901367, -2.2442643642425537, -2.0177769660949707, -1.7912895679473877, -1.5648021697998047, -1.3383147716522217, -1.1118272542953491, -0.8853398561477661, -0.6588524580001831, -0.43236494064331055, -0.20587754249572754, 0.02060985565185547, 0.24709728360176086, 0.47358471155166626, 0.700072169303894, 0.926559567451477, 1.15304696559906, 1.3795344829559326, 1.6060218811035156, 1.8325092792510986, 2.0589966773986816, 2.2854840755462646, 2.5119714736938477, 2.7384591102600098, 2.9649462699890137, 3.191433906555176, 3.417921304702759, 3.644408702850342, 3.870896100997925, 4.097383499145508, 4.32387113571167, 4.550358295440674, 4.776845932006836, 5.00333309173584, 5.229820728302002, 5.456308364868164, 5.682796001434326, 5.90928316116333, 6.135770797729492, 6.362257957458496, 6.588745594024658, 6.81523323059082, 7.041720390319824, 7.268207550048828]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 6.0, 12.0, 8.0, 14.0, 11.0, 17.0, 13.0, 19.0, 20.0, 14.0, 30.0, 39.0, 28.0, 37.0, 33.0, 34.0, 35.0, 37.0, 40.0, 48.0, 34.0, 39.0, 45.0, 31.0, 42.0, 30.0, 26.0, 32.0, 30.0, 27.0, 17.0, 34.0, 21.0, 13.0, 11.0, 13.0, 7.0, 11.0, 11.0, 4.0, 5.0, 5.0, 5.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0], "bins": [-8.274454116821289, -8.036709785461426, -7.7989654541015625, -7.561221122741699, -7.323476791381836, -7.085732460021973, -6.847988128662109, -6.610243797302246, -6.372499465942383, -6.1347551345825195, -5.897010803222656, -5.659266471862793, -5.42152214050293, -5.183777809143066, -4.946033477783203, -4.70828914642334, -4.470544815063477, -4.232800483703613, -3.99505615234375, -3.7573118209838867, -3.5195674896240234, -3.28182315826416, -3.044078826904297, -2.8063344955444336, -2.5685906410217285, -2.3308463096618652, -2.093101978302002, -1.8553576469421387, -1.6176133155822754, -1.3798691034317017, -1.1421247720718384, -0.9043804407119751, -0.6666359901428223, -0.428891658782959, -0.1911473572254181, 0.0465969443321228, 0.2843412756919861, 0.5220855474472046, 0.7598298788070679, 0.9975742101669312, 1.2353185415267944, 1.4730628728866577, 1.710807204246521, 1.9485514163970947, 2.186295747756958, 2.4240400791168213, 2.6617844104766846, 2.899528741836548, 3.137273073196411, 3.3750174045562744, 3.6127617359161377, 3.850506067276001, 4.088250160217285, 4.325994491577148, 4.563738822937012, 4.801483154296875, 5.039227485656738, 5.276971817016602, 5.514716148376465, 5.752460479736328, 5.990204811096191, 6.227949142456055, 6.465693473815918, 6.703437805175781, 6.9411821365356445]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 6.0, 13.0, 18.0, 23.0, 24.0, 40.0, 45.0, 67.0, 90.0, 106.0, 170.0, 219.0, 300.0, 430.0, 580.0, 891.0, 1305.0, 2017.0, 3075.0, 5521.0, 10820.0, 27238.0, 152522.0, 3879495.0, 68644.0, 19371.0, 8403.0, 4574.0, 2762.0, 1747.0, 1149.0, 727.0, 550.0, 400.0, 265.0, 179.0, 151.0, 104.0, 81.0, 41.0, 37.0, 24.0, 11.0, 19.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.1875, -1.1538848876953125, -1.120269775390625, -1.0866546630859375, -1.05303955078125, -1.0194244384765625, -0.985809326171875, -0.9521942138671875, -0.9185791015625, -0.8849639892578125, -0.851348876953125, -0.8177337646484375, -0.78411865234375, -0.7505035400390625, -0.716888427734375, -0.6832733154296875, -0.649658203125, -0.6160430908203125, -0.582427978515625, -0.5488128662109375, -0.51519775390625, -0.4815826416015625, -0.447967529296875, -0.4143524169921875, -0.3807373046875, -0.3471221923828125, -0.313507080078125, -0.2798919677734375, -0.24627685546875, -0.2126617431640625, -0.179046630859375, -0.1454315185546875, -0.11181640625, -0.0782012939453125, -0.044586181640625, -0.0109710693359375, 0.02264404296875, 0.0562591552734375, 0.089874267578125, 0.1234893798828125, 0.1571044921875, 0.1907196044921875, 0.224334716796875, 0.2579498291015625, 0.29156494140625, 0.3251800537109375, 0.358795166015625, 0.3924102783203125, 0.426025390625, 0.4596405029296875, 0.493255615234375, 0.5268707275390625, 0.56048583984375, 0.5941009521484375, 0.627716064453125, 0.6613311767578125, 0.6949462890625, 0.7285614013671875, 0.762176513671875, 0.7957916259765625, 0.82940673828125, 0.8630218505859375, 0.896636962890625, 0.9302520751953125, 0.9638671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 11.0, 3.0, 9.0, 3.0, 10.0, 7.0, 22.0, 14.0, 22.0, 26.0, 39.0, 35.0, 30.0, 46.0, 40.0, 46.0, 41.0, 52.0, 46.0, 49.0, 56.0, 53.0, 37.0, 39.0, 33.0, 43.0, 28.0, 30.0, 13.0, 27.0, 20.0, 19.0, 15.0, 9.0, 10.0, 6.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.482666015625, -0.4683723449707031, -0.45407867431640625, -0.4397850036621094, -0.4254913330078125, -0.4111976623535156, -0.39690399169921875, -0.3826103210449219, -0.368316650390625, -0.3540229797363281, -0.33972930908203125, -0.3254356384277344, -0.3111419677734375, -0.2968482971191406, -0.28255462646484375, -0.2682609558105469, -0.25396728515625, -0.23967361450195312, -0.22537994384765625, -0.21108627319335938, -0.1967926025390625, -0.18249893188476562, -0.16820526123046875, -0.15391159057617188, -0.139617919921875, -0.12532424926757812, -0.11103057861328125, -0.09673690795898438, -0.0824432373046875, -0.06814956665039062, -0.05385589599609375, -0.039562225341796875, -0.0252685546875, -0.010974884033203125, 0.00331878662109375, 0.017612457275390625, 0.0319061279296875, 0.046199798583984375, 0.06049346923828125, 0.07478713989257812, 0.089080810546875, 0.10337448120117188, 0.11766815185546875, 0.13196182250976562, 0.1462554931640625, 0.16054916381835938, 0.17484283447265625, 0.18913650512695312, 0.20343017578125, 0.21772384643554688, 0.23201751708984375, 0.24631118774414062, 0.2606048583984375, 0.2748985290527344, 0.28919219970703125, 0.3034858703613281, 0.317779541015625, 0.3320732116699219, 0.34636688232421875, 0.3606605529785156, 0.3749542236328125, 0.3892478942871094, 0.40354156494140625, 0.4178352355957031, 0.43212890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 15.0, 13.0, 19.0, 32.0, 44.0, 51.0, 76.0, 107.0, 176.0, 235.0, 410.0, 866.0, 1919.0, 5572.0, 23683.0, 1322885.0, 2803869.0, 24455.0, 5740.0, 2047.0, 829.0, 444.0, 222.0, 162.0, 113.0, 80.0, 72.0, 46.0, 28.0, 21.0, 17.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.6574859619140625, -1.604034423828125, -1.5505828857421875, -1.49713134765625, -1.4436798095703125, -1.390228271484375, -1.3367767333984375, -1.2833251953125, -1.2298736572265625, -1.176422119140625, -1.1229705810546875, -1.06951904296875, -1.0160675048828125, -0.962615966796875, -0.9091644287109375, -0.855712890625, -0.8022613525390625, -0.748809814453125, -0.6953582763671875, -0.64190673828125, -0.5884552001953125, -0.535003662109375, -0.4815521240234375, -0.4281005859375, -0.3746490478515625, -0.321197509765625, -0.2677459716796875, -0.21429443359375, -0.1608428955078125, -0.107391357421875, -0.0539398193359375, -0.00048828125, 0.0529632568359375, 0.106414794921875, 0.1598663330078125, 0.21331787109375, 0.2667694091796875, 0.320220947265625, 0.3736724853515625, 0.4271240234375, 0.4805755615234375, 0.534027099609375, 0.5874786376953125, 0.64093017578125, 0.6943817138671875, 0.747833251953125, 0.8012847900390625, 0.854736328125, 0.9081878662109375, 0.961639404296875, 1.0150909423828125, 1.06854248046875, 1.1219940185546875, 1.175445556640625, 1.2288970947265625, 1.2823486328125, 1.3358001708984375, 1.389251708984375, 1.4427032470703125, 1.49615478515625, 1.5496063232421875, 1.603057861328125, 1.6565093994140625, 1.7099609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 8.0, 17.0, 26.0, 48.0, 121.0, 3322.0, 344.0, 77.0, 44.0, 20.0, 17.0, 4.0, 2.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.666015625, -1.6206817626953125, -1.575347900390625, -1.5300140380859375, -1.48468017578125, -1.4393463134765625, -1.394012451171875, -1.3486785888671875, -1.3033447265625, -1.2580108642578125, -1.212677001953125, -1.1673431396484375, -1.12200927734375, -1.0766754150390625, -1.031341552734375, -0.9860076904296875, -0.940673828125, -0.8953399658203125, -0.850006103515625, -0.8046722412109375, -0.75933837890625, -0.7140045166015625, -0.668670654296875, -0.6233367919921875, -0.5780029296875, -0.5326690673828125, -0.487335205078125, -0.4420013427734375, -0.39666748046875, -0.3513336181640625, -0.305999755859375, -0.2606658935546875, -0.21533203125, -0.1699981689453125, -0.124664306640625, -0.0793304443359375, -0.03399658203125, 0.0113372802734375, 0.056671142578125, 0.1020050048828125, 0.1473388671875, 0.1926727294921875, 0.238006591796875, 0.2833404541015625, 0.32867431640625, 0.3740081787109375, 0.419342041015625, 0.4646759033203125, 0.510009765625, 0.5553436279296875, 0.600677490234375, 0.6460113525390625, 0.69134521484375, 0.7366790771484375, 0.782012939453125, 0.8273468017578125, 0.8726806640625, 0.9180145263671875, 0.963348388671875, 1.0086822509765625, 1.05401611328125, 1.0993499755859375, 1.144683837890625, 1.1900177001953125, 1.2353515625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 13.0, 20.0, 74.0, 273.0, 458.0, 122.0, 22.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.31445598602295, -9.088199615478516, -8.861942291259766, -8.635685920715332, -8.409429550170898, -8.183172225952148, -7.956915855407715, -7.730659484863281, -7.5044026374816895, -7.278145790100098, -7.051889419555664, -6.825632572174072, -6.5993757247924805, -6.373119354248047, -6.146862506866455, -5.920605659484863, -5.69434928894043, -5.468092441558838, -5.241836071014404, -5.0155792236328125, -4.789322376251221, -4.563066005706787, -4.336809158325195, -4.110552787780762, -3.8842954635620117, -3.658038854598999, -3.4317820072174072, -3.2055253982543945, -2.979268789291382, -2.753012180328369, -2.5267553329467773, -2.3004987239837646, -2.074242115020752, -1.8479853868484497, -1.621728777885437, -1.3954720497131348, -1.169215440750122, -0.9429587125778198, -0.7167019844055176, -0.4904453754425049, -0.26418864727020264, -0.03793196380138397, 0.1883247196674347, 0.41458141803741455, 0.640838086605072, 0.8670947551727295, 1.0933514833450317, 1.3196080923080444, 1.5458648204803467, 1.772121548652649, 1.9983781576156616, 2.224634885787964, 2.4508914947509766, 2.6771483421325684, 2.903404951095581, 3.1296615600585938, 3.3559184074401855, 3.5821750164031982, 3.80843186378479, 4.034688472747803, 4.2609453201293945, 4.487201690673828, 4.71345853805542, 4.939715385437012, 5.165971755981445]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 7.0, 6.0, 7.0, 6.0, 19.0, 16.0, 22.0, 31.0, 29.0, 39.0, 30.0, 51.0, 54.0, 48.0, 54.0, 47.0, 58.0, 55.0, 65.0, 55.0, 49.0, 37.0, 34.0, 34.0, 25.0, 20.0, 33.0, 24.0, 11.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2443583011627197, -2.1656370162963867, -2.0869157314300537, -2.0081944465637207, -1.9294731616973877, -1.8507518768310547, -1.7720307111740112, -1.6933094263076782, -1.6145881414413452, -1.5358668565750122, -1.4571455717086792, -1.3784242868423462, -1.2997031211853027, -1.2209818363189697, -1.1422605514526367, -1.0635392665863037, -0.9848179817199707, -0.9060966968536377, -0.8273754119873047, -0.7486541867256165, -0.6699329018592834, -0.5912116169929504, -0.5124903917312622, -0.4337691068649292, -0.3550478219985962, -0.2763265371322632, -0.19760528206825256, -0.11888401210308075, -0.040162742137908936, 0.03855854272842407, 0.11727979779243469, 0.1960010528564453, 0.2747225761413574, 0.35344386100769043, 0.43216511607170105, 0.5108863711357117, 0.5896076560020447, 0.6683289408683777, 0.7470501661300659, 0.8257714509963989, 0.9044927358627319, 0.9832140207290649, 1.061935305595398, 1.140656590461731, 1.2193777561187744, 1.2980990409851074, 1.3768203258514404, 1.4555416107177734, 1.5342628955841064, 1.6129841804504395, 1.6917054653167725, 1.7704267501831055, 1.8491480350494385, 1.9278693199157715, 2.0065906047821045, 2.0853118896484375, 2.1640329360961914, 2.2427542209625244, 2.3214755058288574, 2.4001967906951904, 2.4789180755615234, 2.5576393604278564, 2.6363606452941895, 2.7150816917419434, 2.7938032150268555]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 5.0, 9.0, 6.0, 10.0, 11.0, 16.0, 32.0, 23.0, 45.0, 45.0, 78.0, 119.0, 149.0, 339.0, 603.0, 1242.0, 2933.0, 7595.0, 22492.0, 79490.0, 387568.0, 421301.0, 86172.0, 24356.0, 7964.0, 3124.0, 1297.0, 581.0, 334.0, 195.0, 112.0, 77.0, 63.0, 44.0, 29.0, 23.0, 15.0, 15.0, 9.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4794921875, -1.437255859375, -1.39501953125, -1.352783203125, -1.310546875, -1.268310546875, -1.22607421875, -1.183837890625, -1.1416015625, -1.099365234375, -1.05712890625, -1.014892578125, -0.97265625, -0.930419921875, -0.88818359375, -0.845947265625, -0.8037109375, -0.761474609375, -0.71923828125, -0.677001953125, -0.634765625, -0.592529296875, -0.55029296875, -0.508056640625, -0.4658203125, -0.423583984375, -0.38134765625, -0.339111328125, -0.296875, -0.254638671875, -0.21240234375, -0.170166015625, -0.1279296875, -0.085693359375, -0.04345703125, -0.001220703125, 0.041015625, 0.083251953125, 0.12548828125, 0.167724609375, 0.2099609375, 0.252197265625, 0.29443359375, 0.336669921875, 0.37890625, 0.421142578125, 0.46337890625, 0.505615234375, 0.5478515625, 0.590087890625, 0.63232421875, 0.674560546875, 0.716796875, 0.759033203125, 0.80126953125, 0.843505859375, 0.8857421875, 0.927978515625, 0.97021484375, 1.012451171875, 1.0546875, 1.096923828125, 1.13916015625, 1.181396484375, 1.2236328125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 3.0, 7.0, 17.0, 12.0, 12.0, 23.0, 25.0, 21.0, 25.0, 32.0, 39.0, 37.0, 60.0, 55.0, 40.0, 49.0, 41.0, 62.0, 58.0, 43.0, 32.0, 40.0, 33.0, 40.0, 27.0, 34.0, 18.0, 22.0, 22.0, 8.0, 18.0, 6.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.501953125, -0.48696136474609375, -0.4719696044921875, -0.45697784423828125, -0.441986083984375, -0.42699432373046875, -0.4120025634765625, -0.39701080322265625, -0.38201904296875, -0.36702728271484375, -0.3520355224609375, -0.33704376220703125, -0.322052001953125, -0.30706024169921875, -0.2920684814453125, -0.27707672119140625, -0.2620849609375, -0.24709320068359375, -0.2321014404296875, -0.21710968017578125, -0.202117919921875, -0.18712615966796875, -0.1721343994140625, -0.15714263916015625, -0.14215087890625, -0.12715911865234375, -0.1121673583984375, -0.09717559814453125, -0.082183837890625, -0.06719207763671875, -0.0522003173828125, -0.03720855712890625, -0.022216796875, -0.00722503662109375, 0.0077667236328125, 0.02275848388671875, 0.037750244140625, 0.05274200439453125, 0.0677337646484375, 0.08272552490234375, 0.09771728515625, 0.11270904541015625, 0.1277008056640625, 0.14269256591796875, 0.157684326171875, 0.17267608642578125, 0.1876678466796875, 0.20265960693359375, 0.2176513671875, 0.23264312744140625, 0.2476348876953125, 0.26262664794921875, 0.277618408203125, 0.29261016845703125, 0.3076019287109375, 0.32259368896484375, 0.33758544921875, 0.35257720947265625, 0.3675689697265625, 0.38256072998046875, 0.397552490234375, 0.41254425048828125, 0.4275360107421875, 0.44252777099609375, 0.45751953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 10.0, 21.0, 23.0, 33.0, 58.0, 113.0, 188.0, 381.0, 852.0, 2245.0, 7903.0, 36436.0, 359600.0, 575098.0, 50868.0, 9914.0, 2795.0, 1020.0, 467.0, 205.0, 126.0, 67.0, 43.0, 21.0, 14.0, 9.0, 10.0, 9.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.068359375, -2.01104736328125, -1.9537353515625, -1.89642333984375, -1.839111328125, -1.78179931640625, -1.7244873046875, -1.66717529296875, -1.60986328125, -1.55255126953125, -1.4952392578125, -1.43792724609375, -1.380615234375, -1.32330322265625, -1.2659912109375, -1.20867919921875, -1.1513671875, -1.09405517578125, -1.0367431640625, -0.97943115234375, -0.922119140625, -0.86480712890625, -0.8074951171875, -0.75018310546875, -0.69287109375, -0.63555908203125, -0.5782470703125, -0.52093505859375, -0.463623046875, -0.40631103515625, -0.3489990234375, -0.29168701171875, -0.234375, -0.17706298828125, -0.1197509765625, -0.06243896484375, -0.005126953125, 0.05218505859375, 0.1094970703125, 0.16680908203125, 0.22412109375, 0.28143310546875, 0.3387451171875, 0.39605712890625, 0.453369140625, 0.51068115234375, 0.5679931640625, 0.62530517578125, 0.6826171875, 0.73992919921875, 0.7972412109375, 0.85455322265625, 0.911865234375, 0.96917724609375, 1.0264892578125, 1.08380126953125, 1.14111328125, 1.19842529296875, 1.2557373046875, 1.31304931640625, 1.370361328125, 1.42767333984375, 1.4849853515625, 1.54229736328125, 1.599609375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 5.0, 11.0, 20.0, 22.0, 26.0, 33.0, 42.0, 31.0, 55.0, 44.0, 65.0, 76.0, 63.0, 63.0, 56.0, 53.0, 57.0, 53.0, 33.0, 38.0, 30.0, 23.0, 30.0, 18.0, 10.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.295440673828125, -2.21002197265625, -2.124603271484375, -2.0391845703125, -1.953765869140625, -1.86834716796875, -1.782928466796875, -1.697509765625, -1.612091064453125, -1.52667236328125, -1.441253662109375, -1.3558349609375, -1.270416259765625, -1.18499755859375, -1.099578857421875, -1.01416015625, -0.928741455078125, -0.84332275390625, -0.757904052734375, -0.6724853515625, -0.587066650390625, -0.50164794921875, -0.416229248046875, -0.330810546875, -0.245391845703125, -0.15997314453125, -0.074554443359375, 0.0108642578125, 0.096282958984375, 0.18170166015625, 0.267120361328125, 0.3525390625, 0.437957763671875, 0.52337646484375, 0.608795166015625, 0.6942138671875, 0.779632568359375, 0.86505126953125, 0.950469970703125, 1.035888671875, 1.121307373046875, 1.20672607421875, 1.292144775390625, 1.3775634765625, 1.462982177734375, 1.54840087890625, 1.633819580078125, 1.71923828125, 1.804656982421875, 1.89007568359375, 1.975494384765625, 2.0609130859375, 2.146331787109375, 2.23175048828125, 2.317169189453125, 2.402587890625, 2.488006591796875, 2.57342529296875, 2.658843994140625, 2.7442626953125, 2.829681396484375, 2.91510009765625, 3.000518798828125, 3.0859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 12.0, 17.0, 25.0, 29.0, 51.0, 83.0, 135.0, 213.0, 308.0, 524.0, 1007.0, 2116.0, 6827.0, 60052.0, 933875.0, 33935.0, 5362.0, 1859.0, 830.0, 447.0, 317.0, 189.0, 110.0, 84.0, 53.0, 30.0, 22.0, 10.0, 9.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0146484375, -0.9801483154296875, -0.945648193359375, -0.9111480712890625, -0.87664794921875, -0.8421478271484375, -0.807647705078125, -0.7731475830078125, -0.7386474609375, -0.7041473388671875, -0.669647216796875, -0.6351470947265625, -0.60064697265625, -0.5661468505859375, -0.531646728515625, -0.4971466064453125, -0.462646484375, -0.4281463623046875, -0.393646240234375, -0.3591461181640625, -0.32464599609375, -0.2901458740234375, -0.255645751953125, -0.2211456298828125, -0.1866455078125, -0.1521453857421875, -0.117645263671875, -0.0831451416015625, -0.04864501953125, -0.0141448974609375, 0.020355224609375, 0.0548553466796875, 0.08935546875, 0.1238555908203125, 0.158355712890625, 0.1928558349609375, 0.22735595703125, 0.2618560791015625, 0.296356201171875, 0.3308563232421875, 0.3653564453125, 0.3998565673828125, 0.434356689453125, 0.4688568115234375, 0.50335693359375, 0.5378570556640625, 0.572357177734375, 0.6068572998046875, 0.641357421875, 0.6758575439453125, 0.710357666015625, 0.7448577880859375, 0.77935791015625, 0.8138580322265625, 0.848358154296875, 0.8828582763671875, 0.9173583984375, 0.9518585205078125, 0.986358642578125, 1.0208587646484375, 1.05535888671875, 1.0898590087890625, 1.124359130859375, 1.1588592529296875, 1.193359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 10.0, 19.0, 27.0, 34.0, 59.0, 95.0, 132.0, 154.0, 149.0, 108.0, 83.0, 38.0, 29.0, 16.0, 13.0, 5.0, 10.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.535385131835938e-05, -8.303020149469376e-05, -8.070655167102814e-05, -7.838290184736252e-05, -7.60592520236969e-05, -7.373560220003128e-05, -7.141195237636566e-05, -6.908830255270004e-05, -6.676465272903442e-05, -6.44410029053688e-05, -6.211735308170319e-05, -5.979370325803757e-05, -5.747005343437195e-05, -5.514640361070633e-05, -5.282275378704071e-05, -5.049910396337509e-05, -4.817545413970947e-05, -4.5851804316043854e-05, -4.3528154492378235e-05, -4.1204504668712616e-05, -3.8880854845047e-05, -3.655720502138138e-05, -3.423355519771576e-05, -3.190990537405014e-05, -2.958625555038452e-05, -2.7262605726718903e-05, -2.4938955903053284e-05, -2.2615306079387665e-05, -2.0291656255722046e-05, -1.7968006432056427e-05, -1.5644356608390808e-05, -1.332070678472519e-05, -1.099705696105957e-05, -8.673407137393951e-06, -6.3497573137283325e-06, -4.026107490062714e-06, -1.7024576663970947e-06, 6.211921572685242e-07, 2.944841980934143e-06, 5.268491804599762e-06, 7.592141628265381e-06, 9.915791451931e-06, 1.2239441275596619e-05, 1.4563091099262238e-05, 1.6886740922927856e-05, 1.9210390746593475e-05, 2.1534040570259094e-05, 2.3857690393924713e-05, 2.6181340217590332e-05, 2.850499004125595e-05, 3.082863986492157e-05, 3.315228968858719e-05, 3.547593951225281e-05, 3.7799589335918427e-05, 4.0123239159584045e-05, 4.2446888983249664e-05, 4.477053880691528e-05, 4.70941886305809e-05, 4.941783845424652e-05, 5.174148827791214e-05, 5.406513810157776e-05, 5.638878792524338e-05, 5.8712437748908997e-05, 6.103608757257462e-05, 6.335973739624023e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 2.0, 9.0, 18.0, 22.0, 47.0, 80.0, 117.0, 243.0, 471.0, 932.0, 2121.0, 6706.0, 120553.0, 891031.0, 19620.0, 3641.0, 1435.0, 728.0, 339.0, 188.0, 97.0, 61.0, 24.0, 17.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.033203125, -1.000152587890625, -0.96710205078125, -0.934051513671875, -0.9010009765625, -0.867950439453125, -0.83489990234375, -0.801849365234375, -0.768798828125, -0.735748291015625, -0.70269775390625, -0.669647216796875, -0.6365966796875, -0.603546142578125, -0.57049560546875, -0.537445068359375, -0.50439453125, -0.471343994140625, -0.43829345703125, -0.405242919921875, -0.3721923828125, -0.339141845703125, -0.30609130859375, -0.273040771484375, -0.239990234375, -0.206939697265625, -0.17388916015625, -0.140838623046875, -0.1077880859375, -0.074737548828125, -0.04168701171875, -0.008636474609375, 0.0244140625, 0.057464599609375, 0.09051513671875, 0.123565673828125, 0.1566162109375, 0.189666748046875, 0.22271728515625, 0.255767822265625, 0.288818359375, 0.321868896484375, 0.35491943359375, 0.387969970703125, 0.4210205078125, 0.454071044921875, 0.48712158203125, 0.520172119140625, 0.55322265625, 0.586273193359375, 0.61932373046875, 0.652374267578125, 0.6854248046875, 0.718475341796875, 0.75152587890625, 0.784576416015625, 0.817626953125, 0.850677490234375, 0.88372802734375, 0.916778564453125, 0.9498291015625, 0.982879638671875, 1.01593017578125, 1.048980712890625, 1.08203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 3.0, 10.0, 14.0, 23.0, 49.0, 118.0, 269.0, 276.0, 131.0, 47.0, 20.0, 10.0, 11.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.244140625, -1.19232177734375, -1.1405029296875, -1.08868408203125, -1.036865234375, -0.98504638671875, -0.9332275390625, -0.88140869140625, -0.82958984375, -0.77777099609375, -0.7259521484375, -0.67413330078125, -0.622314453125, -0.57049560546875, -0.5186767578125, -0.46685791015625, -0.4150390625, -0.36322021484375, -0.3114013671875, -0.25958251953125, -0.207763671875, -0.15594482421875, -0.1041259765625, -0.05230712890625, -0.00048828125, 0.05133056640625, 0.1031494140625, 0.15496826171875, 0.206787109375, 0.25860595703125, 0.3104248046875, 0.36224365234375, 0.4140625, 0.46588134765625, 0.5177001953125, 0.56951904296875, 0.621337890625, 0.67315673828125, 0.7249755859375, 0.77679443359375, 0.82861328125, 0.88043212890625, 0.9322509765625, 0.98406982421875, 1.035888671875, 1.08770751953125, 1.1395263671875, 1.19134521484375, 1.2431640625, 1.29498291015625, 1.3468017578125, 1.39862060546875, 1.450439453125, 1.50225830078125, 1.5540771484375, 1.60589599609375, 1.65771484375, 1.70953369140625, 1.7613525390625, 1.81317138671875, 1.864990234375, 1.91680908203125, 1.9686279296875, 2.02044677734375, 2.072265625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 21.0, 22.0, 49.0, 80.0, 149.0, 211.0, 186.0, 136.0, 64.0, 28.0, 25.0, 10.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.204975128173828, -10.772348403930664, -10.3397216796875, -9.90709400177002, -9.474467277526855, -9.041840553283691, -8.609213829040527, -8.176586151123047, -7.743959426879883, -7.311332702636719, -6.8787055015563965, -6.446078777313232, -6.01345157623291, -5.580824851989746, -5.148198127746582, -4.71557092666626, -4.282944202423096, -3.8503172397613525, -3.4176902770996094, -2.9850635528564453, -2.552436351776123, -2.119809627532959, -1.6871826648712158, -1.2545557022094727, -0.8219287395477295, -0.3893018066883087, 0.04332512617111206, 0.47595202922821045, 0.9085789918899536, 1.3412058353424072, 1.7738327980041504, 2.2064597606658936, 2.6390867233276367, 3.07171368598938, 3.504340648651123, 3.936967372894287, 4.369594573974609, 4.802221298217773, 5.2348480224609375, 5.66747522354126, 6.100102424621582, 6.532729148864746, 6.965356349945068, 7.397983074188232, 7.830610275268555, 8.263236999511719, 8.695863723754883, 9.128490447998047, 9.561117172241211, 9.993743896484375, 10.426370620727539, 10.85899829864502, 11.291625022888184, 11.724251747131348, 12.156878471374512, 12.589506149291992, 13.022132873535156, 13.45475959777832, 13.887386322021484, 14.320013999938965, 14.752640724182129, 15.185267448425293, 15.617894172668457, 16.050521850585938, 16.4831485748291]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 6.0, 3.0, 11.0, 13.0, 15.0, 18.0, 24.0, 23.0, 25.0, 22.0, 27.0, 25.0, 45.0, 31.0, 57.0, 40.0, 47.0, 55.0, 48.0, 37.0, 37.0, 41.0, 33.0, 35.0, 35.0, 22.0, 34.0, 33.0, 23.0, 30.0, 16.0, 14.0, 13.0, 15.0, 11.0, 5.0, 3.0, 5.0, 1.0, 6.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.7000732421875, -11.367838859558105, -11.035604476928711, -10.703371047973633, -10.371136665344238, -10.038902282714844, -9.70666790008545, -9.374433517456055, -9.04219913482666, -8.709964752197266, -8.377730369567871, -8.045495986938477, -7.71326208114624, -7.381028175354004, -7.048793792724609, -6.716559410095215, -6.3843255043029785, -6.052091121673584, -5.719857215881348, -5.387622833251953, -5.055388450622559, -4.723154067993164, -4.390920162200928, -4.058685779571533, -3.7264516353607178, -3.3942174911499023, -3.061983108520508, -2.7297489643096924, -2.397514820098877, -2.0652804374694824, -1.733046293258667, -1.4008119106292725, -1.068577766418457, -0.736343502998352, -0.40410929918289185, -0.07187509536743164, 0.26035916805267334, 0.5925934314727783, 0.9248275756835938, 1.2570619583129883, 1.5892961025238037, 1.9215303659439087, 2.2537646293640137, 2.585998773574829, 2.9182329177856445, 3.250467300415039, 3.5827014446258545, 3.914935827255249, 4.2471699714660645, 4.579404354095459, 4.911638259887695, 5.24387264251709, 5.576107025146484, 5.908341407775879, 6.240575313568115, 6.57280969619751, 6.905043601989746, 7.237277984619141, 7.569511890411377, 7.9017462730407715, 8.233980178833008, 8.566214561462402, 8.898448944091797, 9.230683326721191, 9.562917709350586]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 0.0, 7.0, 5.0, 1.0, 4.0, 6.0, 10.0, 13.0, 11.0, 22.0, 18.0, 28.0, 35.0, 45.0, 42.0, 79.0, 86.0, 121.0, 151.0, 236.0, 309.0, 531.0, 1077.0, 5827.0, 4163606.0, 18375.0, 1661.0, 612.0, 334.0, 242.0, 205.0, 130.0, 93.0, 93.0, 50.0, 44.0, 44.0, 30.0, 21.0, 10.0, 11.0, 13.0, 15.0, 9.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.2109375, -3.10955810546875, -3.0081787109375, -2.90679931640625, -2.805419921875, -2.70404052734375, -2.6026611328125, -2.50128173828125, -2.39990234375, -2.29852294921875, -2.1971435546875, -2.09576416015625, -1.994384765625, -1.89300537109375, -1.7916259765625, -1.69024658203125, -1.5888671875, -1.48748779296875, -1.3861083984375, -1.28472900390625, -1.183349609375, -1.08197021484375, -0.9805908203125, -0.87921142578125, -0.77783203125, -0.67645263671875, -0.5750732421875, -0.47369384765625, -0.372314453125, -0.27093505859375, -0.1695556640625, -0.06817626953125, 0.033203125, 0.13458251953125, 0.2359619140625, 0.33734130859375, 0.438720703125, 0.54010009765625, 0.6414794921875, 0.74285888671875, 0.84423828125, 0.94561767578125, 1.0469970703125, 1.14837646484375, 1.249755859375, 1.35113525390625, 1.4525146484375, 1.55389404296875, 1.6552734375, 1.75665283203125, 1.8580322265625, 1.95941162109375, 2.060791015625, 2.16217041015625, 2.2635498046875, 2.36492919921875, 2.46630859375, 2.56768798828125, 2.6690673828125, 2.77044677734375, 2.871826171875, 2.97320556640625, 3.0745849609375, 3.17596435546875, 3.27734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 5.0, 10.0, 10.0, 17.0, 20.0, 18.0, 17.0, 14.0, 24.0, 30.0, 38.0, 40.0, 41.0, 45.0, 50.0, 30.0, 45.0, 39.0, 33.0, 48.0, 50.0, 32.0, 40.0, 37.0, 26.0, 28.0, 24.0, 18.0, 20.0, 27.0, 16.0, 15.0, 9.0, 14.0, 5.0, 5.0, 10.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.51220703125, -0.4963836669921875, -0.480560302734375, -0.4647369384765625, -0.44891357421875, -0.4330902099609375, -0.417266845703125, -0.4014434814453125, -0.3856201171875, -0.3697967529296875, -0.353973388671875, -0.3381500244140625, -0.32232666015625, -0.3065032958984375, -0.290679931640625, -0.2748565673828125, -0.259033203125, -0.2432098388671875, -0.227386474609375, -0.2115631103515625, -0.19573974609375, -0.1799163818359375, -0.164093017578125, -0.1482696533203125, -0.1324462890625, -0.1166229248046875, -0.100799560546875, -0.0849761962890625, -0.06915283203125, -0.0533294677734375, -0.037506103515625, -0.0216827392578125, -0.005859375, 0.0099639892578125, 0.025787353515625, 0.0416107177734375, 0.05743408203125, 0.0732574462890625, 0.089080810546875, 0.1049041748046875, 0.1207275390625, 0.1365509033203125, 0.152374267578125, 0.1681976318359375, 0.18402099609375, 0.1998443603515625, 0.215667724609375, 0.2314910888671875, 0.247314453125, 0.2631378173828125, 0.278961181640625, 0.2947845458984375, 0.31060791015625, 0.3264312744140625, 0.342254638671875, 0.3580780029296875, 0.3739013671875, 0.3897247314453125, 0.405548095703125, 0.4213714599609375, 0.43719482421875, 0.4530181884765625, 0.468841552734375, 0.4846649169921875, 0.50048828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 11.0, 19.0, 22.0, 30.0, 45.0, 54.0, 74.0, 113.0, 160.0, 222.0, 318.0, 491.0, 784.0, 1318.0, 2592.0, 7039.0, 81107.0, 4080470.0, 11716.0, 3487.0, 1595.0, 882.0, 553.0, 361.0, 252.0, 165.0, 120.0, 81.0, 64.0, 39.0, 24.0, 17.0, 12.0, 11.0, 7.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0], "bins": [-2.498046875, -2.43426513671875, -2.3704833984375, -2.30670166015625, -2.242919921875, -2.17913818359375, -2.1153564453125, -2.05157470703125, -1.98779296875, -1.92401123046875, -1.8602294921875, -1.79644775390625, -1.732666015625, -1.66888427734375, -1.6051025390625, -1.54132080078125, -1.4775390625, -1.41375732421875, -1.3499755859375, -1.28619384765625, -1.222412109375, -1.15863037109375, -1.0948486328125, -1.03106689453125, -0.96728515625, -0.90350341796875, -0.8397216796875, -0.77593994140625, -0.712158203125, -0.64837646484375, -0.5845947265625, -0.52081298828125, -0.45703125, -0.39324951171875, -0.3294677734375, -0.26568603515625, -0.201904296875, -0.13812255859375, -0.0743408203125, -0.01055908203125, 0.05322265625, 0.11700439453125, 0.1807861328125, 0.24456787109375, 0.308349609375, 0.37213134765625, 0.4359130859375, 0.49969482421875, 0.5634765625, 0.62725830078125, 0.6910400390625, 0.75482177734375, 0.818603515625, 0.88238525390625, 0.9461669921875, 1.00994873046875, 1.07373046875, 1.13751220703125, 1.2012939453125, 1.26507568359375, 1.328857421875, 1.39263916015625, 1.4564208984375, 1.52020263671875, 1.583984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 18.0, 85.0, 3879.0, 48.0, 18.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.93798828125, -0.9163551330566406, -0.8947219848632812, -0.8730888366699219, -0.8514556884765625, -0.8298225402832031, -0.8081893920898438, -0.7865562438964844, -0.764923095703125, -0.7432899475097656, -0.7216567993164062, -0.7000236511230469, -0.6783905029296875, -0.6567573547363281, -0.6351242065429688, -0.6134910583496094, -0.59185791015625, -0.5702247619628906, -0.5485916137695312, -0.5269584655761719, -0.5053253173828125, -0.4836921691894531, -0.46205902099609375, -0.4404258728027344, -0.418792724609375, -0.3971595764160156, -0.37552642822265625, -0.3538932800292969, -0.3322601318359375, -0.3106269836425781, -0.28899383544921875, -0.2673606872558594, -0.2457275390625, -0.22409439086914062, -0.20246124267578125, -0.18082809448242188, -0.1591949462890625, -0.13756179809570312, -0.11592864990234375, -0.09429550170898438, -0.072662353515625, -0.051029205322265625, -0.02939605712890625, -0.007762908935546875, 0.0138702392578125, 0.035503387451171875, 0.05713653564453125, 0.07876968383789062, 0.10040283203125, 0.12203598022460938, 0.14366912841796875, 0.16530227661132812, 0.1869354248046875, 0.20856857299804688, 0.23020172119140625, 0.2518348693847656, 0.273468017578125, 0.2951011657714844, 0.31673431396484375, 0.3383674621582031, 0.3600006103515625, 0.3816337585449219, 0.40326690673828125, 0.4249000549316406, 0.446533203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 13.0, 11.0, 25.0, 35.0, 82.0, 120.0, 196.0, 200.0, 157.0, 76.0, 49.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8249605894088745, -1.7769306898117065, -1.7289009094238281, -1.6808710098266602, -1.6328412294387817, -1.5848113298416138, -1.5367815494537354, -1.4887516498565674, -1.4407217502593994, -1.3926918506622314, -1.344662070274353, -1.296632170677185, -1.2486023902893066, -1.2005724906921387, -1.1525425910949707, -1.1045128107070923, -1.0564830303192139, -1.008453130722046, -0.9604233503341675, -0.9123934507369995, -0.8643636703491211, -0.8163337707519531, -0.7683039307594299, -0.7202740907669067, -0.6722442507743835, -0.6242144107818604, -0.5761845707893372, -0.528154730796814, -0.4801248610019684, -0.4320950210094452, -0.3840651512145996, -0.3360353112220764, -0.2880055904388428, -0.23997575044631958, -0.1919458955526352, -0.1439160406589508, -0.09588620066642761, -0.04785636067390442, 0.0001735091209411621, 0.048203349113464355, 0.09623318910598755, 0.14426302909851074, 0.19229288399219513, 0.24032273888587952, 0.2883525788784027, 0.3363824188709259, 0.3844122886657715, 0.4324421286582947, 0.48047196865081787, 0.5285018086433411, 0.5765316486358643, 0.6245615482330322, 0.6725913286209106, 0.7206212282180786, 0.7686510682106018, 0.816680908203125, 0.8647107481956482, 0.9127405881881714, 0.9607704281806946, 1.0088002681732178, 1.0568301677703857, 1.1048599481582642, 1.1528898477554321, 1.2009196281433105, 1.2489495277404785]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 4.0, 10.0, 7.0, 6.0, 14.0, 13.0, 17.0, 28.0, 21.0, 21.0, 26.0, 42.0, 38.0, 38.0, 35.0, 50.0, 54.0, 50.0, 48.0, 33.0, 42.0, 37.0, 41.0, 35.0, 38.0, 35.0, 21.0, 21.0, 23.0, 21.0, 22.0, 18.0, 17.0, 15.0, 13.0, 11.0, 8.0, 6.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.0060992240905762, -0.9769303202629089, -0.9477614164352417, -0.9185925126075745, -0.8894236087799072, -0.86025470495224, -0.8310858011245728, -0.8019168972969055, -0.7727479934692383, -0.743579089641571, -0.7144101858139038, -0.6852412819862366, -0.6560723781585693, -0.6269034743309021, -0.5977345705032349, -0.5685656666755676, -0.5393967628479004, -0.5102278590202332, -0.4810589551925659, -0.4518900513648987, -0.42272114753723145, -0.3935522437095642, -0.364383339881897, -0.33521443605422974, -0.3060455322265625, -0.27687662839889526, -0.24770772457122803, -0.2185388207435608, -0.18936991691589355, -0.16020101308822632, -0.13103210926055908, -0.10186320543289185, -0.07269430160522461, -0.04352539777755737, -0.014356493949890137, 0.0148124098777771, 0.043981313705444336, 0.07315021753311157, 0.10231912136077881, 0.13148802518844604, 0.16065692901611328, 0.18982583284378052, 0.21899473667144775, 0.248163640499115, 0.2773325443267822, 0.30650144815444946, 0.3356703519821167, 0.36483925580978394, 0.39400815963745117, 0.4231770634651184, 0.45234596729278564, 0.4815148711204529, 0.5106837749481201, 0.5398526787757874, 0.5690215826034546, 0.5981904864311218, 0.6273593902587891, 0.6565282940864563, 0.6856971979141235, 0.7148661017417908, 0.744035005569458, 0.7732039093971252, 0.8023728132247925, 0.8315417170524597, 0.860710620880127]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 7.0, 6.0, 9.0, 8.0, 5.0, 10.0, 14.0, 27.0, 38.0, 47.0, 70.0, 100.0, 145.0, 208.0, 369.0, 591.0, 1022.0, 1911.0, 3228.0, 5800.0, 10686.0, 20892.0, 43636.0, 100097.0, 255849.0, 336124.0, 147975.0, 60529.0, 27766.0, 14063.0, 7506.0, 4199.0, 2248.0, 1351.0, 709.0, 466.0, 282.0, 184.0, 108.0, 72.0, 51.0, 38.0, 29.0, 21.0, 19.0, 13.0, 7.0, 4.0, 7.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0], "bins": [-0.873046875, -0.8467559814453125, -0.820465087890625, -0.7941741943359375, -0.76788330078125, -0.7415924072265625, -0.715301513671875, -0.6890106201171875, -0.6627197265625, -0.6364288330078125, -0.610137939453125, -0.5838470458984375, -0.55755615234375, -0.5312652587890625, -0.504974365234375, -0.4786834716796875, -0.452392578125, -0.4261016845703125, -0.399810791015625, -0.3735198974609375, -0.34722900390625, -0.3209381103515625, -0.294647216796875, -0.2683563232421875, -0.2420654296875, -0.2157745361328125, -0.189483642578125, -0.1631927490234375, -0.13690185546875, -0.1106109619140625, -0.084320068359375, -0.0580291748046875, -0.03173828125, -0.0054473876953125, 0.020843505859375, 0.0471343994140625, 0.07342529296875, 0.0997161865234375, 0.126007080078125, 0.1522979736328125, 0.1785888671875, 0.2048797607421875, 0.231170654296875, 0.2574615478515625, 0.28375244140625, 0.3100433349609375, 0.336334228515625, 0.3626251220703125, 0.388916015625, 0.4152069091796875, 0.441497802734375, 0.4677886962890625, 0.49407958984375, 0.5203704833984375, 0.546661376953125, 0.5729522705078125, 0.5992431640625, 0.6255340576171875, 0.651824951171875, 0.6781158447265625, 0.70440673828125, 0.7306976318359375, 0.756988525390625, 0.7832794189453125, 0.8095703125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 2.0, 5.0, 6.0, 2.0, 9.0, 7.0, 10.0, 16.0, 14.0, 17.0, 18.0, 24.0, 15.0, 21.0, 27.0, 35.0, 34.0, 37.0, 34.0, 29.0, 59.0, 33.0, 36.0, 38.0, 40.0, 43.0, 37.0, 27.0, 46.0, 29.0, 32.0, 36.0, 29.0, 20.0, 14.0, 16.0, 10.0, 12.0, 12.0, 9.0, 14.0, 7.0, 11.0, 4.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.5419921875, -0.5255279541015625, -0.509063720703125, -0.4925994873046875, -0.47613525390625, -0.4596710205078125, -0.443206787109375, -0.4267425537109375, -0.4102783203125, -0.3938140869140625, -0.377349853515625, -0.3608856201171875, -0.34442138671875, -0.3279571533203125, -0.311492919921875, -0.2950286865234375, -0.278564453125, -0.2621002197265625, -0.245635986328125, -0.2291717529296875, -0.21270751953125, -0.1962432861328125, -0.179779052734375, -0.1633148193359375, -0.1468505859375, -0.1303863525390625, -0.113922119140625, -0.0974578857421875, -0.08099365234375, -0.0645294189453125, -0.048065185546875, -0.0316009521484375, -0.01513671875, 0.0013275146484375, 0.017791748046875, 0.0342559814453125, 0.05072021484375, 0.0671844482421875, 0.083648681640625, 0.1001129150390625, 0.1165771484375, 0.1330413818359375, 0.149505615234375, 0.1659698486328125, 0.18243408203125, 0.1988983154296875, 0.215362548828125, 0.2318267822265625, 0.248291015625, 0.2647552490234375, 0.281219482421875, 0.2976837158203125, 0.31414794921875, 0.3306121826171875, 0.347076416015625, 0.3635406494140625, 0.3800048828125, 0.3964691162109375, 0.412933349609375, 0.4293975830078125, 0.44586181640625, 0.4623260498046875, 0.478790283203125, 0.4952545166015625, 0.51171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 8.0, 12.0, 15.0, 16.0, 26.0, 38.0, 35.0, 52.0, 75.0, 126.0, 199.0, 273.0, 519.0, 1113.0, 2790.0, 7851.0, 25182.0, 111889.0, 596270.0, 237550.0, 44278.0, 12567.0, 4206.0, 1687.0, 700.0, 362.0, 201.0, 138.0, 102.0, 61.0, 45.0, 33.0, 22.0, 18.0, 22.0, 12.0, 18.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.4482421875, -1.3994903564453125, -1.350738525390625, -1.3019866943359375, -1.25323486328125, -1.2044830322265625, -1.155731201171875, -1.1069793701171875, -1.0582275390625, -1.0094757080078125, -0.960723876953125, -0.9119720458984375, -0.86322021484375, -0.8144683837890625, -0.765716552734375, -0.7169647216796875, -0.668212890625, -0.6194610595703125, -0.570709228515625, -0.5219573974609375, -0.47320556640625, -0.4244537353515625, -0.375701904296875, -0.3269500732421875, -0.2781982421875, -0.2294464111328125, -0.180694580078125, -0.1319427490234375, -0.08319091796875, -0.0344390869140625, 0.014312744140625, 0.0630645751953125, 0.11181640625, 0.1605682373046875, 0.209320068359375, 0.2580718994140625, 0.30682373046875, 0.3555755615234375, 0.404327392578125, 0.4530792236328125, 0.5018310546875, 0.5505828857421875, 0.599334716796875, 0.6480865478515625, 0.69683837890625, 0.7455902099609375, 0.794342041015625, 0.8430938720703125, 0.891845703125, 0.9405975341796875, 0.989349365234375, 1.0381011962890625, 1.08685302734375, 1.1356048583984375, 1.184356689453125, 1.2331085205078125, 1.2818603515625, 1.3306121826171875, 1.379364013671875, 1.4281158447265625, 1.47686767578125, 1.5256195068359375, 1.574371337890625, 1.6231231689453125, 1.671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 7.0, 14.0, 10.0, 15.0, 26.0, 25.0, 34.0, 32.0, 28.0, 35.0, 40.0, 58.0, 50.0, 33.0, 62.0, 53.0, 65.0, 45.0, 47.0, 53.0, 49.0, 29.0, 30.0, 28.0, 21.0, 16.0, 12.0, 15.0, 6.0, 11.0, 14.0, 6.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.256256103515625, -3.14727783203125, -3.038299560546875, -2.9293212890625, -2.820343017578125, -2.71136474609375, -2.602386474609375, -2.493408203125, -2.384429931640625, -2.27545166015625, -2.166473388671875, -2.0574951171875, -1.948516845703125, -1.83953857421875, -1.730560302734375, -1.62158203125, -1.512603759765625, -1.40362548828125, -1.294647216796875, -1.1856689453125, -1.076690673828125, -0.96771240234375, -0.858734130859375, -0.749755859375, -0.640777587890625, -0.53179931640625, -0.422821044921875, -0.3138427734375, -0.204864501953125, -0.09588623046875, 0.013092041015625, 0.1220703125, 0.231048583984375, 0.34002685546875, 0.449005126953125, 0.5579833984375, 0.666961669921875, 0.77593994140625, 0.884918212890625, 0.993896484375, 1.102874755859375, 1.21185302734375, 1.320831298828125, 1.4298095703125, 1.538787841796875, 1.64776611328125, 1.756744384765625, 1.86572265625, 1.974700927734375, 2.08367919921875, 2.192657470703125, 2.3016357421875, 2.410614013671875, 2.51959228515625, 2.628570556640625, 2.737548828125, 2.846527099609375, 2.95550537109375, 3.064483642578125, 3.1734619140625, 3.282440185546875, 3.39141845703125, 3.500396728515625, 3.609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 12.0, 8.0, 6.0, 19.0, 21.0, 34.0, 51.0, 58.0, 86.0, 149.0, 256.0, 491.0, 1134.0, 2795.0, 8979.0, 45837.0, 617835.0, 331318.0, 28785.0, 6503.0, 2174.0, 973.0, 414.0, 204.0, 123.0, 87.0, 52.0, 45.0, 31.0, 21.0, 13.0, 14.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.7060546875, -0.6831893920898438, -0.6603240966796875, -0.6374588012695312, -0.614593505859375, -0.5917282104492188, -0.5688629150390625, -0.5459976196289062, -0.52313232421875, -0.5002670288085938, -0.4774017333984375, -0.45453643798828125, -0.431671142578125, -0.40880584716796875, -0.3859405517578125, -0.36307525634765625, -0.3402099609375, -0.31734466552734375, -0.2944793701171875, -0.27161407470703125, -0.248748779296875, -0.22588348388671875, -0.2030181884765625, -0.18015289306640625, -0.15728759765625, -0.13442230224609375, -0.1115570068359375, -0.08869171142578125, -0.065826416015625, -0.04296112060546875, -0.0200958251953125, 0.00276947021484375, 0.025634765625, 0.04850006103515625, 0.0713653564453125, 0.09423065185546875, 0.117095947265625, 0.13996124267578125, 0.1628265380859375, 0.18569183349609375, 0.20855712890625, 0.23142242431640625, 0.2542877197265625, 0.27715301513671875, 0.300018310546875, 0.32288360595703125, 0.3457489013671875, 0.36861419677734375, 0.3914794921875, 0.41434478759765625, 0.4372100830078125, 0.46007537841796875, 0.482940673828125, 0.5058059692382812, 0.5286712646484375, 0.5515365600585938, 0.57440185546875, 0.5972671508789062, 0.6201324462890625, 0.6429977416992188, 0.665863037109375, 0.6887283325195312, 0.7115936279296875, 0.7344589233398438, 0.75732421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 8.0, 19.0, 21.0, 30.0, 47.0, 48.0, 72.0, 74.0, 82.0, 87.0, 89.0, 80.0, 79.0, 72.0, 48.0, 38.0, 25.0, 16.0, 18.0, 5.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.988908767700195e-05, -4.7958455979824066e-05, -4.602782428264618e-05, -4.409719258546829e-05, -4.2166560888290405e-05, -4.023592919111252e-05, -3.830529749393463e-05, -3.6374665796756744e-05, -3.444403409957886e-05, -3.251340240240097e-05, -3.0582770705223083e-05, -2.8652139008045197e-05, -2.672150731086731e-05, -2.4790875613689423e-05, -2.2860243916511536e-05, -2.092961221933365e-05, -1.8998980522155762e-05, -1.7068348824977875e-05, -1.5137717127799988e-05, -1.32070854306221e-05, -1.1276453733444214e-05, -9.345822036266327e-06, -7.41519033908844e-06, -5.484558641910553e-06, -3.553926944732666e-06, -1.623295247554779e-06, 3.073364496231079e-07, 2.237968146800995e-06, 4.168599843978882e-06, 6.099231541156769e-06, 8.029863238334656e-06, 9.960494935512543e-06, 1.189112663269043e-05, 1.3821758329868317e-05, 1.5752390027046204e-05, 1.768302172422409e-05, 1.9613653421401978e-05, 2.1544285118579865e-05, 2.347491681575775e-05, 2.540554851293564e-05, 2.7336180210113525e-05, 2.9266811907291412e-05, 3.11974436044693e-05, 3.3128075301647186e-05, 3.505870699882507e-05, 3.698933869600296e-05, 3.891997039318085e-05, 4.0850602090358734e-05, 4.278123378753662e-05, 4.471186548471451e-05, 4.6642497181892395e-05, 4.857312887907028e-05, 5.050376057624817e-05, 5.2434392273426056e-05, 5.436502397060394e-05, 5.629565566778183e-05, 5.822628736495972e-05, 6.0156919062137604e-05, 6.208755075931549e-05, 6.401818245649338e-05, 6.594881415367126e-05, 6.787944585084915e-05, 6.981007754802704e-05, 7.174070924520493e-05, 7.367134094238281e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 5.0, 10.0, 20.0, 25.0, 27.0, 43.0, 45.0, 77.0, 137.0, 255.0, 398.0, 781.0, 1853.0, 5420.0, 22236.0, 175029.0, 704256.0, 113414.0, 16837.0, 4345.0, 1591.0, 725.0, 391.0, 232.0, 123.0, 67.0, 48.0, 40.0, 25.0, 17.0, 16.0, 14.0, 5.0, 4.0, 4.0, 6.0, 3.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.61328125, -0.5949249267578125, -0.576568603515625, -0.5582122802734375, -0.53985595703125, -0.5214996337890625, -0.503143310546875, -0.4847869873046875, -0.4664306640625, -0.4480743408203125, -0.429718017578125, -0.4113616943359375, -0.39300537109375, -0.3746490478515625, -0.356292724609375, -0.3379364013671875, -0.319580078125, -0.3012237548828125, -0.282867431640625, -0.2645111083984375, -0.24615478515625, -0.2277984619140625, -0.209442138671875, -0.1910858154296875, -0.1727294921875, -0.1543731689453125, -0.136016845703125, -0.1176605224609375, -0.09930419921875, -0.0809478759765625, -0.062591552734375, -0.0442352294921875, -0.02587890625, -0.0075225830078125, 0.010833740234375, 0.0291900634765625, 0.04754638671875, 0.0659027099609375, 0.084259033203125, 0.1026153564453125, 0.1209716796875, 0.1393280029296875, 0.157684326171875, 0.1760406494140625, 0.19439697265625, 0.2127532958984375, 0.231109619140625, 0.2494659423828125, 0.267822265625, 0.2861785888671875, 0.304534912109375, 0.3228912353515625, 0.34124755859375, 0.3596038818359375, 0.377960205078125, 0.3963165283203125, 0.4146728515625, 0.4330291748046875, 0.451385498046875, 0.4697418212890625, 0.48809814453125, 0.5064544677734375, 0.524810791015625, 0.5431671142578125, 0.5615234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 12.0, 5.0, 15.0, 23.0, 33.0, 35.0, 55.0, 93.0, 108.0, 150.0, 142.0, 94.0, 85.0, 51.0, 36.0, 19.0, 14.0, 5.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0908203125, -1.0482940673828125, -1.005767822265625, -0.9632415771484375, -0.92071533203125, -0.8781890869140625, -0.835662841796875, -0.7931365966796875, -0.7506103515625, -0.7080841064453125, -0.665557861328125, -0.6230316162109375, -0.58050537109375, -0.5379791259765625, -0.495452880859375, -0.4529266357421875, -0.410400390625, -0.3678741455078125, -0.325347900390625, -0.2828216552734375, -0.24029541015625, -0.1977691650390625, -0.155242919921875, -0.1127166748046875, -0.0701904296875, -0.0276641845703125, 0.014862060546875, 0.0573883056640625, 0.09991455078125, 0.1424407958984375, 0.184967041015625, 0.2274932861328125, 0.27001953125, 0.3125457763671875, 0.355072021484375, 0.3975982666015625, 0.44012451171875, 0.4826507568359375, 0.525177001953125, 0.5677032470703125, 0.6102294921875, 0.6527557373046875, 0.695281982421875, 0.7378082275390625, 0.78033447265625, 0.8228607177734375, 0.865386962890625, 0.9079132080078125, 0.950439453125, 0.9929656982421875, 1.035491943359375, 1.0780181884765625, 1.12054443359375, 1.1630706787109375, 1.205596923828125, 1.2481231689453125, 1.2906494140625, 1.3331756591796875, 1.375701904296875, 1.4182281494140625, 1.46075439453125, 1.5032806396484375, 1.545806884765625, 1.5883331298828125, 1.630859375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 24.0, 61.0, 227.0, 442.0, 179.0, 55.0, 17.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.00821590423584, -9.953398704528809, -8.898582458496094, -7.8437652587890625, -6.7889485359191895, -5.734131813049316, -4.679314613342285, -3.624497890472412, -2.569681167602539, -1.5148643255233765, -0.46004748344421387, 0.5947694778442383, 1.6495862007141113, 2.7044029235839844, 3.7592201232910156, 4.814036846160889, 5.868853569030762, 6.923670291900635, 7.978487014770508, 9.033304214477539, 10.08812141418457, 11.142937660217285, 12.197754859924316, 13.252571105957031, 14.307388305664062, 15.362205505371094, 16.417022705078125, 17.471839904785156, 18.526655197143555, 19.581472396850586, 20.636289596557617, 21.69110679626465, 22.745922088623047, 23.800739288330078, 24.85555648803711, 25.91037368774414, 26.96518898010254, 28.02000617980957, 29.0748233795166, 30.129640579223633, 31.18445587158203, 32.23927307128906, 33.294090270996094, 34.348907470703125, 35.403724670410156, 36.45854187011719, 37.51335906982422, 38.568172454833984, 39.62299346923828, 40.67781066894531, 41.732627868652344, 42.787445068359375, 43.842262268066406, 44.89707946777344, 45.95189666748047, 47.006710052490234, 48.061527252197266, 49.1163444519043, 50.17116165161133, 51.22597885131836, 52.28079605102539, 53.335609436035156, 54.39042663574219, 55.44524383544922, 56.50006103515625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 7.0, 12.0, 9.0, 11.0, 7.0, 19.0, 14.0, 20.0, 21.0, 33.0, 33.0, 25.0, 28.0, 44.0, 53.0, 55.0, 48.0, 53.0, 54.0, 41.0, 53.0, 44.0, 41.0, 41.0, 32.0, 26.0, 23.0, 21.0, 16.0, 15.0, 18.0, 6.0, 18.0, 12.0, 9.0, 5.0, 4.0, 9.0, 4.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.341935157775879, -14.843670845031738, -14.345407485961914, -13.847143173217773, -13.348878860473633, -12.850615501403809, -12.352351188659668, -11.854087829589844, -11.355823516845703, -10.857559204101562, -10.359295845031738, -9.861031532287598, -9.362768173217773, -8.864503860473633, -8.366239547729492, -7.86797571182251, -7.369711875915527, -6.871448040008545, -6.3731842041015625, -5.874919891357422, -5.3766560554504395, -4.878392219543457, -4.380127906799316, -3.881864070892334, -3.3836002349853516, -2.885336399078369, -2.3870723247528076, -1.8888083696365356, -1.3905444145202637, -0.8922805786132812, -0.3940165042877197, 0.1042475700378418, 0.6025123596191406, 1.1007763147354126, 1.5990402698516846, 2.097304344177246, 2.5955681800842285, 3.093832015991211, 3.5920960903167725, 4.090360164642334, 4.588624000549316, 5.086887836456299, 5.585151672363281, 6.083415985107422, 6.581679821014404, 7.079943656921387, 7.578207969665527, 8.076471328735352, 8.574735641479492, 9.072999954223633, 9.571263313293457, 10.069527626037598, 10.567790985107422, 11.066055297851562, 11.564319610595703, 12.062583923339844, 12.560847282409668, 13.059111595153809, 13.557374954223633, 14.055639266967773, 14.553903579711914, 15.052166938781738, 15.550431251525879, 16.048694610595703, 16.546958923339844]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 6.0, 8.0, 9.0, 9.0, 18.0, 16.0, 22.0, 20.0, 34.0, 57.0, 77.0, 111.0, 191.0, 437.0, 805.0, 1952.0, 7525.0, 4065087.0, 109302.0, 5285.0, 1611.0, 774.0, 331.0, 206.0, 132.0, 75.0, 43.0, 28.0, 20.0, 18.0, 9.0, 13.0, 4.0, 4.0, 11.0, 7.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.974609375, -1.9127044677734375, -1.850799560546875, -1.7888946533203125, -1.72698974609375, -1.6650848388671875, -1.603179931640625, -1.5412750244140625, -1.4793701171875, -1.4174652099609375, -1.355560302734375, -1.2936553955078125, -1.23175048828125, -1.1698455810546875, -1.107940673828125, -1.0460357666015625, -0.984130859375, -0.9222259521484375, -0.860321044921875, -0.7984161376953125, -0.73651123046875, -0.6746063232421875, -0.612701416015625, -0.5507965087890625, -0.4888916015625, -0.4269866943359375, -0.365081787109375, -0.3031768798828125, -0.24127197265625, -0.1793670654296875, -0.117462158203125, -0.0555572509765625, 0.00634765625, 0.0682525634765625, 0.130157470703125, 0.1920623779296875, 0.25396728515625, 0.3158721923828125, 0.377777099609375, 0.4396820068359375, 0.5015869140625, 0.5634918212890625, 0.625396728515625, 0.6873016357421875, 0.74920654296875, 0.8111114501953125, 0.873016357421875, 0.9349212646484375, 0.996826171875, 1.0587310791015625, 1.120635986328125, 1.1825408935546875, 1.24444580078125, 1.3063507080078125, 1.368255615234375, 1.4301605224609375, 1.4920654296875, 1.5539703369140625, 1.615875244140625, 1.6777801513671875, 1.73968505859375, 1.8015899658203125, 1.863494873046875, 1.9253997802734375, 1.9873046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 2.0, 11.0, 12.0, 8.0, 12.0, 20.0, 22.0, 26.0, 25.0, 24.0, 28.0, 25.0, 31.0, 50.0, 51.0, 55.0, 58.0, 50.0, 44.0, 52.0, 43.0, 45.0, 38.0, 44.0, 31.0, 27.0, 29.0, 21.0, 17.0, 15.0, 9.0, 14.0, 5.0, 7.0, 11.0, 6.0, 5.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.80615234375, -0.7815933227539062, -0.7570343017578125, -0.7324752807617188, -0.707916259765625, -0.6833572387695312, -0.6587982177734375, -0.6342391967773438, -0.60968017578125, -0.5851211547851562, -0.5605621337890625, -0.5360031127929688, -0.511444091796875, -0.48688507080078125, -0.4623260498046875, -0.43776702880859375, -0.4132080078125, -0.38864898681640625, -0.3640899658203125, -0.33953094482421875, -0.314971923828125, -0.29041290283203125, -0.2658538818359375, -0.24129486083984375, -0.21673583984375, -0.19217681884765625, -0.1676177978515625, -0.14305877685546875, -0.118499755859375, -0.09394073486328125, -0.0693817138671875, -0.04482269287109375, -0.020263671875, 0.00429534912109375, 0.0288543701171875, 0.05341339111328125, 0.077972412109375, 0.10253143310546875, 0.1270904541015625, 0.15164947509765625, 0.17620849609375, 0.20076751708984375, 0.2253265380859375, 0.24988555908203125, 0.274444580078125, 0.29900360107421875, 0.3235626220703125, 0.34812164306640625, 0.3726806640625, 0.39723968505859375, 0.4217987060546875, 0.44635772705078125, 0.470916748046875, 0.49547576904296875, 0.5200347900390625, 0.5445938110351562, 0.56915283203125, 0.5937118530273438, 0.6182708740234375, 0.6428298950195312, 0.667388916015625, 0.6919479370117188, 0.7165069580078125, 0.7410659790039062, 0.765625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 7.0, 15.0, 17.0, 24.0, 25.0, 40.0, 49.0, 90.0, 119.0, 172.0, 294.0, 531.0, 1036.0, 2406.0, 9364.0, 396740.0, 3768168.0, 10187.0, 2533.0, 1017.0, 510.0, 306.0, 184.0, 133.0, 80.0, 56.0, 37.0, 31.0, 22.0, 25.0, 14.0, 12.0, 5.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904296875, -1.83868408203125, -1.7730712890625, -1.70745849609375, -1.641845703125, -1.57623291015625, -1.5106201171875, -1.44500732421875, -1.37939453125, -1.31378173828125, -1.2481689453125, -1.18255615234375, -1.116943359375, -1.05133056640625, -0.9857177734375, -0.92010498046875, -0.8544921875, -0.78887939453125, -0.7232666015625, -0.65765380859375, -0.592041015625, -0.52642822265625, -0.4608154296875, -0.39520263671875, -0.32958984375, -0.26397705078125, -0.1983642578125, -0.13275146484375, -0.067138671875, -0.00152587890625, 0.0640869140625, 0.12969970703125, 0.1953125, 0.26092529296875, 0.3265380859375, 0.39215087890625, 0.457763671875, 0.52337646484375, 0.5889892578125, 0.65460205078125, 0.72021484375, 0.78582763671875, 0.8514404296875, 0.91705322265625, 0.982666015625, 1.04827880859375, 1.1138916015625, 1.17950439453125, 1.2451171875, 1.31072998046875, 1.3763427734375, 1.44195556640625, 1.507568359375, 1.57318115234375, 1.6387939453125, 1.70440673828125, 1.77001953125, 1.83563232421875, 1.9012451171875, 1.96685791015625, 2.032470703125, 2.09808349609375, 2.1636962890625, 2.22930908203125, 2.294921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 11.0, 49.0, 3513.0, 429.0, 41.0, 16.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.107421875, -1.0803680419921875, -1.053314208984375, -1.0262603759765625, -0.99920654296875, -0.9721527099609375, -0.945098876953125, -0.9180450439453125, -0.8909912109375, -0.8639373779296875, -0.836883544921875, -0.8098297119140625, -0.78277587890625, -0.7557220458984375, -0.728668212890625, -0.7016143798828125, -0.674560546875, -0.6475067138671875, -0.620452880859375, -0.5933990478515625, -0.56634521484375, -0.5392913818359375, -0.512237548828125, -0.4851837158203125, -0.4581298828125, -0.4310760498046875, -0.404022216796875, -0.3769683837890625, -0.34991455078125, -0.3228607177734375, -0.295806884765625, -0.2687530517578125, -0.24169921875, -0.2146453857421875, -0.187591552734375, -0.1605377197265625, -0.13348388671875, -0.1064300537109375, -0.079376220703125, -0.0523223876953125, -0.0252685546875, 0.0017852783203125, 0.028839111328125, 0.0558929443359375, 0.08294677734375, 0.1100006103515625, 0.137054443359375, 0.1641082763671875, 0.191162109375, 0.2182159423828125, 0.245269775390625, 0.2723236083984375, 0.29937744140625, 0.3264312744140625, 0.353485107421875, 0.3805389404296875, 0.4075927734375, 0.4346466064453125, 0.461700439453125, 0.4887542724609375, 0.51580810546875, 0.5428619384765625, 0.569915771484375, 0.5969696044921875, 0.6240234375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 14.0, 30.0, 143.0, 342.0, 311.0, 112.0, 36.0, 19.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.820366859436035, -2.7097201347351074, -2.5990734100341797, -2.488426923751831, -2.3777801990509033, -2.2671334743499756, -2.156486988067627, -2.045840263366699, -1.9351935386657715, -1.8245468139648438, -1.7139002084732056, -1.6032536029815674, -1.4926068782806396, -1.381960153579712, -1.2713135480880737, -1.1606669425964355, -1.0500202178955078, -0.9393735527992249, -0.8287268877029419, -0.7180802226066589, -0.607433557510376, -0.496786892414093, -0.38614022731781006, -0.2754935622215271, -0.16484689712524414, -0.05420023202896118, 0.05644643306732178, 0.16709309816360474, 0.2777397632598877, 0.38838642835617065, 0.4990330934524536, 0.6096797585487366, 0.7203264236450195, 0.8309730887413025, 0.9416197538375854, 1.0522663593292236, 1.1629130840301514, 1.273559808731079, 1.3842064142227173, 1.4948530197143555, 1.6054997444152832, 1.716146469116211, 1.8267930746078491, 1.9374396800994873, 2.048086404800415, 2.1587331295013428, 2.2693796157836914, 2.380026340484619, 2.490673065185547, 2.6013197898864746, 2.7119665145874023, 2.822613000869751, 2.9332597255706787, 3.0439064502716064, 3.154552936553955, 3.265199661254883, 3.3758463859558105, 3.4864931106567383, 3.597139835357666, 3.7077863216400146, 3.8184330463409424, 3.92907977104187, 4.039726257324219, 4.1503729820251465, 4.261019706726074]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 7.0, 9.0, 8.0, 13.0, 15.0, 21.0, 16.0, 23.0, 28.0, 23.0, 27.0, 32.0, 36.0, 29.0, 42.0, 51.0, 41.0, 40.0, 43.0, 50.0, 47.0, 51.0, 32.0, 38.0, 33.0, 31.0, 35.0, 28.0, 24.0, 27.0, 16.0, 19.0, 12.0, 9.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9043163061141968, -0.8735536336898804, -0.842790961265564, -0.8120282888412476, -0.7812656164169312, -0.7505029439926147, -0.7197402715682983, -0.6889775991439819, -0.6582149267196655, -0.6274522542953491, -0.5966895818710327, -0.5659269094467163, -0.5351642370223999, -0.5044015645980835, -0.4736388921737671, -0.4428762197494507, -0.4121135175228119, -0.3813508450984955, -0.3505881726741791, -0.31982550024986267, -0.28906282782554626, -0.25830012559890747, -0.22753746807575226, -0.19677479565143585, -0.16601212322711945, -0.13524945080280304, -0.10448677837848663, -0.07372409850358963, -0.042961426079273224, -0.01219874620437622, 0.018563926219940186, 0.04932659864425659, 0.080089271068573, 0.1108519434928894, 0.1416146159172058, 0.17237728834152222, 0.20313996076583862, 0.23390264809131622, 0.26466530561447144, 0.29542797803878784, 0.32619065046310425, 0.35695332288742065, 0.38771599531173706, 0.41847866773605347, 0.4492413401603699, 0.4800040125846863, 0.5107666850090027, 0.5415293574333191, 0.5722920894622803, 0.6030547618865967, 0.6338174343109131, 0.6645801067352295, 0.6953427791595459, 0.7261054515838623, 0.7568681240081787, 0.7876307964324951, 0.8183934688568115, 0.8491561412811279, 0.8799188137054443, 0.9106814861297607, 0.9414441585540771, 0.9722068309783936, 1.00296950340271, 1.0337321758270264, 1.0644948482513428]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 7.0, 13.0, 8.0, 14.0, 17.0, 15.0, 35.0, 31.0, 57.0, 74.0, 138.0, 196.0, 283.0, 526.0, 929.0, 1830.0, 3636.0, 8441.0, 21162.0, 62553.0, 239569.0, 493655.0, 145672.0, 41880.0, 15095.0, 6455.0, 2887.0, 1434.0, 735.0, 411.0, 260.0, 165.0, 99.0, 70.0, 43.0, 40.0, 21.0, 23.0, 11.0, 15.0, 8.0, 8.0, 5.0, 3.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1738433837890625, -1.133819580078125, -1.0937957763671875, -1.05377197265625, -1.0137481689453125, -0.973724365234375, -0.9337005615234375, -0.8936767578125, -0.8536529541015625, -0.813629150390625, -0.7736053466796875, -0.73358154296875, -0.6935577392578125, -0.653533935546875, -0.6135101318359375, -0.573486328125, -0.5334625244140625, -0.493438720703125, -0.4534149169921875, -0.41339111328125, -0.3733673095703125, -0.333343505859375, -0.2933197021484375, -0.2532958984375, -0.2132720947265625, -0.173248291015625, -0.1332244873046875, -0.09320068359375, -0.0531768798828125, -0.013153076171875, 0.0268707275390625, 0.06689453125, 0.1069183349609375, 0.146942138671875, 0.1869659423828125, 0.22698974609375, 0.2670135498046875, 0.307037353515625, 0.3470611572265625, 0.3870849609375, 0.4271087646484375, 0.467132568359375, 0.5071563720703125, 0.54718017578125, 0.5872039794921875, 0.627227783203125, 0.6672515869140625, 0.707275390625, 0.7472991943359375, 0.787322998046875, 0.8273468017578125, 0.86737060546875, 0.9073944091796875, 0.947418212890625, 0.9874420166015625, 1.0274658203125, 1.0674896240234375, 1.107513427734375, 1.1475372314453125, 1.18756103515625, 1.2275848388671875, 1.267608642578125, 1.3076324462890625, 1.34765625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 12.0, 12.0, 24.0, 18.0, 21.0, 20.0, 34.0, 30.0, 19.0, 30.0, 35.0, 41.0, 41.0, 49.0, 53.0, 54.0, 44.0, 35.0, 39.0, 52.0, 38.0, 35.0, 35.0, 27.0, 26.0, 28.0, 18.0, 9.0, 15.0, 10.0, 15.0, 11.0, 5.0, 7.0, 6.0, 3.0, 1.0, 2.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.7421875, -0.7194671630859375, -0.696746826171875, -0.6740264892578125, -0.65130615234375, -0.6285858154296875, -0.605865478515625, -0.5831451416015625, -0.5604248046875, -0.5377044677734375, -0.514984130859375, -0.4922637939453125, -0.46954345703125, -0.4468231201171875, -0.424102783203125, -0.4013824462890625, -0.378662109375, -0.3559417724609375, -0.333221435546875, -0.3105010986328125, -0.28778076171875, -0.2650604248046875, -0.242340087890625, -0.2196197509765625, -0.1968994140625, -0.1741790771484375, -0.151458740234375, -0.1287384033203125, -0.10601806640625, -0.0832977294921875, -0.060577392578125, -0.0378570556640625, -0.01513671875, 0.0075836181640625, 0.030303955078125, 0.0530242919921875, 0.07574462890625, 0.0984649658203125, 0.121185302734375, 0.1439056396484375, 0.1666259765625, 0.1893463134765625, 0.212066650390625, 0.2347869873046875, 0.25750732421875, 0.2802276611328125, 0.302947998046875, 0.3256683349609375, 0.348388671875, 0.3711090087890625, 0.393829345703125, 0.4165496826171875, 0.43927001953125, 0.4619903564453125, 0.484710693359375, 0.5074310302734375, 0.5301513671875, 0.5528717041015625, 0.575592041015625, 0.5983123779296875, 0.62103271484375, 0.6437530517578125, 0.666473388671875, 0.6891937255859375, 0.7119140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 1.0, 7.0, 9.0, 12.0, 16.0, 23.0, 43.0, 52.0, 66.0, 92.0, 165.0, 227.0, 392.0, 706.0, 1353.0, 3341.0, 11115.0, 62951.0, 699049.0, 231977.0, 26336.0, 6146.0, 2097.0, 995.0, 508.0, 308.0, 181.0, 128.0, 83.0, 46.0, 33.0, 24.0, 20.0, 13.0, 11.0, 4.0, 1.0, 5.0, 6.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.166015625, -2.0880126953125, -2.010009765625, -1.9320068359375, -1.85400390625, -1.7760009765625, -1.697998046875, -1.6199951171875, -1.5419921875, -1.4639892578125, -1.385986328125, -1.3079833984375, -1.22998046875, -1.1519775390625, -1.073974609375, -0.9959716796875, -0.91796875, -0.8399658203125, -0.761962890625, -0.6839599609375, -0.60595703125, -0.5279541015625, -0.449951171875, -0.3719482421875, -0.2939453125, -0.2159423828125, -0.137939453125, -0.0599365234375, 0.01806640625, 0.0960693359375, 0.174072265625, 0.2520751953125, 0.330078125, 0.4080810546875, 0.486083984375, 0.5640869140625, 0.64208984375, 0.7200927734375, 0.798095703125, 0.8760986328125, 0.9541015625, 1.0321044921875, 1.110107421875, 1.1881103515625, 1.26611328125, 1.3441162109375, 1.422119140625, 1.5001220703125, 1.578125, 1.6561279296875, 1.734130859375, 1.8121337890625, 1.89013671875, 1.9681396484375, 2.046142578125, 2.1241455078125, 2.2021484375, 2.2801513671875, 2.358154296875, 2.4361572265625, 2.51416015625, 2.5921630859375, 2.670166015625, 2.7481689453125, 2.826171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 24.0, 40.0, 59.0, 59.0, 92.0, 90.0, 113.0, 107.0, 88.0, 83.0, 69.0, 49.0, 28.0, 21.0, 17.0, 9.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.55517578125, -6.3134765625, -6.07177734375, -5.830078125, -5.58837890625, -5.3466796875, -5.10498046875, -4.86328125, -4.62158203125, -4.3798828125, -4.13818359375, -3.896484375, -3.65478515625, -3.4130859375, -3.17138671875, -2.9296875, -2.68798828125, -2.4462890625, -2.20458984375, -1.962890625, -1.72119140625, -1.4794921875, -1.23779296875, -0.99609375, -0.75439453125, -0.5126953125, -0.27099609375, -0.029296875, 0.21240234375, 0.4541015625, 0.69580078125, 0.9375, 1.17919921875, 1.4208984375, 1.66259765625, 1.904296875, 2.14599609375, 2.3876953125, 2.62939453125, 2.87109375, 3.11279296875, 3.3544921875, 3.59619140625, 3.837890625, 4.07958984375, 4.3212890625, 4.56298828125, 4.8046875, 5.04638671875, 5.2880859375, 5.52978515625, 5.771484375, 6.01318359375, 6.2548828125, 6.49658203125, 6.73828125, 6.97998046875, 7.2216796875, 7.46337890625, 7.705078125, 7.94677734375, 8.1884765625, 8.43017578125, 8.671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 21.0, 24.0, 27.0, 56.0, 116.0, 235.0, 572.0, 1569.0, 6442.0, 309367.0, 718864.0, 8107.0, 1786.0, 689.0, 286.0, 150.0, 86.0, 39.0, 32.0, 19.0, 12.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.33966064453125, -1.2789306640625, -1.21820068359375, -1.157470703125, -1.09674072265625, -1.0360107421875, -0.97528076171875, -0.91455078125, -0.85382080078125, -0.7930908203125, -0.73236083984375, -0.671630859375, -0.61090087890625, -0.5501708984375, -0.48944091796875, -0.4287109375, -0.36798095703125, -0.3072509765625, -0.24652099609375, -0.185791015625, -0.12506103515625, -0.0643310546875, -0.00360107421875, 0.05712890625, 0.11785888671875, 0.1785888671875, 0.23931884765625, 0.300048828125, 0.36077880859375, 0.4215087890625, 0.48223876953125, 0.54296875, 0.60369873046875, 0.6644287109375, 0.72515869140625, 0.785888671875, 0.84661865234375, 0.9073486328125, 0.96807861328125, 1.02880859375, 1.08953857421875, 1.1502685546875, 1.21099853515625, 1.271728515625, 1.33245849609375, 1.3931884765625, 1.45391845703125, 1.5146484375, 1.57537841796875, 1.6361083984375, 1.69683837890625, 1.757568359375, 1.81829833984375, 1.8790283203125, 1.93975830078125, 2.00048828125, 2.06121826171875, 2.1219482421875, 2.18267822265625, 2.243408203125, 2.30413818359375, 2.3648681640625, 2.42559814453125, 2.486328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 7.0, 6.0, 19.0, 23.0, 36.0, 66.0, 118.0, 165.0, 154.0, 120.0, 80.0, 75.0, 40.0, 21.0, 17.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.560585021972656e-05, -9.245611727237701e-05, -8.930638432502747e-05, -8.615665137767792e-05, -8.300691843032837e-05, -7.985718548297882e-05, -7.670745253562927e-05, -7.355771958827972e-05, -7.040798664093018e-05, -6.725825369358063e-05, -6.410852074623108e-05, -6.095878779888153e-05, -5.780905485153198e-05, -5.4659321904182434e-05, -5.1509588956832886e-05, -4.835985600948334e-05, -4.521012306213379e-05, -4.206039011478424e-05, -3.891065716743469e-05, -3.5760924220085144e-05, -3.2611191272735596e-05, -2.9461458325386047e-05, -2.63117253780365e-05, -2.316199243068695e-05, -2.0012259483337402e-05, -1.6862526535987854e-05, -1.3712793588638306e-05, -1.0563060641288757e-05, -7.413327693939209e-06, -4.263594746589661e-06, -1.1138617992401123e-06, 2.035871148109436e-06, 5.185604095458984e-06, 8.335337042808533e-06, 1.1485069990158081e-05, 1.463480293750763e-05, 1.7784535884857178e-05, 2.0934268832206726e-05, 2.4084001779556274e-05, 2.7233734726905823e-05, 3.038346767425537e-05, 3.353320062160492e-05, 3.668293356895447e-05, 3.9832666516304016e-05, 4.2982399463653564e-05, 4.613213241100311e-05, 4.928186535835266e-05, 5.243159830570221e-05, 5.558133125305176e-05, 5.8731064200401306e-05, 6.188079714775085e-05, 6.50305300951004e-05, 6.818026304244995e-05, 7.13299959897995e-05, 7.447972893714905e-05, 7.76294618844986e-05, 8.077919483184814e-05, 8.392892777919769e-05, 8.707866072654724e-05, 9.022839367389679e-05, 9.337812662124634e-05, 9.652785956859589e-05, 9.967759251594543e-05, 0.00010282732546329498, 0.00010597705841064453]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 6.0, 15.0, 15.0, 54.0, 80.0, 145.0, 307.0, 1159.0, 8938.0, 1010677.0, 24475.0, 1835.0, 450.0, 170.0, 79.0, 50.0, 34.0, 20.0, 18.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.955078125, -2.874420166015625, -2.79376220703125, -2.713104248046875, -2.6324462890625, -2.551788330078125, -2.47113037109375, -2.390472412109375, -2.309814453125, -2.229156494140625, -2.14849853515625, -2.067840576171875, -1.9871826171875, -1.906524658203125, -1.82586669921875, -1.745208740234375, -1.66455078125, -1.583892822265625, -1.50323486328125, -1.422576904296875, -1.3419189453125, -1.261260986328125, -1.18060302734375, -1.099945068359375, -1.019287109375, -0.938629150390625, -0.85797119140625, -0.777313232421875, -0.6966552734375, -0.615997314453125, -0.53533935546875, -0.454681396484375, -0.3740234375, -0.293365478515625, -0.21270751953125, -0.132049560546875, -0.0513916015625, 0.029266357421875, 0.10992431640625, 0.190582275390625, 0.271240234375, 0.351898193359375, 0.43255615234375, 0.513214111328125, 0.5938720703125, 0.674530029296875, 0.75518798828125, 0.835845947265625, 0.91650390625, 0.997161865234375, 1.07781982421875, 1.158477783203125, 1.2391357421875, 1.319793701171875, 1.40045166015625, 1.481109619140625, 1.561767578125, 1.642425537109375, 1.72308349609375, 1.803741455078125, 1.8843994140625, 1.965057373046875, 2.04571533203125, 2.126373291015625, 2.20703125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 4.0, 9.0, 38.0, 167.0, 534.0, 204.0, 28.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8125, -6.669219970703125, -6.52593994140625, -6.382659912109375, -6.2393798828125, -6.096099853515625, -5.95281982421875, -5.809539794921875, -5.666259765625, -5.522979736328125, -5.37969970703125, -5.236419677734375, -5.0931396484375, -4.949859619140625, -4.80657958984375, -4.663299560546875, -4.52001953125, -4.376739501953125, -4.23345947265625, -4.090179443359375, -3.9468994140625, -3.803619384765625, -3.66033935546875, -3.517059326171875, -3.373779296875, -3.230499267578125, -3.08721923828125, -2.943939208984375, -2.8006591796875, -2.657379150390625, -2.51409912109375, -2.370819091796875, -2.2275390625, -2.084259033203125, -1.94097900390625, -1.797698974609375, -1.6544189453125, -1.511138916015625, -1.36785888671875, -1.224578857421875, -1.081298828125, -0.938018798828125, -0.79473876953125, -0.651458740234375, -0.5081787109375, -0.364898681640625, -0.22161865234375, -0.078338623046875, 0.06494140625, 0.208221435546875, 0.35150146484375, 0.494781494140625, 0.6380615234375, 0.781341552734375, 0.92462158203125, 1.067901611328125, 1.211181640625, 1.354461669921875, 1.49774169921875, 1.641021728515625, 1.7843017578125, 1.927581787109375, 2.07086181640625, 2.214141845703125, 2.357421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 19.0, 14.0, 24.0, 47.0, 72.0, 84.0, 173.0, 202.0, 141.0, 75.0, 61.0, 20.0, 16.0, 13.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.11675453186035, -21.584630966186523, -21.052509307861328, -20.5203857421875, -19.988262176513672, -19.456138610839844, -18.92401695251465, -18.39189338684082, -17.859769821166992, -17.327646255493164, -16.79552459716797, -16.26340103149414, -15.731277465820312, -15.1991548538208, -14.667032241821289, -14.134908676147461, -13.60278606414795, -13.070663452148438, -12.53853988647461, -12.006417274475098, -11.47429370880127, -10.942171096801758, -10.41004753112793, -9.877924919128418, -9.345802307128906, -8.813679695129395, -8.281556129455566, -7.749433517456055, -7.217309951782227, -6.685187339782715, -6.153064250946045, -5.620941162109375, -5.0888166427612305, -4.5566935539245605, -4.024570465087891, -3.4924476146698, -2.96032452583313, -2.42820143699646, -1.8960785865783691, -1.3639554977416992, -0.8318324089050293, -0.29970937967300415, 0.232413649559021, 0.7645366191864014, 1.2966597080230713, 1.8287827968597412, 2.360905647277832, 2.893028736114502, 3.425151824951172, 3.957274913787842, 4.489398002624512, 5.021520614624023, 5.553644180297852, 6.085766792297363, 6.617889881134033, 7.150012969970703, 7.682136058807373, 8.214259147644043, 8.746381759643555, 9.278505325317383, 9.810627937316895, 10.342751502990723, 10.874874114990234, 11.406997680664062, 11.939120292663574]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 0.0, 4.0, 6.0, 10.0, 4.0, 7.0, 6.0, 7.0, 11.0, 13.0, 16.0, 18.0, 21.0, 30.0, 26.0, 32.0, 21.0, 29.0, 46.0, 38.0, 56.0, 44.0, 54.0, 48.0, 39.0, 49.0, 39.0, 36.0, 30.0, 43.0, 25.0, 19.0, 27.0, 14.0, 22.0, 20.0, 14.0, 16.0, 16.0, 7.0, 14.0, 7.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.390840530395508, -16.845069885253906, -16.299299240112305, -15.753527641296387, -15.207756996154785, -14.661985397338867, -14.116214752197266, -13.570444107055664, -13.024673461914062, -12.478902816772461, -11.933131217956543, -11.387360572814941, -10.84158992767334, -10.295818328857422, -9.75004768371582, -9.204277038574219, -8.6585054397583, -8.1127347946167, -7.5669636726379395, -7.02119255065918, -6.475421905517578, -5.929650783538818, -5.383879661560059, -4.838109016418457, -4.292337894439697, -3.7465670108795166, -3.200796127319336, -2.655025005340576, -2.1092541217803955, -1.5634832382202148, -1.017712116241455, -0.4719412326812744, 0.07382965087890625, 0.6196005940437317, 1.1653715372085571, 1.7111425399780273, 2.256913423538208, 2.8026843070983887, 3.3484554290771484, 3.894226312637329, 4.43999719619751, 4.9857683181762695, 5.531538963317871, 6.077310085296631, 6.623081207275391, 7.168851852416992, 7.714622974395752, 8.260394096374512, 8.806164741516113, 9.351935386657715, 9.897706985473633, 10.443477630615234, 10.989248275756836, 11.535018920898438, 12.080790519714355, 12.626561164855957, 13.172332763671875, 13.718103408813477, 14.263875007629395, 14.809645652770996, 15.355416297912598, 15.901187896728516, 16.446958541870117, 16.99272918701172, 17.53849983215332]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 23.0, 14.0, 14.0, 39.0, 38.0, 47.0, 108.0, 176.0, 391.0, 1171.0, 5551.0, 4089110.0, 91461.0, 4247.0, 1024.0, 361.0, 171.0, 107.0, 54.0, 47.0, 28.0, 29.0, 17.0, 9.0, 11.0, 7.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.52734375, -3.436737060546875, -3.34613037109375, -3.255523681640625, -3.1649169921875, -3.074310302734375, -2.98370361328125, -2.893096923828125, -2.802490234375, -2.711883544921875, -2.62127685546875, -2.530670166015625, -2.4400634765625, -2.349456787109375, -2.25885009765625, -2.168243408203125, -2.07763671875, -1.987030029296875, -1.89642333984375, -1.805816650390625, -1.7152099609375, -1.624603271484375, -1.53399658203125, -1.443389892578125, -1.352783203125, -1.262176513671875, -1.17156982421875, -1.080963134765625, -0.9903564453125, -0.899749755859375, -0.80914306640625, -0.718536376953125, -0.6279296875, -0.537322998046875, -0.44671630859375, -0.356109619140625, -0.2655029296875, -0.174896240234375, -0.08428955078125, 0.006317138671875, 0.096923828125, 0.187530517578125, 0.27813720703125, 0.368743896484375, 0.4593505859375, 0.549957275390625, 0.64056396484375, 0.731170654296875, 0.82177734375, 0.912384033203125, 1.00299072265625, 1.093597412109375, 1.1842041015625, 1.274810791015625, 1.36541748046875, 1.456024169921875, 1.546630859375, 1.637237548828125, 1.72784423828125, 1.818450927734375, 1.9090576171875, 1.999664306640625, 2.09027099609375, 2.180877685546875, 2.271484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 8.0, 7.0, 6.0, 6.0, 9.0, 12.0, 15.0, 16.0, 17.0, 27.0, 30.0, 37.0, 39.0, 39.0, 55.0, 62.0, 54.0, 49.0, 64.0, 41.0, 54.0, 56.0, 53.0, 39.0, 37.0, 20.0, 37.0, 13.0, 19.0, 13.0, 6.0, 15.0, 8.0, 6.0, 4.0, 8.0, 4.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0], "bins": [-1.11328125, -1.0817718505859375, -1.050262451171875, -1.0187530517578125, -0.98724365234375, -0.9557342529296875, -0.924224853515625, -0.8927154541015625, -0.8612060546875, -0.8296966552734375, -0.798187255859375, -0.7666778564453125, -0.73516845703125, -0.7036590576171875, -0.672149658203125, -0.6406402587890625, -0.609130859375, -0.5776214599609375, -0.546112060546875, -0.5146026611328125, -0.48309326171875, -0.4515838623046875, -0.420074462890625, -0.3885650634765625, -0.3570556640625, -0.3255462646484375, -0.294036865234375, -0.2625274658203125, -0.23101806640625, -0.1995086669921875, -0.167999267578125, -0.1364898681640625, -0.10498046875, -0.0734710693359375, -0.041961669921875, -0.0104522705078125, 0.02105712890625, 0.0525665283203125, 0.084075927734375, 0.1155853271484375, 0.1470947265625, 0.1786041259765625, 0.210113525390625, 0.2416229248046875, 0.27313232421875, 0.3046417236328125, 0.336151123046875, 0.3676605224609375, 0.399169921875, 0.4306793212890625, 0.462188720703125, 0.4936981201171875, 0.52520751953125, 0.5567169189453125, 0.588226318359375, 0.6197357177734375, 0.6512451171875, 0.6827545166015625, 0.714263916015625, 0.7457733154296875, 0.77728271484375, 0.8087921142578125, 0.840301513671875, 0.8718109130859375, 0.9033203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 14.0, 17.0, 15.0, 22.0, 34.0, 44.0, 46.0, 74.0, 108.0, 198.0, 378.0, 1099.0, 6661.0, 4112781.0, 67817.0, 3354.0, 754.0, 315.0, 164.0, 91.0, 64.0, 63.0, 35.0, 35.0, 24.0, 12.0, 18.0, 10.0, 7.0, 10.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.461029052734375, -3.35565185546875, -3.250274658203125, -3.1448974609375, -3.039520263671875, -2.93414306640625, -2.828765869140625, -2.723388671875, -2.618011474609375, -2.51263427734375, -2.407257080078125, -2.3018798828125, -2.196502685546875, -2.09112548828125, -1.985748291015625, -1.88037109375, -1.774993896484375, -1.66961669921875, -1.564239501953125, -1.4588623046875, -1.353485107421875, -1.24810791015625, -1.142730712890625, -1.037353515625, -0.931976318359375, -0.82659912109375, -0.721221923828125, -0.6158447265625, -0.510467529296875, -0.40509033203125, -0.299713134765625, -0.1943359375, -0.088958740234375, 0.01641845703125, 0.121795654296875, 0.2271728515625, 0.332550048828125, 0.43792724609375, 0.543304443359375, 0.648681640625, 0.754058837890625, 0.85943603515625, 0.964813232421875, 1.0701904296875, 1.175567626953125, 1.28094482421875, 1.386322021484375, 1.49169921875, 1.597076416015625, 1.70245361328125, 1.807830810546875, 1.9132080078125, 2.018585205078125, 2.12396240234375, 2.229339599609375, 2.334716796875, 2.440093994140625, 2.54547119140625, 2.650848388671875, 2.7562255859375, 2.861602783203125, 2.96697998046875, 3.072357177734375, 3.177734375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 10.0, 26.0, 604.0, 3362.0, 42.0, 20.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.252197265625, -0.22417831420898438, -0.19615936279296875, -0.16814041137695312, -0.1401214599609375, -0.11210250854492188, -0.08408355712890625, -0.056064605712890625, -0.028045654296875, -2.6702880859375e-05, 0.02799224853515625, 0.056011199951171875, 0.0840301513671875, 0.11204910278320312, 0.14006805419921875, 0.16808700561523438, 0.19610595703125, 0.22412490844726562, 0.25214385986328125, 0.2801628112792969, 0.3081817626953125, 0.3362007141113281, 0.36421966552734375, 0.3922386169433594, 0.420257568359375, 0.4482765197753906, 0.47629547119140625, 0.5043144226074219, 0.5323333740234375, 0.5603523254394531, 0.5883712768554688, 0.6163902282714844, 0.6444091796875, 0.6724281311035156, 0.7004470825195312, 0.7284660339355469, 0.7564849853515625, 0.7845039367675781, 0.8125228881835938, 0.8405418395996094, 0.868560791015625, 0.8965797424316406, 0.9245986938476562, 0.9526176452636719, 0.9806365966796875, 1.0086555480957031, 1.0366744995117188, 1.0646934509277344, 1.09271240234375, 1.1207313537597656, 1.1487503051757812, 1.1767692565917969, 1.2047882080078125, 1.2328071594238281, 1.2608261108398438, 1.2888450622558594, 1.316864013671875, 1.3448829650878906, 1.3729019165039062, 1.4009208679199219, 1.4289398193359375, 1.4569587707519531, 1.4849777221679688, 1.5129966735839844, 1.541015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 231.0, 666.0, 89.0, 19.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.540596008300781, -11.237174034118652, -10.933752059936523, -10.630329132080078, -10.32690715789795, -10.02348518371582, -9.720063209533691, -9.416641235351562, -9.113219261169434, -8.809797286987305, -8.506375312805176, -8.202953338623047, -7.89953088760376, -7.596108436584473, -7.292686462402344, -6.989264488220215, -6.685842037200928, -6.382420063018799, -6.078997611999512, -5.775575637817383, -5.472153663635254, -5.168731689453125, -4.865309238433838, -4.561887264251709, -4.258464813232422, -3.955042600631714, -3.651620626449585, -3.348198413848877, -3.044776439666748, -2.74135422706604, -2.437932014465332, -2.134510040283203, -1.831087589263916, -1.5276654958724976, -1.224243402481079, -0.9208211898803711, -0.6173990964889526, -0.3139770030975342, -0.010554790496826172, 0.29286718368530273, 0.5962893962860107, 0.8997114896774292, 1.2031335830688477, 1.5065557956695557, 1.8099778890609741, 2.1133999824523926, 2.4168221950531006, 2.7202441692352295, 3.0236663818359375, 3.3270885944366455, 3.6305105686187744, 3.9339327812194824, 4.237354755401611, 4.540777206420898, 4.844199180603027, 5.147621154785156, 5.451043128967285, 5.754465103149414, 6.057887554168701, 6.36130952835083, 6.664731502532959, 6.968153953552246, 7.271575927734375, 7.574997901916504, 7.878420352935791]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 12.0, 17.0, 11.0, 17.0, 20.0, 15.0, 26.0, 26.0, 29.0, 28.0, 38.0, 40.0, 34.0, 44.0, 48.0, 54.0, 42.0, 43.0, 55.0, 34.0, 41.0, 44.0, 29.0, 28.0, 25.0, 27.0, 31.0, 26.0, 21.0, 23.0, 11.0, 12.0, 9.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.294280767440796, -1.2528924942016602, -1.2115042209625244, -1.1701159477233887, -1.128727674484253, -1.0873394012451172, -1.0459511280059814, -1.0045628547668457, -0.96317458152771, -0.9217863082885742, -0.8803980350494385, -0.8390097618103027, -0.797621488571167, -0.7562332153320312, -0.7148449420928955, -0.6734566688537598, -0.632068395614624, -0.5906801223754883, -0.5492918491363525, -0.5079035758972168, -0.46651530265808105, -0.4251270294189453, -0.38373875617980957, -0.34235048294067383, -0.3009622097015381, -0.25957393646240234, -0.2181856632232666, -0.17679738998413086, -0.13540911674499512, -0.09402084350585938, -0.05263257026672363, -0.01124429702758789, 0.0301438570022583, 0.07153213024139404, 0.11292040348052979, 0.15430867671966553, 0.19569694995880127, 0.237085223197937, 0.27847349643707275, 0.3198617696762085, 0.36125004291534424, 0.40263831615448, 0.4440265893936157, 0.48541486263275146, 0.5268031358718872, 0.568191409111023, 0.6095796823501587, 0.6509679555892944, 0.6923562288284302, 0.7337445020675659, 0.7751327753067017, 0.8165210485458374, 0.8579093217849731, 0.8992975950241089, 0.9406858682632446, 0.9820741415023804, 1.0234624147415161, 1.0648506879806519, 1.1062389612197876, 1.1476272344589233, 1.189015507698059, 1.2304037809371948, 1.2717920541763306, 1.3131803274154663, 1.354568600654602]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 9.0, 10.0, 12.0, 16.0, 20.0, 17.0, 32.0, 71.0, 61.0, 65.0, 127.0, 143.0, 210.0, 251.0, 423.0, 680.0, 1011.0, 1784.0, 3400.0, 7265.0, 18305.0, 63413.0, 373273.0, 462550.0, 77021.0, 21199.0, 8137.0, 3686.0, 2032.0, 1156.0, 604.0, 468.0, 307.0, 226.0, 137.0, 111.0, 82.0, 41.0, 41.0, 39.0, 34.0, 22.0, 22.0, 10.0, 12.0, 2.0, 4.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0], "bins": [-2.029296875, -1.9697265625, -1.91015625, -1.8505859375, -1.791015625, -1.7314453125, -1.671875, -1.6123046875, -1.552734375, -1.4931640625, -1.43359375, -1.3740234375, -1.314453125, -1.2548828125, -1.1953125, -1.1357421875, -1.076171875, -1.0166015625, -0.95703125, -0.8974609375, -0.837890625, -0.7783203125, -0.71875, -0.6591796875, -0.599609375, -0.5400390625, -0.48046875, -0.4208984375, -0.361328125, -0.3017578125, -0.2421875, -0.1826171875, -0.123046875, -0.0634765625, -0.00390625, 0.0556640625, 0.115234375, 0.1748046875, 0.234375, 0.2939453125, 0.353515625, 0.4130859375, 0.47265625, 0.5322265625, 0.591796875, 0.6513671875, 0.7109375, 0.7705078125, 0.830078125, 0.8896484375, 0.94921875, 1.0087890625, 1.068359375, 1.1279296875, 1.1875, 1.2470703125, 1.306640625, 1.3662109375, 1.42578125, 1.4853515625, 1.544921875, 1.6044921875, 1.6640625, 1.7236328125, 1.783203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 6.0, 8.0, 9.0, 16.0, 19.0, 8.0, 16.0, 36.0, 33.0, 40.0, 36.0, 33.0, 52.0, 36.0, 74.0, 57.0, 51.0, 47.0, 50.0, 49.0, 48.0, 33.0, 39.0, 35.0, 29.0, 19.0, 20.0, 16.0, 12.0, 6.0, 7.0, 10.0, 9.0, 5.0, 3.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0595703125, -1.0286865234375, -0.997802734375, -0.9669189453125, -0.93603515625, -0.9051513671875, -0.874267578125, -0.8433837890625, -0.8125, -0.7816162109375, -0.750732421875, -0.7198486328125, -0.68896484375, -0.6580810546875, -0.627197265625, -0.5963134765625, -0.5654296875, -0.5345458984375, -0.503662109375, -0.4727783203125, -0.44189453125, -0.4110107421875, -0.380126953125, -0.3492431640625, -0.318359375, -0.2874755859375, -0.256591796875, -0.2257080078125, -0.19482421875, -0.1639404296875, -0.133056640625, -0.1021728515625, -0.0712890625, -0.0404052734375, -0.009521484375, 0.0213623046875, 0.05224609375, 0.0831298828125, 0.114013671875, 0.1448974609375, 0.17578125, 0.2066650390625, 0.237548828125, 0.2684326171875, 0.29931640625, 0.3302001953125, 0.361083984375, 0.3919677734375, 0.4228515625, 0.4537353515625, 0.484619140625, 0.5155029296875, 0.54638671875, 0.5772705078125, 0.608154296875, 0.6390380859375, 0.669921875, 0.7008056640625, 0.731689453125, 0.7625732421875, 0.79345703125, 0.8243408203125, 0.855224609375, 0.8861083984375, 0.9169921875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 20.0, 20.0, 35.0, 68.0, 110.0, 199.0, 420.0, 907.0, 2175.0, 7195.0, 102013.0, 908239.0, 20640.0, 3801.0, 1374.0, 612.0, 318.0, 157.0, 100.0, 57.0, 32.0, 17.0, 11.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.06317138671875, -4.8958740234375, -4.72857666015625, -4.561279296875, -4.39398193359375, -4.2266845703125, -4.05938720703125, -3.89208984375, -3.72479248046875, -3.5574951171875, -3.39019775390625, -3.222900390625, -3.05560302734375, -2.8883056640625, -2.72100830078125, -2.5537109375, -2.38641357421875, -2.2191162109375, -2.05181884765625, -1.884521484375, -1.71722412109375, -1.5499267578125, -1.38262939453125, -1.21533203125, -1.04803466796875, -0.8807373046875, -0.71343994140625, -0.546142578125, -0.37884521484375, -0.2115478515625, -0.04425048828125, 0.123046875, 0.29034423828125, 0.4576416015625, 0.62493896484375, 0.792236328125, 0.95953369140625, 1.1268310546875, 1.29412841796875, 1.46142578125, 1.62872314453125, 1.7960205078125, 1.96331787109375, 2.130615234375, 2.29791259765625, 2.4652099609375, 2.63250732421875, 2.7998046875, 2.96710205078125, 3.1343994140625, 3.30169677734375, 3.468994140625, 3.63629150390625, 3.8035888671875, 3.97088623046875, 4.13818359375, 4.30548095703125, 4.4727783203125, 4.64007568359375, 4.807373046875, 4.97467041015625, 5.1419677734375, 5.30926513671875, 5.4765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 12.0, 14.0, 22.0, 37.0, 38.0, 49.0, 58.0, 64.0, 70.0, 94.0, 98.0, 86.0, 76.0, 62.0, 49.0, 43.0, 25.0, 20.0, 19.0, 16.0, 13.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.49847412109375, -6.2586669921875, -6.01885986328125, -5.779052734375, -5.53924560546875, -5.2994384765625, -5.05963134765625, -4.81982421875, -4.58001708984375, -4.3402099609375, -4.10040283203125, -3.860595703125, -3.62078857421875, -3.3809814453125, -3.14117431640625, -2.9013671875, -2.66156005859375, -2.4217529296875, -2.18194580078125, -1.942138671875, -1.70233154296875, -1.4625244140625, -1.22271728515625, -0.98291015625, -0.74310302734375, -0.5032958984375, -0.26348876953125, -0.023681640625, 0.21612548828125, 0.4559326171875, 0.69573974609375, 0.935546875, 1.17535400390625, 1.4151611328125, 1.65496826171875, 1.894775390625, 2.13458251953125, 2.3743896484375, 2.61419677734375, 2.85400390625, 3.09381103515625, 3.3336181640625, 3.57342529296875, 3.813232421875, 4.05303955078125, 4.2928466796875, 4.53265380859375, 4.7724609375, 5.01226806640625, 5.2520751953125, 5.49188232421875, 5.731689453125, 5.97149658203125, 6.2113037109375, 6.45111083984375, 6.69091796875, 6.93072509765625, 7.1705322265625, 7.41033935546875, 7.650146484375, 7.88995361328125, 8.1297607421875, 8.36956787109375, 8.609375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 24.0, 22.0, 66.0, 129.0, 338.0, 1165.0, 5660.0, 981080.0, 55583.0, 3216.0, 774.0, 252.0, 100.0, 62.0, 28.0, 8.0, 10.0, 7.0, 9.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.96875, -6.79815673828125, -6.6275634765625, -6.45697021484375, -6.286376953125, -6.11578369140625, -5.9451904296875, -5.77459716796875, -5.60400390625, -5.43341064453125, -5.2628173828125, -5.09222412109375, -4.921630859375, -4.75103759765625, -4.5804443359375, -4.40985107421875, -4.2392578125, -4.06866455078125, -3.8980712890625, -3.72747802734375, -3.556884765625, -3.38629150390625, -3.2156982421875, -3.04510498046875, -2.87451171875, -2.70391845703125, -2.5333251953125, -2.36273193359375, -2.192138671875, -2.02154541015625, -1.8509521484375, -1.68035888671875, -1.509765625, -1.33917236328125, -1.1685791015625, -0.99798583984375, -0.827392578125, -0.65679931640625, -0.4862060546875, -0.31561279296875, -0.14501953125, 0.02557373046875, 0.1961669921875, 0.36676025390625, 0.537353515625, 0.70794677734375, 0.8785400390625, 1.04913330078125, 1.2197265625, 1.39031982421875, 1.5609130859375, 1.73150634765625, 1.902099609375, 2.07269287109375, 2.2432861328125, 2.41387939453125, 2.58447265625, 2.75506591796875, 2.9256591796875, 3.09625244140625, 3.266845703125, 3.43743896484375, 3.6080322265625, 3.77862548828125, 3.94921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 24.0, 79.0, 241.0, 388.0, 154.0, 71.0, 12.0, 6.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003535747528076172, -0.0003432817757129669, -0.00033298879861831665, -0.0003226958215236664, -0.0003124028444290161, -0.00030210986733436584, -0.0002918168902397156, -0.0002815239131450653, -0.00027123093605041504, -0.00026093795895576477, -0.0002506449818611145, -0.00024035200476646423, -0.00023005902767181396, -0.0002197660505771637, -0.00020947307348251343, -0.00019918009638786316, -0.0001888871192932129, -0.00017859414219856262, -0.00016830116510391235, -0.00015800818800926208, -0.00014771521091461182, -0.00013742223381996155, -0.00012712925672531128, -0.00011683627963066101, -0.00010654330253601074, -9.625032544136047e-05, -8.59573483467102e-05, -7.566437125205994e-05, -6.537139415740967e-05, -5.50784170627594e-05, -4.478543996810913e-05, -3.449246287345886e-05, -2.4199485778808594e-05, -1.3906508684158325e-05, -3.6135315895080566e-06, 6.679445505142212e-06, 1.697242259979248e-05, 2.726539969444275e-05, 3.755837678909302e-05, 4.7851353883743286e-05, 5.8144330978393555e-05, 6.843730807304382e-05, 7.873028516769409e-05, 8.902326226234436e-05, 9.931623935699463e-05, 0.0001096092164516449, 0.00011990219354629517, 0.00013019517064094543, 0.0001404881477355957, 0.00015078112483024597, 0.00016107410192489624, 0.0001713670790195465, 0.00018166005611419678, 0.00019195303320884705, 0.00020224601030349731, 0.00021253898739814758, 0.00022283196449279785, 0.00023312494158744812, 0.0002434179186820984, 0.00025371089577674866, 0.0002640038728713989, 0.0002742968499660492, 0.00028458982706069946, 0.00029488280415534973, 0.00030517578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 13.0, 15.0, 17.0, 38.0, 62.0, 95.0, 212.0, 395.0, 876.0, 2342.0, 10251.0, 971512.0, 55321.0, 4642.0, 1546.0, 600.0, 265.0, 139.0, 74.0, 48.0, 28.0, 15.0, 13.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2578125, -2.15411376953125, -2.0504150390625, -1.94671630859375, -1.843017578125, -1.73931884765625, -1.6356201171875, -1.53192138671875, -1.42822265625, -1.32452392578125, -1.2208251953125, -1.11712646484375, -1.013427734375, -0.90972900390625, -0.8060302734375, -0.70233154296875, -0.5986328125, -0.49493408203125, -0.3912353515625, -0.28753662109375, -0.183837890625, -0.08013916015625, 0.0235595703125, 0.12725830078125, 0.23095703125, 0.33465576171875, 0.4383544921875, 0.54205322265625, 0.645751953125, 0.74945068359375, 0.8531494140625, 0.95684814453125, 1.060546875, 1.16424560546875, 1.2679443359375, 1.37164306640625, 1.475341796875, 1.57904052734375, 1.6827392578125, 1.78643798828125, 1.89013671875, 1.99383544921875, 2.0975341796875, 2.20123291015625, 2.304931640625, 2.40863037109375, 2.5123291015625, 2.61602783203125, 2.7197265625, 2.82342529296875, 2.9271240234375, 3.03082275390625, 3.134521484375, 3.23822021484375, 3.3419189453125, 3.44561767578125, 3.54931640625, 3.65301513671875, 3.7567138671875, 3.86041259765625, 3.964111328125, 4.06781005859375, 4.1715087890625, 4.27520751953125, 4.37890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 15.0, 57.0, 366.0, 401.0, 74.0, 15.0, 7.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.26019287109375, -4.0477294921875, -3.83526611328125, -3.622802734375, -3.41033935546875, -3.1978759765625, -2.98541259765625, -2.77294921875, -2.56048583984375, -2.3480224609375, -2.13555908203125, -1.923095703125, -1.71063232421875, -1.4981689453125, -1.28570556640625, -1.0732421875, -0.86077880859375, -0.6483154296875, -0.43585205078125, -0.223388671875, -0.01092529296875, 0.2015380859375, 0.41400146484375, 0.62646484375, 0.83892822265625, 1.0513916015625, 1.26385498046875, 1.476318359375, 1.68878173828125, 1.9012451171875, 2.11370849609375, 2.326171875, 2.53863525390625, 2.7510986328125, 2.96356201171875, 3.176025390625, 3.38848876953125, 3.6009521484375, 3.81341552734375, 4.02587890625, 4.23834228515625, 4.4508056640625, 4.66326904296875, 4.875732421875, 5.08819580078125, 5.3006591796875, 5.51312255859375, 5.7255859375, 5.93804931640625, 6.1505126953125, 6.36297607421875, 6.575439453125, 6.78790283203125, 7.0003662109375, 7.21282958984375, 7.42529296875, 7.63775634765625, 7.8502197265625, 8.06268310546875, 8.275146484375, 8.48760986328125, 8.7000732421875, 8.91253662109375, 9.125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 24.0, 114.0, 377.0, 321.0, 98.0, 41.0, 21.0, 8.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.653228759765625, -44.90689468383789, -43.16055679321289, -41.414222717285156, -39.667884826660156, -37.92155075073242, -36.17521667480469, -34.42887878417969, -32.68254089355469, -30.93620491027832, -29.189868927001953, -27.44353485107422, -25.69719696044922, -23.950862884521484, -22.204526901245117, -20.45819091796875, -18.711856842041016, -16.96552085876465, -15.219184875488281, -13.47284984588623, -11.726513862609863, -9.980177879333496, -8.233842849731445, -6.487506866455078, -4.741170883178711, -2.994835138320923, -1.2484993934631348, 0.4978361129760742, 2.2441720962524414, 3.9905080795288086, 5.736843109130859, 7.483179092407227, 9.229515075683594, 10.975851058959961, 12.722187042236328, 14.468522071838379, 16.214859008789062, 17.961193084716797, 19.707529067993164, 21.45386505126953, 23.2002010345459, 24.946537017822266, 26.692873001098633, 28.439208984375, 30.185543060302734, 31.931880950927734, 33.67821502685547, 35.42455291748047, 37.1708869934082, 38.91722106933594, 40.66355895996094, 42.40989303588867, 44.15623092651367, 45.902565002441406, 47.648902893066406, 49.39523696899414, 51.141571044921875, 52.88790512084961, 54.63424301147461, 56.380577087402344, 58.126914978027344, 59.87324905395508, 61.61958312988281, 63.36592102050781, 65.11225891113281]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 12.0, 13.0, 10.0, 18.0, 19.0, 28.0, 40.0, 37.0, 39.0, 39.0, 53.0, 44.0, 54.0, 66.0, 69.0, 58.0, 64.0, 36.0, 41.0, 47.0, 32.0, 36.0, 30.0, 27.0, 15.0, 26.0, 19.0, 9.0, 4.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.12522888183594, -31.160764694213867, -30.19630241394043, -29.23183822631836, -28.267375946044922, -27.30291175842285, -26.33844757080078, -25.373985290527344, -24.409523010253906, -23.445058822631836, -22.4805965423584, -21.516132354736328, -20.55167007446289, -19.58720588684082, -18.62274169921875, -17.658279418945312, -16.693815231323242, -15.729351997375488, -14.764888763427734, -13.800424575805664, -12.835962295532227, -11.871498107910156, -10.907034873962402, -9.942571640014648, -8.978108406066895, -8.01364517211914, -7.049181938171387, -6.084718227386475, -5.120254993438721, -4.155791759490967, -3.1913280487060547, -2.226864814758301, -1.262399673461914, -0.2979363203048706, 0.6665270328521729, 1.6309905052185059, 2.5954537391662598, 3.5599169731140137, 4.524380683898926, 5.48884391784668, 6.453307151794434, 7.4177703857421875, 8.382233619689941, 9.346696853637695, 10.311161041259766, 11.275623321533203, 12.240087509155273, 13.204550743103027, 14.169013977050781, 15.133477210998535, 16.09794044494629, 17.06240463256836, 18.026866912841797, 18.991331100463867, 19.955795288085938, 20.920257568359375, 21.884719848632812, 22.849184036254883, 23.81364631652832, 24.77811050415039, 25.742572784423828, 26.7070369720459, 27.67150115966797, 28.635963439941406, 29.600427627563477]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 0.0, 11.0, 3.0, 10.0, 12.0, 12.0, 14.0, 29.0, 38.0, 56.0, 77.0, 116.0, 174.0, 361.0, 1634.0, 117850.0, 4070201.0, 2565.0, 479.0, 206.0, 102.0, 81.0, 48.0, 51.0, 32.0, 23.0, 13.0, 15.0, 13.0, 8.0, 5.0, 9.0, 4.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1875, -6.00592041015625, -5.8243408203125, -5.64276123046875, -5.461181640625, -5.27960205078125, -5.0980224609375, -4.91644287109375, -4.73486328125, -4.55328369140625, -4.3717041015625, -4.19012451171875, -4.008544921875, -3.82696533203125, -3.6453857421875, -3.46380615234375, -3.2822265625, -3.10064697265625, -2.9190673828125, -2.73748779296875, -2.555908203125, -2.37432861328125, -2.1927490234375, -2.01116943359375, -1.82958984375, -1.64801025390625, -1.4664306640625, -1.28485107421875, -1.103271484375, -0.92169189453125, -0.7401123046875, -0.55853271484375, -0.376953125, -0.19537353515625, -0.0137939453125, 0.16778564453125, 0.349365234375, 0.53094482421875, 0.7125244140625, 0.89410400390625, 1.07568359375, 1.25726318359375, 1.4388427734375, 1.62042236328125, 1.802001953125, 1.98358154296875, 2.1651611328125, 2.34674072265625, 2.5283203125, 2.70989990234375, 2.8914794921875, 3.07305908203125, 3.254638671875, 3.43621826171875, 3.6177978515625, 3.79937744140625, 3.98095703125, 4.16253662109375, 4.3441162109375, 4.52569580078125, 4.707275390625, 4.88885498046875, 5.0704345703125, 5.25201416015625, 5.43359375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 10.0, 8.0, 13.0, 11.0, 19.0, 24.0, 32.0, 28.0, 57.0, 58.0, 54.0, 71.0, 77.0, 76.0, 62.0, 65.0, 62.0, 53.0, 38.0, 42.0, 34.0, 23.0, 12.0, 11.0, 12.0, 13.0, 6.0, 2.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.0563201904296875, -1.012054443359375, -0.9677886962890625, -0.92352294921875, -0.8792572021484375, -0.834991455078125, -0.7907257080078125, -0.7464599609375, -0.7021942138671875, -0.657928466796875, -0.6136627197265625, -0.56939697265625, -0.5251312255859375, -0.480865478515625, -0.4365997314453125, -0.392333984375, -0.3480682373046875, -0.303802490234375, -0.2595367431640625, -0.21527099609375, -0.1710052490234375, -0.126739501953125, -0.0824737548828125, -0.0382080078125, 0.0060577392578125, 0.050323486328125, 0.0945892333984375, 0.13885498046875, 0.1831207275390625, 0.227386474609375, 0.2716522216796875, 0.31591796875, 0.3601837158203125, 0.404449462890625, 0.4487152099609375, 0.49298095703125, 0.5372467041015625, 0.581512451171875, 0.6257781982421875, 0.6700439453125, 0.7143096923828125, 0.758575439453125, 0.8028411865234375, 0.84710693359375, 0.8913726806640625, 0.935638427734375, 0.9799041748046875, 1.024169921875, 1.0684356689453125, 1.112701416015625, 1.1569671630859375, 1.20123291015625, 1.2454986572265625, 1.289764404296875, 1.3340301513671875, 1.3782958984375, 1.4225616455078125, 1.466827392578125, 1.5110931396484375, 1.55535888671875, 1.5996246337890625, 1.643890380859375, 1.6881561279296875, 1.732421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 10.0, 10.0, 8.0, 22.0, 21.0, 17.0, 23.0, 19.0, 49.0, 57.0, 94.0, 111.0, 116.0, 192.0, 257.0, 292.0, 424.0, 533.0, 4475.0, 4184191.0, 1316.0, 501.0, 348.0, 293.0, 201.0, 174.0, 150.0, 100.0, 73.0, 52.0, 28.0, 29.0, 22.0, 18.0, 20.0, 12.0, 5.0, 7.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.28125, -14.83642578125, -14.3916015625, -13.94677734375, -13.501953125, -13.05712890625, -12.6123046875, -12.16748046875, -11.72265625, -11.27783203125, -10.8330078125, -10.38818359375, -9.943359375, -9.49853515625, -9.0537109375, -8.60888671875, -8.1640625, -7.71923828125, -7.2744140625, -6.82958984375, -6.384765625, -5.93994140625, -5.4951171875, -5.05029296875, -4.60546875, -4.16064453125, -3.7158203125, -3.27099609375, -2.826171875, -2.38134765625, -1.9365234375, -1.49169921875, -1.046875, -0.60205078125, -0.1572265625, 0.28759765625, 0.732421875, 1.17724609375, 1.6220703125, 2.06689453125, 2.51171875, 2.95654296875, 3.4013671875, 3.84619140625, 4.291015625, 4.73583984375, 5.1806640625, 5.62548828125, 6.0703125, 6.51513671875, 6.9599609375, 7.40478515625, 7.849609375, 8.29443359375, 8.7392578125, 9.18408203125, 9.62890625, 10.07373046875, 10.5185546875, 10.96337890625, 11.408203125, 11.85302734375, 12.2978515625, 12.74267578125, 13.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 49.0, 4028.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.875, -17.5048828125, -17.134765625, -16.7646484375, -16.39453125, -16.0244140625, -15.654296875, -15.2841796875, -14.9140625, -14.5439453125, -14.173828125, -13.8037109375, -13.43359375, -13.0634765625, -12.693359375, -12.3232421875, -11.953125, -11.5830078125, -11.212890625, -10.8427734375, -10.47265625, -10.1025390625, -9.732421875, -9.3623046875, -8.9921875, -8.6220703125, -8.251953125, -7.8818359375, -7.51171875, -7.1416015625, -6.771484375, -6.4013671875, -6.03125, -5.6611328125, -5.291015625, -4.9208984375, -4.55078125, -4.1806640625, -3.810546875, -3.4404296875, -3.0703125, -2.7001953125, -2.330078125, -1.9599609375, -1.58984375, -1.2197265625, -0.849609375, -0.4794921875, -0.109375, 0.2607421875, 0.630859375, 1.0009765625, 1.37109375, 1.7412109375, 2.111328125, 2.4814453125, 2.8515625, 3.2216796875, 3.591796875, 3.9619140625, 4.33203125, 4.7021484375, 5.072265625, 5.4423828125, 5.8125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 12.0, 68.0, 298.0, 470.0, 112.0, 29.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.91316223144531, -41.98273468017578, -41.052310943603516, -40.121883392333984, -39.19145584106445, -38.26103210449219, -37.330604553222656, -36.400177001953125, -35.46975326538086, -34.53932571411133, -33.60890197753906, -32.67847442626953, -31.748048782348633, -30.8176212310791, -29.887195587158203, -28.956768035888672, -28.02634048461914, -27.095914840698242, -26.16548728942871, -25.235061645507812, -24.304636001586914, -23.374208450317383, -22.443782806396484, -21.513355255126953, -20.582931518554688, -19.65250587463379, -18.722078323364258, -17.79165267944336, -16.86122703552246, -15.93079948425293, -15.000373840332031, -14.069947242736816, -13.139520645141602, -12.209094047546387, -11.278668403625488, -10.348241806030273, -9.417815208435059, -8.487388610839844, -7.556962966918945, -6.6265363693237305, -5.696110248565674, -4.765684127807617, -3.8352575302124023, -2.9048314094543457, -1.97440505027771, -1.0439786911010742, -0.11355257034301758, 0.8168740272521973, 1.747300148010254, 2.6777265071868896, 3.6081528663635254, 4.538578987121582, 5.469005584716797, 6.3994317054748535, 7.32985782623291, 8.260284423828125, 9.190710067749023, 10.121136665344238, 11.051562309265137, 11.981988906860352, 12.912415504455566, 13.842842102050781, 14.77326774597168, 15.703694343566895, 16.63412094116211]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 10.0, 21.0, 20.0, 44.0, 52.0, 113.0, 133.0, 134.0, 138.0, 120.0, 71.0, 39.0, 42.0, 24.0, 16.0, 6.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.127513885498047, -27.188119888305664, -26.24872589111328, -25.3093318939209, -24.369937896728516, -23.430545806884766, -22.49114990234375, -21.5517578125, -20.612363815307617, -19.672969818115234, -18.73357582092285, -17.79418182373047, -16.854787826538086, -15.91539478302002, -14.976000785827637, -14.03660774230957, -13.097212791442871, -12.157818794250488, -11.218424797058105, -10.279031753540039, -9.339637756347656, -8.400243759155273, -7.460849761962891, -6.521456241607666, -5.582062244415283, -4.6426682472229, -3.703274726867676, -2.763880729675293, -1.8244869709014893, -0.8850932121276855, 0.054300785064697266, 0.9936943054199219, 1.9330883026123047, 2.8724820613861084, 3.811875820159912, 4.751269817352295, 5.6906633377075195, 6.630057334899902, 7.569451332092285, 8.508844375610352, 9.448238372802734, 10.387632369995117, 11.3270263671875, 12.266420364379883, 13.20581340789795, 14.145207405090332, 15.084601402282715, 16.02399444580078, 16.963390350341797, 17.90278434753418, 18.842178344726562, 19.781572341918945, 20.720966339111328, 21.660358428955078, 22.599754333496094, 23.539146423339844, 24.478540420532227, 25.41793441772461, 26.357328414916992, 27.296722412109375, 28.236116409301758, 29.17551040649414, 30.11490249633789, 31.054296493530273, 31.993690490722656]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 9.0, 8.0, 21.0, 26.0, 56.0, 103.0, 144.0, 169.0, 348.0, 617.0, 1343.0, 3016.0, 8905.0, 35373.0, 239295.0, 638271.0, 93194.0, 18324.0, 5457.0, 1854.0, 842.0, 444.0, 285.0, 128.0, 112.0, 58.0, 32.0, 29.0, 13.0, 24.0, 10.0, 8.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.73828125, -2.6534423828125, -2.568603515625, -2.4837646484375, -2.39892578125, -2.3140869140625, -2.229248046875, -2.1444091796875, -2.0595703125, -1.9747314453125, -1.889892578125, -1.8050537109375, -1.72021484375, -1.6353759765625, -1.550537109375, -1.4656982421875, -1.380859375, -1.2960205078125, -1.211181640625, -1.1263427734375, -1.04150390625, -0.9566650390625, -0.871826171875, -0.7869873046875, -0.7021484375, -0.6173095703125, -0.532470703125, -0.4476318359375, -0.36279296875, -0.2779541015625, -0.193115234375, -0.1082763671875, -0.0234375, 0.0614013671875, 0.146240234375, 0.2310791015625, 0.31591796875, 0.4007568359375, 0.485595703125, 0.5704345703125, 0.6552734375, 0.7401123046875, 0.824951171875, 0.9097900390625, 0.99462890625, 1.0794677734375, 1.164306640625, 1.2491455078125, 1.333984375, 1.4188232421875, 1.503662109375, 1.5885009765625, 1.67333984375, 1.7581787109375, 1.843017578125, 1.9278564453125, 2.0126953125, 2.0975341796875, 2.182373046875, 2.2672119140625, 2.35205078125, 2.4368896484375, 2.521728515625, 2.6065673828125, 2.69140625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 11.0, 14.0, 12.0, 16.0, 23.0, 21.0, 26.0, 45.0, 59.0, 57.0, 84.0, 75.0, 72.0, 79.0, 75.0, 66.0, 64.0, 39.0, 38.0, 26.0, 17.0, 21.0, 20.0, 10.0, 7.0, 7.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.7158203125, -1.6540985107421875, -1.592376708984375, -1.5306549072265625, -1.46893310546875, -1.4072113037109375, -1.345489501953125, -1.2837677001953125, -1.2220458984375, -1.1603240966796875, -1.098602294921875, -1.0368804931640625, -0.97515869140625, -0.9134368896484375, -0.851715087890625, -0.7899932861328125, -0.728271484375, -0.6665496826171875, -0.604827880859375, -0.5431060791015625, -0.48138427734375, -0.4196624755859375, -0.357940673828125, -0.2962188720703125, -0.2344970703125, -0.1727752685546875, -0.111053466796875, -0.0493316650390625, 0.01239013671875, 0.0741119384765625, 0.135833740234375, 0.1975555419921875, 0.25927734375, 0.3209991455078125, 0.382720947265625, 0.4444427490234375, 0.50616455078125, 0.5678863525390625, 0.629608154296875, 0.6913299560546875, 0.7530517578125, 0.8147735595703125, 0.876495361328125, 0.9382171630859375, 0.99993896484375, 1.0616607666015625, 1.123382568359375, 1.1851043701171875, 1.246826171875, 1.3085479736328125, 1.370269775390625, 1.4319915771484375, 1.49371337890625, 1.5554351806640625, 1.617156982421875, 1.6788787841796875, 1.7406005859375, 1.8023223876953125, 1.864044189453125, 1.9257659912109375, 1.98748779296875, 2.0492095947265625, 2.110931396484375, 2.1726531982421875, 2.234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 16.0, 26.0, 40.0, 70.0, 133.0, 317.0, 977.0, 7524.0, 998629.0, 38187.0, 1731.0, 478.0, 187.0, 99.0, 58.0, 29.0, 15.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.7728271484375, -8.444091796875, -8.1153564453125, -7.78662109375, -7.4578857421875, -7.129150390625, -6.8004150390625, -6.4716796875, -6.1429443359375, -5.814208984375, -5.4854736328125, -5.15673828125, -4.8280029296875, -4.499267578125, -4.1705322265625, -3.841796875, -3.5130615234375, -3.184326171875, -2.8555908203125, -2.52685546875, -2.1981201171875, -1.869384765625, -1.5406494140625, -1.2119140625, -0.8831787109375, -0.554443359375, -0.2257080078125, 0.10302734375, 0.4317626953125, 0.760498046875, 1.0892333984375, 1.41796875, 1.7467041015625, 2.075439453125, 2.4041748046875, 2.73291015625, 3.0616455078125, 3.390380859375, 3.7191162109375, 4.0478515625, 4.3765869140625, 4.705322265625, 5.0340576171875, 5.36279296875, 5.6915283203125, 6.020263671875, 6.3489990234375, 6.677734375, 7.0064697265625, 7.335205078125, 7.6639404296875, 7.99267578125, 8.3214111328125, 8.650146484375, 8.9788818359375, 9.3076171875, 9.6363525390625, 9.965087890625, 10.2938232421875, 10.62255859375, 10.9512939453125, 11.280029296875, 11.6087646484375, 11.9375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 25.0, 58.0, 130.0, 184.0, 209.0, 165.0, 134.0, 50.0, 38.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.7099609375, -25.998046875, -25.2861328125, -24.57421875, -23.8623046875, -23.150390625, -22.4384765625, -21.7265625, -21.0146484375, -20.302734375, -19.5908203125, -18.87890625, -18.1669921875, -17.455078125, -16.7431640625, -16.03125, -15.3193359375, -14.607421875, -13.8955078125, -13.18359375, -12.4716796875, -11.759765625, -11.0478515625, -10.3359375, -9.6240234375, -8.912109375, -8.2001953125, -7.48828125, -6.7763671875, -6.064453125, -5.3525390625, -4.640625, -3.9287109375, -3.216796875, -2.5048828125, -1.79296875, -1.0810546875, -0.369140625, 0.3427734375, 1.0546875, 1.7666015625, 2.478515625, 3.1904296875, 3.90234375, 4.6142578125, 5.326171875, 6.0380859375, 6.75, 7.4619140625, 8.173828125, 8.8857421875, 9.59765625, 10.3095703125, 11.021484375, 11.7333984375, 12.4453125, 13.1572265625, 13.869140625, 14.5810546875, 15.29296875, 16.0048828125, 16.716796875, 17.4287109375, 18.140625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 12.0, 19.0, 31.0, 48.0, 138.0, 634.0, 8118.0, 1004681.0, 33353.0, 1136.0, 231.0, 73.0, 32.0, 22.0, 11.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.373046875, -3.2900848388671875, -3.207122802734375, -3.1241607666015625, -3.04119873046875, -2.9582366943359375, -2.875274658203125, -2.7923126220703125, -2.7093505859375, -2.6263885498046875, -2.543426513671875, -2.4604644775390625, -2.37750244140625, -2.2945404052734375, -2.211578369140625, -2.1286163330078125, -2.045654296875, -1.9626922607421875, -1.879730224609375, -1.7967681884765625, -1.71380615234375, -1.6308441162109375, -1.547882080078125, -1.4649200439453125, -1.3819580078125, -1.2989959716796875, -1.216033935546875, -1.1330718994140625, -1.05010986328125, -0.9671478271484375, -0.884185791015625, -0.8012237548828125, -0.71826171875, -0.6352996826171875, -0.552337646484375, -0.4693756103515625, -0.38641357421875, -0.3034515380859375, -0.220489501953125, -0.1375274658203125, -0.0545654296875, 0.0283966064453125, 0.111358642578125, 0.1943206787109375, 0.27728271484375, 0.3602447509765625, 0.443206787109375, 0.5261688232421875, 0.609130859375, 0.6920928955078125, 0.775054931640625, 0.8580169677734375, 0.94097900390625, 1.0239410400390625, 1.106903076171875, 1.1898651123046875, 1.2728271484375, 1.3557891845703125, 1.438751220703125, 1.5217132568359375, 1.60467529296875, 1.6876373291015625, 1.770599365234375, 1.8535614013671875, 1.9365234375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 5.0, 7.0, 9.0, 4.0, 12.0, 21.0, 15.0, 34.0, 74.0, 89.0, 124.0, 155.0, 140.0, 108.0, 61.0, 33.0, 40.0, 24.0, 10.0, 5.0, 5.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00016760826110839844, -0.00016263872385025024, -0.00015766918659210205, -0.00015269964933395386, -0.00014773011207580566, -0.00014276057481765747, -0.00013779103755950928, -0.00013282150030136108, -0.0001278519630432129, -0.0001228824257850647, -0.0001179128885269165, -0.00011294335126876831, -0.00010797381401062012, -0.00010300427675247192, -9.803473949432373e-05, -9.306520223617554e-05, -8.809566497802734e-05, -8.312612771987915e-05, -7.815659046173096e-05, -7.318705320358276e-05, -6.821751594543457e-05, -6.324797868728638e-05, -5.8278441429138184e-05, -5.330890417098999e-05, -4.83393669128418e-05, -4.3369829654693604e-05, -3.840029239654541e-05, -3.343075513839722e-05, -2.8461217880249023e-05, -2.349168062210083e-05, -1.8522143363952637e-05, -1.3552606105804443e-05, -8.58306884765625e-06, -3.6135315895080566e-06, 1.3560056686401367e-06, 6.32554292678833e-06, 1.1295080184936523e-05, 1.6264617443084717e-05, 2.123415470123291e-05, 2.6203691959381104e-05, 3.11732292175293e-05, 3.614276647567749e-05, 4.1112303733825684e-05, 4.608184099197388e-05, 5.105137825012207e-05, 5.6020915508270264e-05, 6.099045276641846e-05, 6.595999002456665e-05, 7.092952728271484e-05, 7.589906454086304e-05, 8.086860179901123e-05, 8.583813905715942e-05, 9.080767631530762e-05, 9.577721357345581e-05, 0.000100746750831604, 0.0001057162880897522, 0.00011068582534790039, 0.00011565536260604858, 0.00012062489986419678, 0.00012559443712234497, 0.00013056397438049316, 0.00013553351163864136, 0.00014050304889678955, 0.00014547258615493774, 0.00015044212341308594]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 15.0, 30.0, 83.0, 179.0, 656.0, 3816.0, 613488.0, 426061.0, 3285.0, 596.0, 175.0, 88.0, 26.0, 20.0, 11.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.27984619140625, -2.1983642578125, -2.11688232421875, -2.035400390625, -1.95391845703125, -1.8724365234375, -1.79095458984375, -1.70947265625, -1.62799072265625, -1.5465087890625, -1.46502685546875, -1.383544921875, -1.30206298828125, -1.2205810546875, -1.13909912109375, -1.0576171875, -0.97613525390625, -0.8946533203125, -0.81317138671875, -0.731689453125, -0.65020751953125, -0.5687255859375, -0.48724365234375, -0.40576171875, -0.32427978515625, -0.2427978515625, -0.16131591796875, -0.079833984375, 0.00164794921875, 0.0831298828125, 0.16461181640625, 0.24609375, 0.32757568359375, 0.4090576171875, 0.49053955078125, 0.572021484375, 0.65350341796875, 0.7349853515625, 0.81646728515625, 0.89794921875, 0.97943115234375, 1.0609130859375, 1.14239501953125, 1.223876953125, 1.30535888671875, 1.3868408203125, 1.46832275390625, 1.5498046875, 1.63128662109375, 1.7127685546875, 1.79425048828125, 1.875732421875, 1.95721435546875, 2.0386962890625, 2.12017822265625, 2.20166015625, 2.28314208984375, 2.3646240234375, 2.44610595703125, 2.527587890625, 2.60906982421875, 2.6905517578125, 2.77203369140625, 2.853515625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 11.0, 18.0, 36.0, 54.0, 113.0, 165.0, 191.0, 147.0, 112.0, 49.0, 42.0, 16.0, 11.0, 2.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.71844482421875, -1.6556396484375, -1.59283447265625, -1.530029296875, -1.46722412109375, -1.4044189453125, -1.34161376953125, -1.27880859375, -1.21600341796875, -1.1531982421875, -1.09039306640625, -1.027587890625, -0.96478271484375, -0.9019775390625, -0.83917236328125, -0.7763671875, -0.71356201171875, -0.6507568359375, -0.58795166015625, -0.525146484375, -0.46234130859375, -0.3995361328125, -0.33673095703125, -0.27392578125, -0.21112060546875, -0.1483154296875, -0.08551025390625, -0.022705078125, 0.04010009765625, 0.1029052734375, 0.16571044921875, 0.228515625, 0.29132080078125, 0.3541259765625, 0.41693115234375, 0.479736328125, 0.54254150390625, 0.6053466796875, 0.66815185546875, 0.73095703125, 0.79376220703125, 0.8565673828125, 0.91937255859375, 0.982177734375, 1.04498291015625, 1.1077880859375, 1.17059326171875, 1.2333984375, 1.29620361328125, 1.3590087890625, 1.42181396484375, 1.484619140625, 1.54742431640625, 1.6102294921875, 1.67303466796875, 1.73583984375, 1.79864501953125, 1.8614501953125, 1.92425537109375, 1.987060546875, 2.04986572265625, 2.1126708984375, 2.17547607421875, 2.23828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 18.0, 107.0, 753.0, 119.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.78337097167969, -70.28732299804688, -65.79127502441406, -61.29523468017578, -56.79918670654297, -52.303138732910156, -47.80709457397461, -43.31105041503906, -38.81500244140625, -34.31895446777344, -29.82291030883789, -25.32686424255371, -20.83081817626953, -16.33477210998535, -11.838726043701172, -7.342679977416992, -2.8466339111328125, 1.6494121551513672, 6.145458221435547, 10.641504287719727, 15.137550354003906, 19.633596420288086, 24.129642486572266, 28.625688552856445, 33.121734619140625, 37.61778259277344, 42.113826751708984, 46.60987091064453, 51.105918884277344, 55.601966857910156, 60.0980110168457, 64.59405517578125, 69.090087890625, 73.58613586425781, 78.08218383789062, 82.5782241821289, 87.07427215576172, 91.57032012939453, 96.06636047363281, 100.56240844726562, 105.05845642089844, 109.55450439453125, 114.05055236816406, 118.54659271240234, 123.04264068603516, 127.53868865966797, 132.03472900390625, 136.53077697753906, 141.02682495117188, 145.5228729248047, 150.0189208984375, 154.5149688720703, 159.01101684570312, 163.50704956054688, 168.0030975341797, 172.4991455078125, 176.9951934814453, 181.49124145507812, 185.98728942871094, 190.48333740234375, 194.9793701171875, 199.4754180908203, 203.97146606445312, 208.46751403808594, 212.96356201171875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 8.0, 11.0, 7.0, 15.0, 18.0, 21.0, 28.0, 21.0, 30.0, 32.0, 45.0, 53.0, 40.0, 66.0, 58.0, 71.0, 58.0, 55.0, 63.0, 48.0, 39.0, 40.0, 25.0, 36.0, 21.0, 16.0, 13.0, 8.0, 18.0, 9.0, 8.0, 6.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-50.520450592041016, -49.17686462402344, -47.833274841308594, -46.489688873291016, -45.14609909057617, -43.802513122558594, -42.45892333984375, -41.11533737182617, -39.771751403808594, -38.428165435791016, -37.08457565307617, -35.740989685058594, -34.39739990234375, -33.05381393432617, -31.71022605895996, -30.36663818359375, -29.023048400878906, -27.679460525512695, -26.335872650146484, -24.992286682128906, -23.648696899414062, -22.305110931396484, -20.961523056030273, -19.617935180664062, -18.27434730529785, -16.93075942993164, -15.58717155456543, -14.243584632873535, -12.899996757507324, -11.556408882141113, -10.212821960449219, -8.869234085083008, -7.525646209716797, -6.182058334350586, -4.838470935821533, -3.4948835372924805, -2.1512956619262695, -0.8077077865600586, 0.5358791351318359, 1.8794670104980469, 3.223054885864258, 4.566642761230469, 5.9102301597595215, 7.253817558288574, 8.597405433654785, 9.940993309020996, 11.28458023071289, 12.628168106079102, 13.971755981445312, 15.315343856811523, 16.658931732177734, 18.002517700195312, 19.346107482910156, 20.689693450927734, 22.033281326293945, 23.376869201660156, 24.720457077026367, 26.064044952392578, 27.40763282775879, 28.751220703125, 30.094806671142578, 31.438396453857422, 32.781982421875, 34.125572204589844, 35.46915817260742]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 9.0, 7.0, 7.0, 18.0, 25.0, 45.0, 43.0, 58.0, 95.0, 148.0, 195.0, 314.0, 494.0, 728.0, 1177.0, 2208.0, 3643.0, 6756.0, 14781.0, 50151.0, 485755.0, 3324148.0, 244677.0, 32269.0, 11684.0, 5870.0, 3406.0, 2046.0, 1159.0, 779.0, 485.0, 340.0, 206.0, 170.0, 99.0, 79.0, 44.0, 56.0, 25.0, 25.0, 17.0, 7.0, 6.0, 6.0, 4.0, 9.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.4462890625, -1.4029693603515625, -1.359649658203125, -1.3163299560546875, -1.27301025390625, -1.2296905517578125, -1.186370849609375, -1.1430511474609375, -1.0997314453125, -1.0564117431640625, -1.013092041015625, -0.9697723388671875, -0.92645263671875, -0.8831329345703125, -0.839813232421875, -0.7964935302734375, -0.753173828125, -0.7098541259765625, -0.666534423828125, -0.6232147216796875, -0.57989501953125, -0.5365753173828125, -0.493255615234375, -0.4499359130859375, -0.4066162109375, -0.3632965087890625, -0.319976806640625, -0.2766571044921875, -0.23333740234375, -0.1900177001953125, -0.146697998046875, -0.1033782958984375, -0.06005859375, -0.0167388916015625, 0.026580810546875, 0.0699005126953125, 0.11322021484375, 0.1565399169921875, 0.199859619140625, 0.2431793212890625, 0.2864990234375, 0.3298187255859375, 0.373138427734375, 0.4164581298828125, 0.45977783203125, 0.5030975341796875, 0.546417236328125, 0.5897369384765625, 0.633056640625, 0.6763763427734375, 0.719696044921875, 0.7630157470703125, 0.80633544921875, 0.8496551513671875, 0.892974853515625, 0.9362945556640625, 0.9796142578125, 1.0229339599609375, 1.066253662109375, 1.1095733642578125, 1.15289306640625, 1.1962127685546875, 1.239532470703125, 1.2828521728515625, 1.326171875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 8.0, 7.0, 9.0, 12.0, 14.0, 14.0, 18.0, 25.0, 20.0, 21.0, 40.0, 45.0, 35.0, 40.0, 55.0, 64.0, 49.0, 43.0, 51.0, 46.0, 46.0, 54.0, 40.0, 33.0, 28.0, 29.0, 27.0, 17.0, 18.0, 14.0, 12.0, 12.0, 8.0, 5.0, 6.0, 3.0, 4.0, 3.0, 4.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0771484375, -1.04193115234375, -1.0067138671875, -0.97149658203125, -0.936279296875, -0.90106201171875, -0.8658447265625, -0.83062744140625, -0.79541015625, -0.76019287109375, -0.7249755859375, -0.68975830078125, -0.654541015625, -0.61932373046875, -0.5841064453125, -0.54888916015625, -0.513671875, -0.47845458984375, -0.4432373046875, -0.40802001953125, -0.372802734375, -0.33758544921875, -0.3023681640625, -0.26715087890625, -0.23193359375, -0.19671630859375, -0.1614990234375, -0.12628173828125, -0.091064453125, -0.05584716796875, -0.0206298828125, 0.01458740234375, 0.0498046875, 0.08502197265625, 0.1202392578125, 0.15545654296875, 0.190673828125, 0.22589111328125, 0.2611083984375, 0.29632568359375, 0.33154296875, 0.36676025390625, 0.4019775390625, 0.43719482421875, 0.472412109375, 0.50762939453125, 0.5428466796875, 0.57806396484375, 0.61328125, 0.64849853515625, 0.6837158203125, 0.71893310546875, 0.754150390625, 0.78936767578125, 0.8245849609375, 0.85980224609375, 0.89501953125, 0.93023681640625, 0.9654541015625, 1.00067138671875, 1.035888671875, 1.07110595703125, 1.1063232421875, 1.14154052734375, 1.1767578125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 6.0, 7.0, 10.0, 15.0, 20.0, 42.0, 61.0, 120.0, 193.0, 358.0, 1086.0, 5077.0, 47949.0, 4055045.0, 76053.0, 6036.0, 1191.0, 426.0, 209.0, 140.0, 73.0, 47.0, 31.0, 17.0, 15.0, 5.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.04296875, -4.9122314453125, -4.781494140625, -4.6507568359375, -4.52001953125, -4.3892822265625, -4.258544921875, -4.1278076171875, -3.9970703125, -3.8663330078125, -3.735595703125, -3.6048583984375, -3.47412109375, -3.3433837890625, -3.212646484375, -3.0819091796875, -2.951171875, -2.8204345703125, -2.689697265625, -2.5589599609375, -2.42822265625, -2.2974853515625, -2.166748046875, -2.0360107421875, -1.9052734375, -1.7745361328125, -1.643798828125, -1.5130615234375, -1.38232421875, -1.2515869140625, -1.120849609375, -0.9901123046875, -0.859375, -0.7286376953125, -0.597900390625, -0.4671630859375, -0.33642578125, -0.2056884765625, -0.074951171875, 0.0557861328125, 0.1865234375, 0.3172607421875, 0.447998046875, 0.5787353515625, 0.70947265625, 0.8402099609375, 0.970947265625, 1.1016845703125, 1.232421875, 1.3631591796875, 1.493896484375, 1.6246337890625, 1.75537109375, 1.8861083984375, 2.016845703125, 2.1475830078125, 2.2783203125, 2.4090576171875, 2.539794921875, 2.6705322265625, 2.80126953125, 2.9320068359375, 3.062744140625, 3.1934814453125, 3.32421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 5.0, 10.0, 9.0, 18.0, 12.0, 18.0, 27.0, 60.0, 112.0, 636.0, 2369.0, 566.0, 105.0, 48.0, 31.0, 17.0, 10.0, 6.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.982421875, -2.843597412109375, -2.70477294921875, -2.565948486328125, -2.4271240234375, -2.288299560546875, -2.14947509765625, -2.010650634765625, -1.871826171875, -1.733001708984375, -1.59417724609375, -1.455352783203125, -1.3165283203125, -1.177703857421875, -1.03887939453125, -0.900054931640625, -0.76123046875, -0.622406005859375, -0.48358154296875, -0.344757080078125, -0.2059326171875, -0.067108154296875, 0.07171630859375, 0.210540771484375, 0.349365234375, 0.488189697265625, 0.62701416015625, 0.765838623046875, 0.9046630859375, 1.043487548828125, 1.18231201171875, 1.321136474609375, 1.4599609375, 1.598785400390625, 1.73760986328125, 1.876434326171875, 2.0152587890625, 2.154083251953125, 2.29290771484375, 2.431732177734375, 2.570556640625, 2.709381103515625, 2.84820556640625, 2.987030029296875, 3.1258544921875, 3.264678955078125, 3.40350341796875, 3.542327880859375, 3.68115234375, 3.819976806640625, 3.95880126953125, 4.097625732421875, 4.2364501953125, 4.375274658203125, 4.51409912109375, 4.652923583984375, 4.791748046875, 4.930572509765625, 5.06939697265625, 5.208221435546875, 5.3470458984375, 5.485870361328125, 5.62469482421875, 5.763519287109375, 5.90234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 23.0, 133.0, 540.0, 230.0, 36.0, 19.0, 8.0, 3.0, 2.0, 8.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.58734130859375, -39.060829162597656, -37.53431701660156, -36.007808685302734, -34.48129653930664, -32.95478439331055, -31.428274154663086, -29.901763916015625, -28.37525177001953, -26.848739624023438, -25.322229385375977, -23.795719146728516, -22.269207000732422, -20.742694854736328, -19.216184616088867, -17.689674377441406, -16.163162231445312, -14.636651039123535, -13.110139846801758, -11.58362865447998, -10.057117462158203, -8.530606269836426, -7.004095077514648, -5.477583885192871, -3.9510726928710938, -2.4245615005493164, -0.8980503082275391, 0.6284608840942383, 2.1549720764160156, 3.681483268737793, 5.20799446105957, 6.734505653381348, 8.26102066040039, 9.787531852722168, 11.314043045043945, 12.840554237365723, 14.3670654296875, 15.893576622009277, 17.420087814331055, 18.946598052978516, 20.47311019897461, 21.999622344970703, 23.526132583618164, 25.052642822265625, 26.57915496826172, 28.105667114257812, 29.632177352905273, 31.158687591552734, 32.68519973754883, 34.21171188354492, 35.73822021484375, 37.264732360839844, 38.79124450683594, 40.31775665283203, 41.844268798828125, 43.37077713012695, 44.89728927612305, 46.42380142211914, 47.95030975341797, 49.47682189941406, 51.003334045410156, 52.52984619140625, 54.056358337402344, 55.58286666870117, 57.109378814697266]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 5.0, 4.0, 10.0, 14.0, 16.0, 29.0, 33.0, 48.0, 66.0, 65.0, 84.0, 69.0, 88.0, 96.0, 81.0, 49.0, 62.0, 41.0, 33.0, 33.0, 24.0, 18.0, 11.0, 9.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.377717971801758, -13.735590934753418, -13.093464851379395, -12.451337814331055, -11.809211730957031, -11.167084693908691, -10.524957656860352, -9.882831573486328, -9.240704536437988, -8.598577499389648, -7.956451416015625, -7.314324378967285, -6.6721978187561035, -6.030071258544922, -5.387944221496582, -4.7458176612854, -4.103691101074219, -3.461564540863037, -2.8194377422332764, -2.1773109436035156, -1.535184383392334, -0.8930578231811523, -0.2509310245513916, 0.39119577407836914, 1.0333223342895508, 1.675449013710022, 2.317575693130493, 2.959702491760254, 3.6018290519714355, 4.243955612182617, 4.886082649230957, 5.528209209442139, 6.1703338623046875, 6.812460422515869, 7.454586982727051, 8.09671401977539, 8.738840103149414, 9.380967140197754, 10.023094177246094, 10.665220260620117, 11.307347297668457, 11.949474334716797, 12.59160041809082, 13.23372745513916, 13.8758544921875, 14.517980575561523, 15.160107612609863, 15.802234649658203, 16.444360733032227, 17.08648681640625, 17.728614807128906, 18.37074089050293, 19.012866973876953, 19.65499496459961, 20.297121047973633, 20.939247131347656, 21.581375122070312, 22.223501205444336, 22.865629196166992, 23.507755279541016, 24.14988136291504, 24.792007446289062, 25.43413543701172, 26.076261520385742, 26.718387603759766]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 12.0, 18.0, 21.0, 34.0, 36.0, 44.0, 86.0, 123.0, 171.0, 252.0, 345.0, 509.0, 795.0, 1211.0, 1866.0, 2870.0, 4895.0, 8168.0, 14887.0, 28202.0, 58035.0, 130537.0, 285825.0, 272034.0, 121561.0, 54567.0, 26841.0, 14160.0, 7903.0, 4671.0, 2736.0, 1731.0, 1089.0, 752.0, 516.0, 318.0, 209.0, 166.0, 117.0, 67.0, 58.0, 34.0, 21.0, 23.0, 11.0, 10.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.845703125, -0.816497802734375, -0.78729248046875, -0.758087158203125, -0.7288818359375, -0.699676513671875, -0.67047119140625, -0.641265869140625, -0.612060546875, -0.582855224609375, -0.55364990234375, -0.524444580078125, -0.4952392578125, -0.466033935546875, -0.43682861328125, -0.407623291015625, -0.37841796875, -0.349212646484375, -0.32000732421875, -0.290802001953125, -0.2615966796875, -0.232391357421875, -0.20318603515625, -0.173980712890625, -0.144775390625, -0.115570068359375, -0.08636474609375, -0.057159423828125, -0.0279541015625, 0.001251220703125, 0.03045654296875, 0.059661865234375, 0.0888671875, 0.118072509765625, 0.14727783203125, 0.176483154296875, 0.2056884765625, 0.234893798828125, 0.26409912109375, 0.293304443359375, 0.322509765625, 0.351715087890625, 0.38092041015625, 0.410125732421875, 0.4393310546875, 0.468536376953125, 0.49774169921875, 0.526947021484375, 0.55615234375, 0.585357666015625, 0.61456298828125, 0.643768310546875, 0.6729736328125, 0.702178955078125, 0.73138427734375, 0.760589599609375, 0.789794921875, 0.819000244140625, 0.84820556640625, 0.877410888671875, 0.9066162109375, 0.935821533203125, 0.96502685546875, 0.994232177734375, 1.0234375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 8.0, 5.0, 11.0, 15.0, 16.0, 17.0, 15.0, 20.0, 20.0, 24.0, 25.0, 38.0, 33.0, 36.0, 52.0, 54.0, 51.0, 49.0, 51.0, 48.0, 58.0, 47.0, 49.0, 36.0, 35.0, 28.0, 29.0, 18.0, 17.0, 17.0, 14.0, 13.0, 7.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.978515625, -0.9448394775390625, -0.911163330078125, -0.8774871826171875, -0.84381103515625, -0.8101348876953125, -0.776458740234375, -0.7427825927734375, -0.7091064453125, -0.6754302978515625, -0.641754150390625, -0.6080780029296875, -0.57440185546875, -0.5407257080078125, -0.507049560546875, -0.4733734130859375, -0.439697265625, -0.4060211181640625, -0.372344970703125, -0.3386688232421875, -0.30499267578125, -0.2713165283203125, -0.237640380859375, -0.2039642333984375, -0.1702880859375, -0.1366119384765625, -0.102935791015625, -0.0692596435546875, -0.03558349609375, -0.0019073486328125, 0.031768798828125, 0.0654449462890625, 0.09912109375, 0.1327972412109375, 0.166473388671875, 0.2001495361328125, 0.23382568359375, 0.2675018310546875, 0.301177978515625, 0.3348541259765625, 0.3685302734375, 0.4022064208984375, 0.435882568359375, 0.4695587158203125, 0.50323486328125, 0.5369110107421875, 0.570587158203125, 0.6042633056640625, 0.637939453125, 0.6716156005859375, 0.705291748046875, 0.7389678955078125, 0.77264404296875, 0.8063201904296875, 0.839996337890625, 0.8736724853515625, 0.9073486328125, 0.9410247802734375, 0.974700927734375, 1.0083770751953125, 1.04205322265625, 1.0757293701171875, 1.109405517578125, 1.1430816650390625, 1.1767578125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 7.0, 12.0, 9.0, 18.0, 31.0, 36.0, 61.0, 65.0, 88.0, 133.0, 186.0, 272.0, 479.0, 756.0, 1482.0, 3920.0, 17371.0, 204722.0, 754002.0, 52176.0, 7832.0, 2362.0, 1013.0, 540.0, 291.0, 197.0, 120.0, 112.0, 80.0, 35.0, 38.0, 17.0, 25.0, 19.0, 9.0, 12.0, 4.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.36328125, -3.26214599609375, -3.1610107421875, -3.05987548828125, -2.958740234375, -2.85760498046875, -2.7564697265625, -2.65533447265625, -2.55419921875, -2.45306396484375, -2.3519287109375, -2.25079345703125, -2.149658203125, -2.04852294921875, -1.9473876953125, -1.84625244140625, -1.7451171875, -1.64398193359375, -1.5428466796875, -1.44171142578125, -1.340576171875, -1.23944091796875, -1.1383056640625, -1.03717041015625, -0.93603515625, -0.83489990234375, -0.7337646484375, -0.63262939453125, -0.531494140625, -0.43035888671875, -0.3292236328125, -0.22808837890625, -0.126953125, -0.02581787109375, 0.0753173828125, 0.17645263671875, 0.277587890625, 0.37872314453125, 0.4798583984375, 0.58099365234375, 0.68212890625, 0.78326416015625, 0.8843994140625, 0.98553466796875, 1.086669921875, 1.18780517578125, 1.2889404296875, 1.39007568359375, 1.4912109375, 1.59234619140625, 1.6934814453125, 1.79461669921875, 1.895751953125, 1.99688720703125, 2.0980224609375, 2.19915771484375, 2.30029296875, 2.40142822265625, 2.5025634765625, 2.60369873046875, 2.704833984375, 2.80596923828125, 2.9071044921875, 3.00823974609375, 3.109375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 6.0, 14.0, 4.0, 7.0, 14.0, 18.0, 23.0, 29.0, 24.0, 25.0, 29.0, 33.0, 37.0, 48.0, 41.0, 34.0, 37.0, 58.0, 52.0, 50.0, 51.0, 50.0, 41.0, 38.0, 40.0, 34.0, 14.0, 23.0, 24.0, 16.0, 18.0, 11.0, 7.0, 11.0, 14.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.640625, -4.48724365234375, -4.3338623046875, -4.18048095703125, -4.027099609375, -3.87371826171875, -3.7203369140625, -3.56695556640625, -3.41357421875, -3.26019287109375, -3.1068115234375, -2.95343017578125, -2.800048828125, -2.64666748046875, -2.4932861328125, -2.33990478515625, -2.1865234375, -2.03314208984375, -1.8797607421875, -1.72637939453125, -1.572998046875, -1.41961669921875, -1.2662353515625, -1.11285400390625, -0.95947265625, -0.80609130859375, -0.6527099609375, -0.49932861328125, -0.345947265625, -0.19256591796875, -0.0391845703125, 0.11419677734375, 0.267578125, 0.42095947265625, 0.5743408203125, 0.72772216796875, 0.881103515625, 1.03448486328125, 1.1878662109375, 1.34124755859375, 1.49462890625, 1.64801025390625, 1.8013916015625, 1.95477294921875, 2.108154296875, 2.26153564453125, 2.4149169921875, 2.56829833984375, 2.7216796875, 2.87506103515625, 3.0284423828125, 3.18182373046875, 3.335205078125, 3.48858642578125, 3.6419677734375, 3.79534912109375, 3.94873046875, 4.10211181640625, 4.2554931640625, 4.40887451171875, 4.562255859375, 4.71563720703125, 4.8690185546875, 5.02239990234375, 5.17578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 12.0, 16.0, 32.0, 39.0, 49.0, 102.0, 178.0, 290.0, 617.0, 1434.0, 4582.0, 28649.0, 889870.0, 110337.0, 8299.0, 2187.0, 863.0, 393.0, 196.0, 132.0, 66.0, 53.0, 33.0, 26.0, 18.0, 16.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-1.525390625, -1.48382568359375, -1.4422607421875, -1.40069580078125, -1.359130859375, -1.31756591796875, -1.2760009765625, -1.23443603515625, -1.19287109375, -1.15130615234375, -1.1097412109375, -1.06817626953125, -1.026611328125, -0.98504638671875, -0.9434814453125, -0.90191650390625, -0.8603515625, -0.81878662109375, -0.7772216796875, -0.73565673828125, -0.694091796875, -0.65252685546875, -0.6109619140625, -0.56939697265625, -0.52783203125, -0.48626708984375, -0.4447021484375, -0.40313720703125, -0.361572265625, -0.32000732421875, -0.2784423828125, -0.23687744140625, -0.1953125, -0.15374755859375, -0.1121826171875, -0.07061767578125, -0.029052734375, 0.01251220703125, 0.0540771484375, 0.09564208984375, 0.13720703125, 0.17877197265625, 0.2203369140625, 0.26190185546875, 0.303466796875, 0.34503173828125, 0.3865966796875, 0.42816162109375, 0.4697265625, 0.51129150390625, 0.5528564453125, 0.59442138671875, 0.635986328125, 0.67755126953125, 0.7191162109375, 0.76068115234375, 0.80224609375, 0.84381103515625, 0.8853759765625, 0.92694091796875, 0.968505859375, 1.01007080078125, 1.0516357421875, 1.09320068359375, 1.134765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 9.0, 12.0, 13.0, 33.0, 47.0, 80.0, 94.0, 154.0, 149.0, 151.0, 86.0, 61.0, 39.0, 23.0, 13.0, 4.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018656253814697266, -0.00018095038831233978, -0.0001753382384777069, -0.00016972608864307404, -0.00016411393880844116, -0.0001585017889738083, -0.00015288963913917542, -0.00014727748930454254, -0.00014166533946990967, -0.0001360531896352768, -0.00013044103980064392, -0.00012482888996601105, -0.00011921674013137817, -0.0001136045902967453, -0.00010799244046211243, -0.00010238029062747955, -9.676814079284668e-05, -9.11559909582138e-05, -8.554384112358093e-05, -7.993169128894806e-05, -7.431954145431519e-05, -6.870739161968231e-05, -6.309524178504944e-05, -5.7483091950416565e-05, -5.187094211578369e-05, -4.625879228115082e-05, -4.0646642446517944e-05, -3.503449261188507e-05, -2.9422342777252197e-05, -2.3810192942619324e-05, -1.819804310798645e-05, -1.2585893273353577e-05, -6.973743438720703e-06, -1.3615936040878296e-06, 4.250556230545044e-06, 9.862706065177917e-06, 1.547485589981079e-05, 2.1087005734443665e-05, 2.6699155569076538e-05, 3.231130540370941e-05, 3.7923455238342285e-05, 4.353560507297516e-05, 4.914775490760803e-05, 5.4759904742240906e-05, 6.037205457687378e-05, 6.598420441150665e-05, 7.159635424613953e-05, 7.72085040807724e-05, 8.282065391540527e-05, 8.843280375003815e-05, 9.404495358467102e-05, 9.96571034193039e-05, 0.00010526925325393677, 0.00011088140308856964, 0.00011649355292320251, 0.0001221057027578354, 0.00012771785259246826, 0.00013333000242710114, 0.000138942152261734, 0.00014455430209636688, 0.00015016645193099976, 0.00015577860176563263, 0.0001613907516002655, 0.00016700290143489838, 0.00017261505126953125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 10.0, 6.0, 12.0, 19.0, 24.0, 32.0, 63.0, 70.0, 127.0, 242.0, 482.0, 1211.0, 4527.0, 37564.0, 930250.0, 65709.0, 5564.0, 1415.0, 525.0, 269.0, 141.0, 80.0, 61.0, 50.0, 22.0, 19.0, 14.0, 5.0, 11.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.166015625, -1.1237335205078125, -1.081451416015625, -1.0391693115234375, -0.99688720703125, -0.9546051025390625, -0.912322998046875, -0.8700408935546875, -0.8277587890625, -0.7854766845703125, -0.743194580078125, -0.7009124755859375, -0.65863037109375, -0.6163482666015625, -0.574066162109375, -0.5317840576171875, -0.489501953125, -0.4472198486328125, -0.404937744140625, -0.3626556396484375, -0.32037353515625, -0.2780914306640625, -0.235809326171875, -0.1935272216796875, -0.1512451171875, -0.1089630126953125, -0.066680908203125, -0.0243988037109375, 0.01788330078125, 0.0601654052734375, 0.102447509765625, 0.1447296142578125, 0.18701171875, 0.2292938232421875, 0.271575927734375, 0.3138580322265625, 0.35614013671875, 0.3984222412109375, 0.440704345703125, 0.4829864501953125, 0.5252685546875, 0.5675506591796875, 0.609832763671875, 0.6521148681640625, 0.69439697265625, 0.7366790771484375, 0.778961181640625, 0.8212432861328125, 0.863525390625, 0.9058074951171875, 0.948089599609375, 0.9903717041015625, 1.03265380859375, 1.0749359130859375, 1.117218017578125, 1.1595001220703125, 1.2017822265625, 1.2440643310546875, 1.286346435546875, 1.3286285400390625, 1.37091064453125, 1.4131927490234375, 1.455474853515625, 1.4977569580078125, 1.5400390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 13.0, 14.0, 17.0, 29.0, 25.0, 65.0, 73.0, 86.0, 112.0, 103.0, 92.0, 80.0, 62.0, 59.0, 36.0, 28.0, 18.0, 17.0, 17.0, 12.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.9933319091796875, -0.956390380859375, -0.9194488525390625, -0.88250732421875, -0.8455657958984375, -0.808624267578125, -0.7716827392578125, -0.7347412109375, -0.6977996826171875, -0.660858154296875, -0.6239166259765625, -0.58697509765625, -0.5500335693359375, -0.513092041015625, -0.4761505126953125, -0.439208984375, -0.4022674560546875, -0.365325927734375, -0.3283843994140625, -0.29144287109375, -0.2545013427734375, -0.217559814453125, -0.1806182861328125, -0.1436767578125, -0.1067352294921875, -0.069793701171875, -0.0328521728515625, 0.00408935546875, 0.0410308837890625, 0.077972412109375, 0.1149139404296875, 0.15185546875, 0.1887969970703125, 0.225738525390625, 0.2626800537109375, 0.29962158203125, 0.3365631103515625, 0.373504638671875, 0.4104461669921875, 0.4473876953125, 0.4843292236328125, 0.521270751953125, 0.5582122802734375, 0.59515380859375, 0.6320953369140625, 0.669036865234375, 0.7059783935546875, 0.742919921875, 0.7798614501953125, 0.816802978515625, 0.8537445068359375, 0.89068603515625, 0.9276275634765625, 0.964569091796875, 1.0015106201171875, 1.0384521484375, 1.0753936767578125, 1.112335205078125, 1.1492767333984375, 1.18621826171875, 1.2231597900390625, 1.260101318359375, 1.2970428466796875, 1.333984375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 31.0, 335.0, 548.0, 59.0, 21.0, 10.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.13204956054688, -114.79032897949219, -112.4486083984375, -110.10688018798828, -107.7651596069336, -105.4234390258789, -103.08171081542969, -100.739990234375, -98.39826965332031, -96.05654907226562, -93.71482849121094, -91.37310028076172, -89.03137969970703, -86.68965911865234, -84.34793090820312, -82.00621032714844, -79.66448974609375, -77.32276916503906, -74.98104858398438, -72.63932037353516, -70.29759979248047, -67.95587921142578, -65.61415100097656, -63.272430419921875, -60.93070983886719, -58.5889892578125, -56.24726486206055, -53.905540466308594, -51.563819885253906, -49.22209930419922, -46.880374908447266, -44.53865051269531, -42.19693374633789, -39.85520935058594, -37.51348876953125, -35.17176818847656, -32.83004379272461, -30.48832130432129, -28.14659881591797, -25.80487632751465, -23.463153839111328, -21.121431350708008, -18.779708862304688, -16.437986373901367, -14.096263885498047, -11.754541397094727, -9.412818908691406, -7.071096420288086, -4.729373931884766, -2.3876514434814453, -0.045928955078125, 2.2957935333251953, 4.637516021728516, 6.979238510131836, 9.320960998535156, 11.662683486938477, 14.004405975341797, 16.346128463745117, 18.687850952148438, 21.029573440551758, 23.371295928955078, 25.7130184173584, 28.05474090576172, 30.39646339416504, 32.73818588256836]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 2.0, 8.0, 1.0, 8.0, 6.0, 14.0, 17.0, 17.0, 22.0, 14.0, 34.0, 23.0, 37.0, 40.0, 36.0, 40.0, 50.0, 48.0, 55.0, 60.0, 67.0, 64.0, 32.0, 57.0, 30.0, 28.0, 40.0, 28.0, 21.0, 17.0, 17.0, 11.0, 14.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.88896942138672, -17.256256103515625, -16.62354278564453, -15.990830421447754, -15.35811710357666, -14.725403785705566, -14.092691421508789, -13.459978103637695, -12.827264785766602, -12.194551467895508, -11.561838150024414, -10.929125785827637, -10.296412467956543, -9.66369915008545, -9.030986785888672, -8.398273468017578, -7.765560150146484, -7.132846832275391, -6.500133991241455, -5.8674211502075195, -5.234707832336426, -4.601994514465332, -3.9692816734313965, -3.336568832397461, -2.703855514526367, -2.0711424350738525, -1.438429355621338, -0.8057162761688232, -0.1730031967163086, 0.45970988273620605, 1.0924229621887207, 1.7251358032226562, 2.35784912109375, 2.9905622005462646, 3.6232752799987793, 4.255988121032715, 4.888701438903809, 5.521414756774902, 6.154127597808838, 6.786840438842773, 7.419553756713867, 8.052267074584961, 8.684980392456055, 9.317692756652832, 9.950406074523926, 10.58311939239502, 11.215831756591797, 11.84854507446289, 12.481258392333984, 13.113971710205078, 13.746685028076172, 14.37939739227295, 15.012110710144043, 15.644824028015137, 16.277536392211914, 16.910249710083008, 17.5429630279541, 18.175676345825195, 18.80838966369629, 19.441102981567383, 20.073814392089844, 20.706527709960938, 21.33924102783203, 21.971954345703125, 22.60466766357422]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 7.0, 4.0, 4.0, 8.0, 16.0, 21.0, 21.0, 16.0, 42.0, 61.0, 81.0, 174.0, 286.0, 884.0, 5830.0, 597190.0, 3579801.0, 7788.0, 1095.0, 353.0, 187.0, 112.0, 75.0, 65.0, 40.0, 34.0, 20.0, 13.0, 9.0, 15.0, 8.0, 3.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.98046875, -4.849761962890625, -4.71905517578125, -4.588348388671875, -4.4576416015625, -4.326934814453125, -4.19622802734375, -4.065521240234375, -3.934814453125, -3.804107666015625, -3.67340087890625, -3.542694091796875, -3.4119873046875, -3.281280517578125, -3.15057373046875, -3.019866943359375, -2.88916015625, -2.758453369140625, -2.62774658203125, -2.497039794921875, -2.3663330078125, -2.235626220703125, -2.10491943359375, -1.974212646484375, -1.843505859375, -1.712799072265625, -1.58209228515625, -1.451385498046875, -1.3206787109375, -1.189971923828125, -1.05926513671875, -0.928558349609375, -0.7978515625, -0.667144775390625, -0.53643798828125, -0.405731201171875, -0.2750244140625, -0.144317626953125, -0.01361083984375, 0.117095947265625, 0.247802734375, 0.378509521484375, 0.50921630859375, 0.639923095703125, 0.7706298828125, 0.901336669921875, 1.03204345703125, 1.162750244140625, 1.29345703125, 1.424163818359375, 1.55487060546875, 1.685577392578125, 1.8162841796875, 1.946990966796875, 2.07769775390625, 2.208404541015625, 2.339111328125, 2.469818115234375, 2.60052490234375, 2.731231689453125, 2.8619384765625, 2.992645263671875, 3.12335205078125, 3.254058837890625, 3.384765625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 12.0, 6.0, 16.0, 20.0, 34.0, 49.0, 76.0, 70.0, 84.0, 103.0, 93.0, 106.0, 83.0, 65.0, 59.0, 39.0, 36.0, 23.0, 15.0, 12.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40625, -1.340545654296875, -1.27484130859375, -1.209136962890625, -1.1434326171875, -1.077728271484375, -1.01202392578125, -0.946319580078125, -0.880615234375, -0.814910888671875, -0.74920654296875, -0.683502197265625, -0.6177978515625, -0.552093505859375, -0.48638916015625, -0.420684814453125, -0.35498046875, -0.289276123046875, -0.22357177734375, -0.157867431640625, -0.0921630859375, -0.026458740234375, 0.03924560546875, 0.104949951171875, 0.170654296875, 0.236358642578125, 0.30206298828125, 0.367767333984375, 0.4334716796875, 0.499176025390625, 0.56488037109375, 0.630584716796875, 0.6962890625, 0.761993408203125, 0.82769775390625, 0.893402099609375, 0.9591064453125, 1.024810791015625, 1.09051513671875, 1.156219482421875, 1.221923828125, 1.287628173828125, 1.35333251953125, 1.419036865234375, 1.4847412109375, 1.550445556640625, 1.61614990234375, 1.681854248046875, 1.74755859375, 1.813262939453125, 1.87896728515625, 1.944671630859375, 2.0103759765625, 2.076080322265625, 2.14178466796875, 2.207489013671875, 2.273193359375, 2.338897705078125, 2.40460205078125, 2.470306396484375, 2.5360107421875, 2.601715087890625, 2.66741943359375, 2.733123779296875, 2.798828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 21.0, 33.0, 61.0, 95.0, 160.0, 318.0, 1345.0, 10163.0, 695394.0, 3470816.0, 13274.0, 1591.0, 394.0, 191.0, 164.0, 101.0, 76.0, 36.0, 19.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.0828857421875, -2.954833984375, -2.8267822265625, -2.69873046875, -2.5706787109375, -2.442626953125, -2.3145751953125, -2.1865234375, -2.0584716796875, -1.930419921875, -1.8023681640625, -1.67431640625, -1.5462646484375, -1.418212890625, -1.2901611328125, -1.162109375, -1.0340576171875, -0.906005859375, -0.7779541015625, -0.64990234375, -0.5218505859375, -0.393798828125, -0.2657470703125, -0.1376953125, -0.0096435546875, 0.118408203125, 0.2464599609375, 0.37451171875, 0.5025634765625, 0.630615234375, 0.7586669921875, 0.88671875, 1.0147705078125, 1.142822265625, 1.2708740234375, 1.39892578125, 1.5269775390625, 1.655029296875, 1.7830810546875, 1.9111328125, 2.0391845703125, 2.167236328125, 2.2952880859375, 2.42333984375, 2.5513916015625, 2.679443359375, 2.8074951171875, 2.935546875, 3.0635986328125, 3.191650390625, 3.3197021484375, 3.44775390625, 3.5758056640625, 3.703857421875, 3.8319091796875, 3.9599609375, 4.0880126953125, 4.216064453125, 4.3441162109375, 4.47216796875, 4.6002197265625, 4.728271484375, 4.8563232421875, 4.984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 13.0, 24.0, 32.0, 71.0, 310.0, 1831.0, 1479.0, 180.0, 50.0, 25.0, 21.0, 4.0, 7.0, 10.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9365234375, -1.8147735595703125, -1.693023681640625, -1.5712738037109375, -1.44952392578125, -1.3277740478515625, -1.206024169921875, -1.0842742919921875, -0.9625244140625, -0.8407745361328125, -0.719024658203125, -0.5972747802734375, -0.47552490234375, -0.3537750244140625, -0.232025146484375, -0.1102752685546875, 0.011474609375, 0.1332244873046875, 0.254974365234375, 0.3767242431640625, 0.49847412109375, 0.6202239990234375, 0.741973876953125, 0.8637237548828125, 0.9854736328125, 1.1072235107421875, 1.228973388671875, 1.3507232666015625, 1.47247314453125, 1.5942230224609375, 1.715972900390625, 1.8377227783203125, 1.95947265625, 2.0812225341796875, 2.202972412109375, 2.3247222900390625, 2.44647216796875, 2.5682220458984375, 2.689971923828125, 2.8117218017578125, 2.9334716796875, 3.0552215576171875, 3.176971435546875, 3.2987213134765625, 3.42047119140625, 3.5422210693359375, 3.663970947265625, 3.7857208251953125, 3.907470703125, 4.0292205810546875, 4.150970458984375, 4.2727203369140625, 4.39447021484375, 4.5162200927734375, 4.637969970703125, 4.7597198486328125, 4.8814697265625, 5.0032196044921875, 5.124969482421875, 5.2467193603515625, 5.36846923828125, 5.4902191162109375, 5.611968994140625, 5.7337188720703125, 5.85546875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 9.0, 12.0, 27.0, 68.0, 192.0, 310.0, 216.0, 95.0, 27.0, 13.0, 7.0, 4.0, 1.0, 5.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.216959953308105, -8.717105865478516, -8.217252731323242, -7.717398643493652, -7.2175445556640625, -6.717690467834473, -6.217836856842041, -5.717983245849609, -5.2181291580200195, -4.71827507019043, -4.218421459197998, -3.7185676097869873, -3.2187137603759766, -2.718859910964966, -2.219006061553955, -1.7191522121429443, -1.2192983627319336, -0.7194445133209229, -0.2195906639099121, 0.28026318550109863, 0.7801170349121094, 1.2799708843231201, 1.7798247337341309, 2.2796785831451416, 2.7795324325561523, 3.279386281967163, 3.779240131378174, 4.2790937423706055, 4.778947830200195, 5.278801918029785, 5.778655529022217, 6.278509140014648, 6.778364181518555, 7.2782182693481445, 7.778071880340576, 8.277925491333008, 8.777779579162598, 9.277633666992188, 9.777486801147461, 10.27734088897705, 10.77719497680664, 11.27704906463623, 11.77690315246582, 12.276756286621094, 12.776610374450684, 13.276464462280273, 13.776317596435547, 14.276171684265137, 14.776025772094727, 15.275879859924316, 15.775733947753906, 16.27558708190918, 16.775440216064453, 17.27529525756836, 17.775148391723633, 18.27500343322754, 18.774856567382812, 19.274709701538086, 19.774564743041992, 20.274417877197266, 20.774272918701172, 21.274126052856445, 21.77397918701172, 22.273834228515625, 22.7736873626709]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 13.0, 12.0, 12.0, 30.0, 22.0, 28.0, 27.0, 31.0, 60.0, 61.0, 76.0, 72.0, 72.0, 57.0, 71.0, 66.0, 64.0, 43.0, 39.0, 30.0, 25.0, 16.0, 20.0, 11.0, 6.0, 7.0, 6.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.039983749389648, -10.702712059020996, -10.365440368652344, -10.028169631958008, -9.690897941589355, -9.353626251220703, -9.01635456085205, -8.679082870483398, -8.341812133789062, -8.00454044342041, -7.667269229888916, -7.329997539520264, -6.9927263259887695, -6.655454635620117, -6.318182945251465, -5.980911731719971, -5.643640041351318, -5.306368350982666, -4.969097137451172, -4.6318254470825195, -4.294554233551025, -3.957282543182373, -3.6200110912323, -3.2827396392822266, -2.9454681873321533, -2.60819673538208, -2.270925283432007, -1.933653712272644, -1.5963822603225708, -1.2591108083724976, -0.9218392372131348, -0.5845677852630615, -0.24729633331298828, 0.08997514843940735, 0.427246630191803, 0.764518141746521, 1.1017895936965942, 1.4390610456466675, 1.7763326168060303, 2.1136040687561035, 2.4508755207061768, 2.78814697265625, 3.1254184246063232, 3.4626898765563965, 3.799961566925049, 4.137232780456543, 4.474504470825195, 4.811776161193848, 5.149047374725342, 5.486319065093994, 5.823590278625488, 6.160861968994141, 6.498133182525635, 6.835404872894287, 7.172676086425781, 7.509947776794434, 7.847219467163086, 8.184491157531738, 8.52176284790039, 8.859033584594727, 9.196305274963379, 9.533576965332031, 9.870848655700684, 10.208120346069336, 10.545391082763672]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 13.0, 21.0, 30.0, 49.0, 91.0, 136.0, 249.0, 473.0, 1153.0, 2996.0, 9976.0, 41636.0, 224907.0, 583742.0, 143501.0, 28160.0, 7249.0, 2293.0, 915.0, 426.0, 211.0, 131.0, 69.0, 54.0, 22.0, 16.0, 11.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.736328125, -1.677215576171875, -1.61810302734375, -1.558990478515625, -1.4998779296875, -1.440765380859375, -1.38165283203125, -1.322540283203125, -1.263427734375, -1.204315185546875, -1.14520263671875, -1.086090087890625, -1.0269775390625, -0.967864990234375, -0.90875244140625, -0.849639892578125, -0.79052734375, -0.731414794921875, -0.67230224609375, -0.613189697265625, -0.5540771484375, -0.494964599609375, -0.43585205078125, -0.376739501953125, -0.317626953125, -0.258514404296875, -0.19940185546875, -0.140289306640625, -0.0811767578125, -0.022064208984375, 0.03704833984375, 0.096160888671875, 0.1552734375, 0.214385986328125, 0.27349853515625, 0.332611083984375, 0.3917236328125, 0.450836181640625, 0.50994873046875, 0.569061279296875, 0.628173828125, 0.687286376953125, 0.74639892578125, 0.805511474609375, 0.8646240234375, 0.923736572265625, 0.98284912109375, 1.041961669921875, 1.10107421875, 1.160186767578125, 1.21929931640625, 1.278411865234375, 1.3375244140625, 1.396636962890625, 1.45574951171875, 1.514862060546875, 1.573974609375, 1.633087158203125, 1.69219970703125, 1.751312255859375, 1.8104248046875, 1.869537353515625, 1.92864990234375, 1.987762451171875, 2.046875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 10.0, 12.0, 13.0, 15.0, 19.0, 15.0, 23.0, 42.0, 38.0, 42.0, 36.0, 43.0, 59.0, 47.0, 61.0, 41.0, 58.0, 56.0, 57.0, 39.0, 51.0, 39.0, 31.0, 24.0, 23.0, 24.0, 18.0, 14.0, 15.0, 9.0, 5.0, 8.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.001953125, -0.9654083251953125, -0.928863525390625, -0.8923187255859375, -0.85577392578125, -0.8192291259765625, -0.782684326171875, -0.7461395263671875, -0.7095947265625, -0.6730499267578125, -0.636505126953125, -0.5999603271484375, -0.56341552734375, -0.5268707275390625, -0.490325927734375, -0.4537811279296875, -0.417236328125, -0.3806915283203125, -0.344146728515625, -0.3076019287109375, -0.27105712890625, -0.2345123291015625, -0.197967529296875, -0.1614227294921875, -0.1248779296875, -0.0883331298828125, -0.051788330078125, -0.0152435302734375, 0.02130126953125, 0.0578460693359375, 0.094390869140625, 0.1309356689453125, 0.16748046875, 0.2040252685546875, 0.240570068359375, 0.2771148681640625, 0.31365966796875, 0.3502044677734375, 0.386749267578125, 0.4232940673828125, 0.4598388671875, 0.4963836669921875, 0.532928466796875, 0.5694732666015625, 0.60601806640625, 0.6425628662109375, 0.679107666015625, 0.7156524658203125, 0.752197265625, 0.7887420654296875, 0.825286865234375, 0.8618316650390625, 0.89837646484375, 0.9349212646484375, 0.971466064453125, 1.0080108642578125, 1.0445556640625, 1.0811004638671875, 1.117645263671875, 1.1541900634765625, 1.19073486328125, 1.2272796630859375, 1.263824462890625, 1.3003692626953125, 1.3369140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 9.0, 13.0, 19.0, 25.0, 32.0, 75.0, 129.0, 177.0, 383.0, 752.0, 1989.0, 9244.0, 152916.0, 836616.0, 39013.0, 4490.0, 1315.0, 618.0, 283.0, 169.0, 97.0, 59.0, 39.0, 25.0, 21.0, 10.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.609375, -4.489013671875, -4.36865234375, -4.248291015625, -4.1279296875, -4.007568359375, -3.88720703125, -3.766845703125, -3.646484375, -3.526123046875, -3.40576171875, -3.285400390625, -3.1650390625, -3.044677734375, -2.92431640625, -2.803955078125, -2.68359375, -2.563232421875, -2.44287109375, -2.322509765625, -2.2021484375, -2.081787109375, -1.96142578125, -1.841064453125, -1.720703125, -1.600341796875, -1.47998046875, -1.359619140625, -1.2392578125, -1.118896484375, -0.99853515625, -0.878173828125, -0.7578125, -0.637451171875, -0.51708984375, -0.396728515625, -0.2763671875, -0.156005859375, -0.03564453125, 0.084716796875, 0.205078125, 0.325439453125, 0.44580078125, 0.566162109375, 0.6865234375, 0.806884765625, 0.92724609375, 1.047607421875, 1.16796875, 1.288330078125, 1.40869140625, 1.529052734375, 1.6494140625, 1.769775390625, 1.89013671875, 2.010498046875, 2.130859375, 2.251220703125, 2.37158203125, 2.491943359375, 2.6123046875, 2.732666015625, 2.85302734375, 2.973388671875, 3.09375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 10.0, 13.0, 23.0, 45.0, 39.0, 69.0, 81.0, 86.0, 96.0, 111.0, 98.0, 82.0, 61.0, 45.0, 48.0, 28.0, 24.0, 18.0, 6.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.12994384765625, -8.8770751953125, -8.62420654296875, -8.371337890625, -8.11846923828125, -7.8656005859375, -7.61273193359375, -7.35986328125, -7.10699462890625, -6.8541259765625, -6.60125732421875, -6.348388671875, -6.09552001953125, -5.8426513671875, -5.58978271484375, -5.3369140625, -5.08404541015625, -4.8311767578125, -4.57830810546875, -4.325439453125, -4.07257080078125, -3.8197021484375, -3.56683349609375, -3.31396484375, -3.06109619140625, -2.8082275390625, -2.55535888671875, -2.302490234375, -2.04962158203125, -1.7967529296875, -1.54388427734375, -1.291015625, -1.03814697265625, -0.7852783203125, -0.53240966796875, -0.279541015625, -0.02667236328125, 0.2261962890625, 0.47906494140625, 0.73193359375, 0.98480224609375, 1.2376708984375, 1.49053955078125, 1.743408203125, 1.99627685546875, 2.2491455078125, 2.50201416015625, 2.7548828125, 3.00775146484375, 3.2606201171875, 3.51348876953125, 3.766357421875, 4.01922607421875, 4.2720947265625, 4.52496337890625, 4.77783203125, 5.03070068359375, 5.2835693359375, 5.53643798828125, 5.789306640625, 6.04217529296875, 6.2950439453125, 6.54791259765625, 6.80078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 4.0, 3.0, 4.0, 14.0, 17.0, 28.0, 27.0, 65.0, 96.0, 244.0, 651.0, 2590.0, 37509.0, 990136.0, 14445.0, 1810.0, 501.0, 209.0, 79.0, 46.0, 27.0, 18.0, 12.0, 13.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4140625, -3.325103759765625, -3.23614501953125, -3.147186279296875, -3.0582275390625, -2.969268798828125, -2.88031005859375, -2.791351318359375, -2.702392578125, -2.613433837890625, -2.52447509765625, -2.435516357421875, -2.3465576171875, -2.257598876953125, -2.16864013671875, -2.079681396484375, -1.99072265625, -1.901763916015625, -1.81280517578125, -1.723846435546875, -1.6348876953125, -1.545928955078125, -1.45697021484375, -1.368011474609375, -1.279052734375, -1.190093994140625, -1.10113525390625, -1.012176513671875, -0.9232177734375, -0.834259033203125, -0.74530029296875, -0.656341552734375, -0.5673828125, -0.478424072265625, -0.38946533203125, -0.300506591796875, -0.2115478515625, -0.122589111328125, -0.03363037109375, 0.055328369140625, 0.144287109375, 0.233245849609375, 0.32220458984375, 0.411163330078125, 0.5001220703125, 0.589080810546875, 0.67803955078125, 0.766998291015625, 0.85595703125, 0.944915771484375, 1.03387451171875, 1.122833251953125, 1.2117919921875, 1.300750732421875, 1.38970947265625, 1.478668212890625, 1.567626953125, 1.656585693359375, 1.74554443359375, 1.834503173828125, 1.9234619140625, 2.012420654296875, 2.10137939453125, 2.190338134765625, 2.279296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 8.0, 5.0, 13.0, 18.0, 30.0, 49.0, 74.0, 130.0, 182.0, 209.0, 134.0, 65.0, 29.0, 22.0, 13.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000324249267578125, -0.0003161393105983734, -0.0003080293536186218, -0.00029991939663887024, -0.00029180943965911865, -0.00028369948267936707, -0.0002755895256996155, -0.0002674795687198639, -0.0002593696117401123, -0.0002512596547603607, -0.00024314969778060913, -0.00023503974080085754, -0.00022692978382110596, -0.00021881982684135437, -0.00021070986986160278, -0.0002025999128818512, -0.0001944899559020996, -0.00018637999892234802, -0.00017827004194259644, -0.00017016008496284485, -0.00016205012798309326, -0.00015394017100334167, -0.0001458302140235901, -0.0001377202570438385, -0.00012961030006408691, -0.00012150034308433533, -0.00011339038610458374, -0.00010528042912483215, -9.717047214508057e-05, -8.906051516532898e-05, -8.095055818557739e-05, -7.28406012058258e-05, -6.473064422607422e-05, -5.662068724632263e-05, -4.8510730266571045e-05, -4.040077328681946e-05, -3.229081630706787e-05, -2.4180859327316284e-05, -1.6070902347564697e-05, -7.96094536781311e-06, 1.4901161193847656e-07, 8.258968591690063e-06, 1.636892557144165e-05, 2.4478882551193237e-05, 3.2588839530944824e-05, 4.069879651069641e-05, 4.8808753490448e-05, 5.6918710470199585e-05, 6.502866744995117e-05, 7.313862442970276e-05, 8.124858140945435e-05, 8.935853838920593e-05, 9.746849536895752e-05, 0.0001055784523487091, 0.0001136884093284607, 0.00012179836630821228, 0.00012990832328796387, 0.00013801828026771545, 0.00014612823724746704, 0.00015423819422721863, 0.00016234815120697021, 0.0001704581081867218, 0.0001785680651664734, 0.00018667802214622498, 0.00019478797912597656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 12.0, 12.0, 16.0, 17.0, 56.0, 80.0, 145.0, 282.0, 576.0, 1562.0, 6741.0, 109772.0, 890096.0, 33102.0, 4053.0, 1104.0, 429.0, 199.0, 123.0, 60.0, 24.0, 19.0, 9.0, 15.0, 7.0, 12.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.400390625, -1.3556976318359375, -1.311004638671875, -1.2663116455078125, -1.22161865234375, -1.1769256591796875, -1.132232666015625, -1.0875396728515625, -1.0428466796875, -0.9981536865234375, -0.953460693359375, -0.9087677001953125, -0.86407470703125, -0.8193817138671875, -0.774688720703125, -0.7299957275390625, -0.685302734375, -0.6406097412109375, -0.595916748046875, -0.5512237548828125, -0.50653076171875, -0.4618377685546875, -0.417144775390625, -0.3724517822265625, -0.3277587890625, -0.2830657958984375, -0.238372802734375, -0.1936798095703125, -0.14898681640625, -0.1042938232421875, -0.059600830078125, -0.0149078369140625, 0.02978515625, 0.0744781494140625, 0.119171142578125, 0.1638641357421875, 0.20855712890625, 0.2532501220703125, 0.297943115234375, 0.3426361083984375, 0.3873291015625, 0.4320220947265625, 0.476715087890625, 0.5214080810546875, 0.56610107421875, 0.6107940673828125, 0.655487060546875, 0.7001800537109375, 0.744873046875, 0.7895660400390625, 0.834259033203125, 0.8789520263671875, 0.92364501953125, 0.9683380126953125, 1.013031005859375, 1.0577239990234375, 1.1024169921875, 1.1471099853515625, 1.191802978515625, 1.2364959716796875, 1.28118896484375, 1.3258819580078125, 1.370574951171875, 1.4152679443359375, 1.4599609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 12.0, 21.0, 26.0, 44.0, 68.0, 92.0, 126.0, 132.0, 131.0, 118.0, 72.0, 46.0, 40.0, 21.0, 18.0, 11.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88525390625, -0.8405227661132812, -0.7957916259765625, -0.7510604858398438, -0.706329345703125, -0.6615982055664062, -0.6168670654296875, -0.5721359252929688, -0.52740478515625, -0.48267364501953125, -0.4379425048828125, -0.39321136474609375, -0.348480224609375, -0.30374908447265625, -0.2590179443359375, -0.21428680419921875, -0.1695556640625, -0.12482452392578125, -0.0800933837890625, -0.03536224365234375, 0.009368896484375, 0.05410003662109375, 0.0988311767578125, 0.14356231689453125, 0.18829345703125, 0.23302459716796875, 0.2777557373046875, 0.32248687744140625, 0.367218017578125, 0.41194915771484375, 0.4566802978515625, 0.5014114379882812, 0.546142578125, 0.5908737182617188, 0.6356048583984375, 0.6803359985351562, 0.725067138671875, 0.7697982788085938, 0.8145294189453125, 0.8592605590820312, 0.90399169921875, 0.9487228393554688, 0.9934539794921875, 1.0381851196289062, 1.082916259765625, 1.1276473999023438, 1.1723785400390625, 1.2171096801757812, 1.2618408203125, 1.3065719604492188, 1.3513031005859375, 1.3960342407226562, 1.440765380859375, 1.4854965209960938, 1.5302276611328125, 1.5749588012695312, 1.61968994140625, 1.6644210815429688, 1.7091522216796875, 1.7538833618164062, 1.798614501953125, 1.8433456420898438, 1.8880767822265625, 1.9328079223632812, 1.9775390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 11.0, 39.0, 82.0, 473.0, 351.0, 40.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.5853042602539, -87.7188949584961, -85.85249328613281, -83.986083984375, -82.11968231201172, -80.2532730102539, -78.38687133789062, -76.52046203613281, -74.654052734375, -72.78764343261719, -70.9212417602539, -69.0548324584961, -67.18843078613281, -65.322021484375, -63.45561599731445, -61.589210510253906, -59.722808837890625, -57.85640335083008, -55.98999786376953, -54.123592376708984, -52.25718688964844, -50.390777587890625, -48.52437210083008, -46.65796661376953, -44.791561126708984, -42.92515563964844, -41.05875015258789, -39.192344665527344, -37.32593536376953, -35.45953369140625, -33.59312438964844, -31.72671890258789, -29.860315322875977, -27.99390983581543, -26.12750244140625, -24.261096954345703, -22.394691467285156, -20.52828598022461, -18.661880493164062, -16.795473098754883, -14.929067611694336, -13.062662124633789, -11.196255683898926, -9.329849243164062, -7.463443756103516, -5.597038269042969, -3.7306318283081055, -1.8642253875732422, 0.0021800994873046875, 1.8685860633850098, 3.734992027282715, 5.60139799118042, 7.467803955078125, 9.334209442138672, 11.200615882873535, 13.067022323608398, 14.933427810668945, 16.799833297729492, 18.666240692138672, 20.53264617919922, 22.399051666259766, 24.265457153320312, 26.13186264038086, 27.99827003479004, 29.864675521850586]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 11.0, 4.0, 13.0, 13.0, 14.0, 27.0, 20.0, 43.0, 36.0, 54.0, 52.0, 58.0, 79.0, 91.0, 90.0, 64.0, 52.0, 40.0, 51.0, 45.0, 39.0, 22.0, 24.0, 13.0, 15.0, 11.0, 9.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.39104652404785, -22.52100372314453, -21.650962829589844, -20.780920028686523, -19.910879135131836, -19.040836334228516, -18.170795440673828, -17.300752639770508, -16.430709838867188, -15.560667991638184, -14.69062614440918, -13.82058334350586, -12.950542449951172, -12.080499649047852, -11.210457801818848, -10.340415954589844, -9.470375061035156, -8.600333213806152, -7.730291366577148, -6.860249042510986, -5.990207195281982, -5.1201653480529785, -4.250123023986816, -3.3800811767578125, -2.5100393295288086, -1.6399973630905151, -0.7699553966522217, 0.10008668899536133, 0.9701285362243652, 1.8401703834533691, 2.7102127075195312, 3.580254554748535, 4.450298309326172, 5.320340156555176, 6.19038200378418, 7.060424327850342, 7.930466175079346, 8.800508499145508, 9.670550346374512, 10.540592193603516, 11.41063404083252, 12.280675888061523, 13.150717735290527, 14.020759582519531, 14.890802383422852, 15.760843276977539, 16.63088607788086, 17.500926971435547, 18.370969772338867, 19.241012573242188, 20.111053466796875, 20.981096267700195, 21.851137161254883, 22.721179962158203, 23.59122085571289, 24.46126365661621, 25.33130645751953, 26.20134925842285, 27.07139015197754, 27.94143295288086, 28.811473846435547, 29.681516647338867, 30.551559448242188, 31.421600341796875, 32.29164123535156]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 12.0, 13.0, 11.0, 33.0, 57.0, 112.0, 203.0, 653.0, 2386.0, 18856.0, 991522.0, 3138210.0, 36627.0, 3758.0, 1055.0, 384.0, 156.0, 76.0, 51.0, 30.0, 28.0, 11.0, 9.0, 8.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0390625, -1.96661376953125, -1.8941650390625, -1.82171630859375, -1.749267578125, -1.67681884765625, -1.6043701171875, -1.53192138671875, -1.45947265625, -1.38702392578125, -1.3145751953125, -1.24212646484375, -1.169677734375, -1.09722900390625, -1.0247802734375, -0.95233154296875, -0.8798828125, -0.80743408203125, -0.7349853515625, -0.66253662109375, -0.590087890625, -0.51763916015625, -0.4451904296875, -0.37274169921875, -0.30029296875, -0.22784423828125, -0.1553955078125, -0.08294677734375, -0.010498046875, 0.06195068359375, 0.1343994140625, 0.20684814453125, 0.279296875, 0.35174560546875, 0.4241943359375, 0.49664306640625, 0.569091796875, 0.64154052734375, 0.7139892578125, 0.78643798828125, 0.85888671875, 0.93133544921875, 1.0037841796875, 1.07623291015625, 1.148681640625, 1.22113037109375, 1.2935791015625, 1.36602783203125, 1.4384765625, 1.51092529296875, 1.5833740234375, 1.65582275390625, 1.728271484375, 1.80072021484375, 1.8731689453125, 1.94561767578125, 2.01806640625, 2.09051513671875, 2.1629638671875, 2.23541259765625, 2.307861328125, 2.38031005859375, 2.4527587890625, 2.52520751953125, 2.59765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 9.0, 6.0, 14.0, 13.0, 14.0, 22.0, 23.0, 32.0, 28.0, 41.0, 46.0, 35.0, 67.0, 56.0, 60.0, 76.0, 49.0, 66.0, 62.0, 54.0, 46.0, 32.0, 26.0, 22.0, 17.0, 20.0, 14.0, 10.0, 8.0, 9.0, 4.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8868637084960938, -0.8503875732421875, -0.8139114379882812, -0.777435302734375, -0.7409591674804688, -0.7044830322265625, -0.6680068969726562, -0.63153076171875, -0.5950546264648438, -0.5585784912109375, -0.5221023559570312, -0.485626220703125, -0.44915008544921875, -0.4126739501953125, -0.37619781494140625, -0.3397216796875, -0.30324554443359375, -0.2667694091796875, -0.23029327392578125, -0.193817138671875, -0.15734100341796875, -0.1208648681640625, -0.08438873291015625, -0.04791259765625, -0.01143646240234375, 0.0250396728515625, 0.06151580810546875, 0.097991943359375, 0.13446807861328125, 0.1709442138671875, 0.20742034912109375, 0.243896484375, 0.28037261962890625, 0.3168487548828125, 0.35332489013671875, 0.389801025390625, 0.42627716064453125, 0.4627532958984375, 0.49922943115234375, 0.53570556640625, 0.5721817016601562, 0.6086578369140625, 0.6451339721679688, 0.681610107421875, 0.7180862426757812, 0.7545623779296875, 0.7910385131835938, 0.8275146484375, 0.8639907836914062, 0.9004669189453125, 0.9369430541992188, 0.973419189453125, 1.0098953247070312, 1.0463714599609375, 1.0828475952148438, 1.11932373046875, 1.1557998657226562, 1.1922760009765625, 1.2287521362304688, 1.265228271484375, 1.3017044067382812, 1.3381805419921875, 1.3746566772460938, 1.4111328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 10.0, 13.0, 32.0, 27.0, 51.0, 100.0, 168.0, 320.0, 706.0, 2477.0, 15526.0, 256635.0, 3845690.0, 63052.0, 6787.0, 1558.0, 501.0, 248.0, 132.0, 70.0, 56.0, 45.0, 24.0, 21.0, 17.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.17578125, -3.098907470703125, -3.02203369140625, -2.945159912109375, -2.8682861328125, -2.791412353515625, -2.71453857421875, -2.637664794921875, -2.560791015625, -2.483917236328125, -2.40704345703125, -2.330169677734375, -2.2532958984375, -2.176422119140625, -2.09954833984375, -2.022674560546875, -1.94580078125, -1.868927001953125, -1.79205322265625, -1.715179443359375, -1.6383056640625, -1.561431884765625, -1.48455810546875, -1.407684326171875, -1.330810546875, -1.253936767578125, -1.17706298828125, -1.100189208984375, -1.0233154296875, -0.946441650390625, -0.86956787109375, -0.792694091796875, -0.7158203125, -0.638946533203125, -0.56207275390625, -0.485198974609375, -0.4083251953125, -0.331451416015625, -0.25457763671875, -0.177703857421875, -0.100830078125, -0.023956298828125, 0.05291748046875, 0.129791259765625, 0.2066650390625, 0.283538818359375, 0.36041259765625, 0.437286376953125, 0.51416015625, 0.591033935546875, 0.66790771484375, 0.744781494140625, 0.8216552734375, 0.898529052734375, 0.97540283203125, 1.052276611328125, 1.129150390625, 1.206024169921875, 1.28289794921875, 1.359771728515625, 1.4366455078125, 1.513519287109375, 1.59039306640625, 1.667266845703125, 1.744140625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 12.0, 22.0, 23.0, 26.0, 47.0, 97.0, 183.0, 390.0, 1098.0, 1287.0, 481.0, 164.0, 77.0, 43.0, 27.0, 23.0, 10.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.53546142578125, -2.4537353515625, -2.37200927734375, -2.290283203125, -2.20855712890625, -2.1268310546875, -2.04510498046875, -1.96337890625, -1.88165283203125, -1.7999267578125, -1.71820068359375, -1.636474609375, -1.55474853515625, -1.4730224609375, -1.39129638671875, -1.3095703125, -1.22784423828125, -1.1461181640625, -1.06439208984375, -0.982666015625, -0.90093994140625, -0.8192138671875, -0.73748779296875, -0.65576171875, -0.57403564453125, -0.4923095703125, -0.41058349609375, -0.328857421875, -0.24713134765625, -0.1654052734375, -0.08367919921875, -0.001953125, 0.07977294921875, 0.1614990234375, 0.24322509765625, 0.324951171875, 0.40667724609375, 0.4884033203125, 0.57012939453125, 0.65185546875, 0.73358154296875, 0.8153076171875, 0.89703369140625, 0.978759765625, 1.06048583984375, 1.1422119140625, 1.22393798828125, 1.3056640625, 1.38739013671875, 1.4691162109375, 1.55084228515625, 1.632568359375, 1.71429443359375, 1.7960205078125, 1.87774658203125, 1.95947265625, 2.04119873046875, 2.1229248046875, 2.20465087890625, 2.286376953125, 2.36810302734375, 2.4498291015625, 2.53155517578125, 2.61328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 1.0, 16.0, 28.0, 79.0, 194.0, 255.0, 198.0, 114.0, 51.0, 33.0, 11.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.298234939575195, -25.710342407226562, -25.122447967529297, -24.534555435180664, -23.94666290283203, -23.3587703704834, -22.770877838134766, -22.1829833984375, -21.595090866088867, -21.007198333740234, -20.41930389404297, -19.831411361694336, -19.243518829345703, -18.65562629699707, -18.067733764648438, -17.479839324951172, -16.89194679260254, -16.304054260253906, -15.716160774230957, -15.128267288208008, -14.540374755859375, -13.952482223510742, -13.364588737487793, -12.776695251464844, -12.188802719116211, -11.600910186767578, -11.013016700744629, -10.42512321472168, -9.837230682373047, -9.249338150024414, -8.661444664001465, -8.073551177978516, -7.485658645629883, -6.897765636444092, -6.309872627258301, -5.72197961807251, -5.134086608886719, -4.546193599700928, -3.9583005905151367, -3.3704075813293457, -2.7825145721435547, -2.1946215629577637, -1.6067285537719727, -1.0188355445861816, -0.4309425354003906, 0.1569504737854004, 0.7448434829711914, 1.3327364921569824, 1.9206295013427734, 2.5085225105285645, 3.0964155197143555, 3.6843085289001465, 4.2722015380859375, 4.8600945472717285, 5.4479875564575195, 6.0358805656433105, 6.623773574829102, 7.211666584014893, 7.799559593200684, 8.387453079223633, 8.975345611572266, 9.563238143920898, 10.151131629943848, 10.739025115966797, 11.32691764831543]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 6.0, 10.0, 13.0, 16.0, 9.0, 19.0, 25.0, 24.0, 37.0, 35.0, 36.0, 42.0, 46.0, 44.0, 47.0, 41.0, 49.0, 51.0, 56.0, 51.0, 41.0, 46.0, 34.0, 34.0, 33.0, 23.0, 18.0, 24.0, 17.0, 14.0, 6.0, 6.0, 8.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.143954277038574, -8.823899269104004, -8.503843307495117, -8.183788299560547, -7.863733291625977, -7.543678283691406, -7.223622798919678, -6.903567314147949, -6.583512306213379, -6.263457298278809, -5.94340181350708, -5.623346328735352, -5.303291320800781, -4.983236312866211, -4.663180828094482, -4.343125343322754, -4.023070335388184, -3.703015089035034, -3.3829598426818848, -3.0629045963287354, -2.742849349975586, -2.4227941036224365, -2.102738857269287, -1.7826836109161377, -1.4626283645629883, -1.1425731182098389, -0.8225178718566895, -0.50246262550354, -0.18240737915039062, 0.1376478672027588, 0.4577031135559082, 0.7777583599090576, 1.097813606262207, 1.4178688526153564, 1.7379240989685059, 2.0579793453216553, 2.3780345916748047, 2.698089838027954, 3.0181450843811035, 3.338200330734253, 3.6582555770874023, 3.9783108234405518, 4.298366069793701, 4.61842155456543, 4.9384765625, 5.25853157043457, 5.578587055206299, 5.898642539978027, 6.218697547912598, 6.538752555847168, 6.8588080406188965, 7.178863525390625, 7.498918533325195, 7.818973541259766, 8.139028549194336, 8.459084510803223, 8.779139518737793, 9.099194526672363, 9.41925048828125, 9.73930549621582, 10.05936050415039, 10.379415512084961, 10.699470520019531, 11.019526481628418, 11.339581489562988]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 12.0, 15.0, 17.0, 21.0, 41.0, 55.0, 72.0, 125.0, 229.0, 330.0, 580.0, 937.0, 1823.0, 3510.0, 7109.0, 15476.0, 35550.0, 90527.0, 231727.0, 348797.0, 185939.0, 71830.0, 28761.0, 12521.0, 5717.0, 2986.0, 1588.0, 914.0, 545.0, 283.0, 175.0, 102.0, 85.0, 38.0, 36.0, 26.0, 18.0, 11.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.0654296875, -1.0361404418945312, -1.0068511962890625, -0.9775619506835938, -0.948272705078125, -0.9189834594726562, -0.8896942138671875, -0.8604049682617188, -0.83111572265625, -0.8018264770507812, -0.7725372314453125, -0.7432479858398438, -0.713958740234375, -0.6846694946289062, -0.6553802490234375, -0.6260910034179688, -0.5968017578125, -0.5675125122070312, -0.5382232666015625, -0.5089340209960938, -0.479644775390625, -0.45035552978515625, -0.4210662841796875, -0.39177703857421875, -0.36248779296875, -0.33319854736328125, -0.3039093017578125, -0.27462005615234375, -0.245330810546875, -0.21604156494140625, -0.1867523193359375, -0.15746307373046875, -0.128173828125, -0.09888458251953125, -0.0695953369140625, -0.04030609130859375, -0.011016845703125, 0.01827239990234375, 0.0475616455078125, 0.07685089111328125, 0.10614013671875, 0.13542938232421875, 0.1647186279296875, 0.19400787353515625, 0.223297119140625, 0.25258636474609375, 0.2818756103515625, 0.31116485595703125, 0.3404541015625, 0.36974334716796875, 0.3990325927734375, 0.42832183837890625, 0.457611083984375, 0.48690032958984375, 0.5161895751953125, 0.5454788208007812, 0.57476806640625, 0.6040573120117188, 0.6333465576171875, 0.6626358032226562, 0.691925048828125, 0.7212142944335938, 0.7505035400390625, 0.7797927856445312, 0.80908203125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 7.0, 8.0, 10.0, 12.0, 18.0, 11.0, 14.0, 23.0, 29.0, 21.0, 33.0, 46.0, 41.0, 53.0, 50.0, 61.0, 51.0, 55.0, 53.0, 62.0, 62.0, 49.0, 46.0, 37.0, 26.0, 19.0, 21.0, 17.0, 17.0, 11.0, 7.0, 14.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.876953125, -0.8430633544921875, -0.809173583984375, -0.7752838134765625, -0.74139404296875, -0.7075042724609375, -0.673614501953125, -0.6397247314453125, -0.6058349609375, -0.5719451904296875, -0.538055419921875, -0.5041656494140625, -0.47027587890625, -0.4363861083984375, -0.402496337890625, -0.3686065673828125, -0.334716796875, -0.3008270263671875, -0.266937255859375, -0.2330474853515625, -0.19915771484375, -0.1652679443359375, -0.131378173828125, -0.0974884033203125, -0.0635986328125, -0.0297088623046875, 0.004180908203125, 0.0380706787109375, 0.07196044921875, 0.1058502197265625, 0.139739990234375, 0.1736297607421875, 0.20751953125, 0.2414093017578125, 0.275299072265625, 0.3091888427734375, 0.34307861328125, 0.3769683837890625, 0.410858154296875, 0.4447479248046875, 0.4786376953125, 0.5125274658203125, 0.546417236328125, 0.5803070068359375, 0.61419677734375, 0.6480865478515625, 0.681976318359375, 0.7158660888671875, 0.749755859375, 0.7836456298828125, 0.817535400390625, 0.8514251708984375, 0.88531494140625, 0.9192047119140625, 0.953094482421875, 0.9869842529296875, 1.0208740234375, 1.0547637939453125, 1.088653564453125, 1.1225433349609375, 1.15643310546875, 1.1903228759765625, 1.224212646484375, 1.2581024169921875, 1.2919921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 7.0, 8.0, 11.0, 9.0, 16.0, 37.0, 42.0, 41.0, 64.0, 94.0, 100.0, 153.0, 204.0, 305.0, 452.0, 816.0, 1584.0, 4346.0, 24410.0, 583263.0, 403616.0, 21392.0, 3923.0, 1460.0, 693.0, 425.0, 291.0, 190.0, 158.0, 124.0, 78.0, 75.0, 50.0, 33.0, 27.0, 10.0, 11.0, 6.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.10546875, -3.008331298828125, -2.91119384765625, -2.814056396484375, -2.7169189453125, -2.619781494140625, -2.52264404296875, -2.425506591796875, -2.328369140625, -2.231231689453125, -2.13409423828125, -2.036956787109375, -1.9398193359375, -1.842681884765625, -1.74554443359375, -1.648406982421875, -1.55126953125, -1.454132080078125, -1.35699462890625, -1.259857177734375, -1.1627197265625, -1.065582275390625, -0.96844482421875, -0.871307373046875, -0.774169921875, -0.677032470703125, -0.57989501953125, -0.482757568359375, -0.3856201171875, -0.288482666015625, -0.19134521484375, -0.094207763671875, 0.0029296875, 0.100067138671875, 0.19720458984375, 0.294342041015625, 0.3914794921875, 0.488616943359375, 0.58575439453125, 0.682891845703125, 0.780029296875, 0.877166748046875, 0.97430419921875, 1.071441650390625, 1.1685791015625, 1.265716552734375, 1.36285400390625, 1.459991455078125, 1.55712890625, 1.654266357421875, 1.75140380859375, 1.848541259765625, 1.9456787109375, 2.042816162109375, 2.13995361328125, 2.237091064453125, 2.334228515625, 2.431365966796875, 2.52850341796875, 2.625640869140625, 2.7227783203125, 2.819915771484375, 2.91705322265625, 3.014190673828125, 3.111328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 9.0, 6.0, 7.0, 5.0, 16.0, 6.0, 9.0, 15.0, 19.0, 25.0, 27.0, 33.0, 47.0, 47.0, 49.0, 52.0, 49.0, 58.0, 66.0, 47.0, 56.0, 46.0, 47.0, 39.0, 32.0, 28.0, 29.0, 25.0, 22.0, 19.0, 9.0, 14.0, 13.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-5.3984375, -5.25030517578125, -5.1021728515625, -4.95404052734375, -4.805908203125, -4.65777587890625, -4.5096435546875, -4.36151123046875, -4.21337890625, -4.06524658203125, -3.9171142578125, -3.76898193359375, -3.620849609375, -3.47271728515625, -3.3245849609375, -3.17645263671875, -3.0283203125, -2.88018798828125, -2.7320556640625, -2.58392333984375, -2.435791015625, -2.28765869140625, -2.1395263671875, -1.99139404296875, -1.84326171875, -1.69512939453125, -1.5469970703125, -1.39886474609375, -1.250732421875, -1.10260009765625, -0.9544677734375, -0.80633544921875, -0.658203125, -0.51007080078125, -0.3619384765625, -0.21380615234375, -0.065673828125, 0.08245849609375, 0.2305908203125, 0.37872314453125, 0.52685546875, 0.67498779296875, 0.8231201171875, 0.97125244140625, 1.119384765625, 1.26751708984375, 1.4156494140625, 1.56378173828125, 1.7119140625, 1.86004638671875, 2.0081787109375, 2.15631103515625, 2.304443359375, 2.45257568359375, 2.6007080078125, 2.74884033203125, 2.89697265625, 3.04510498046875, 3.1932373046875, 3.34136962890625, 3.489501953125, 3.63763427734375, 3.7857666015625, 3.93389892578125, 4.08203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 12.0, 6.0, 21.0, 34.0, 43.0, 107.0, 204.0, 530.0, 1783.0, 10078.0, 939875.0, 89274.0, 4746.0, 1113.0, 402.0, 151.0, 84.0, 47.0, 19.0, 14.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2265625, -2.146514892578125, -2.06646728515625, -1.986419677734375, -1.9063720703125, -1.826324462890625, -1.74627685546875, -1.666229248046875, -1.586181640625, -1.506134033203125, -1.42608642578125, -1.346038818359375, -1.2659912109375, -1.185943603515625, -1.10589599609375, -1.025848388671875, -0.94580078125, -0.865753173828125, -0.78570556640625, -0.705657958984375, -0.6256103515625, -0.545562744140625, -0.46551513671875, -0.385467529296875, -0.305419921875, -0.225372314453125, -0.14532470703125, -0.065277099609375, 0.0147705078125, 0.094818115234375, 0.17486572265625, 0.254913330078125, 0.3349609375, 0.415008544921875, 0.49505615234375, 0.575103759765625, 0.6551513671875, 0.735198974609375, 0.81524658203125, 0.895294189453125, 0.975341796875, 1.055389404296875, 1.13543701171875, 1.215484619140625, 1.2955322265625, 1.375579833984375, 1.45562744140625, 1.535675048828125, 1.61572265625, 1.695770263671875, 1.77581787109375, 1.855865478515625, 1.9359130859375, 2.015960693359375, 2.09600830078125, 2.176055908203125, 2.256103515625, 2.336151123046875, 2.41619873046875, 2.496246337890625, 2.5762939453125, 2.656341552734375, 2.73638916015625, 2.816436767578125, 2.896484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 7.0, 11.0, 18.0, 34.0, 47.0, 138.0, 257.0, 219.0, 115.0, 60.0, 32.0, 29.0, 9.0, 8.0, 5.0, 3.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016450881958007812, -0.00015474483370780945, -0.00014498084783554077, -0.0001352168619632721, -0.00012545287609100342, -0.00011568889021873474, -0.00010592490434646606, -9.616091847419739e-05, -8.639693260192871e-05, -7.663294672966003e-05, -6.686896085739136e-05, -5.710497498512268e-05, -4.7340989112854004e-05, -3.757700324058533e-05, -2.781301736831665e-05, -1.8049031496047974e-05, -8.285045623779297e-06, 1.4789402484893799e-06, 1.1242926120758057e-05, 2.1006911993026733e-05, 3.077089786529541e-05, 4.053488373756409e-05, 5.0298869609832764e-05, 6.006285548210144e-05, 6.982684135437012e-05, 7.95908272266388e-05, 8.935481309890747e-05, 9.911879897117615e-05, 0.00010888278484344482, 0.0001186467707157135, 0.00012841075658798218, 0.00013817474246025085, 0.00014793872833251953, 0.0001577027142047882, 0.00016746670007705688, 0.00017723068594932556, 0.00018699467182159424, 0.00019675865769386292, 0.0002065226435661316, 0.00021628662943840027, 0.00022605061531066895, 0.00023581460118293762, 0.0002455785870552063, 0.000255342572927475, 0.00026510655879974365, 0.00027487054467201233, 0.000284634530544281, 0.0002943985164165497, 0.00030416250228881836, 0.00031392648816108704, 0.0003236904740333557, 0.0003334544599056244, 0.00034321844577789307, 0.00035298243165016174, 0.0003627464175224304, 0.0003725104033946991, 0.0003822743892669678, 0.00039203837513923645, 0.0004018023610115051, 0.0004115663468837738, 0.0004213303327560425, 0.00043109431862831116, 0.00044085830450057983, 0.0004506222903728485, 0.0004603862762451172]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 10.0, 17.0, 27.0, 31.0, 65.0, 107.0, 197.0, 385.0, 1013.0, 4260.0, 29570.0, 967377.0, 38533.0, 4900.0, 1231.0, 413.0, 151.0, 97.0, 59.0, 34.0, 15.0, 11.0, 7.0, 4.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4747772216796875, -1.421234130859375, -1.3676910400390625, -1.31414794921875, -1.2606048583984375, -1.207061767578125, -1.1535186767578125, -1.0999755859375, -1.0464324951171875, -0.992889404296875, -0.9393463134765625, -0.88580322265625, -0.8322601318359375, -0.778717041015625, -0.7251739501953125, -0.671630859375, -0.6180877685546875, -0.564544677734375, -0.5110015869140625, -0.45745849609375, -0.4039154052734375, -0.350372314453125, -0.2968292236328125, -0.2432861328125, -0.1897430419921875, -0.136199951171875, -0.0826568603515625, -0.02911376953125, 0.0244293212890625, 0.077972412109375, 0.1315155029296875, 0.18505859375, 0.2386016845703125, 0.292144775390625, 0.3456878662109375, 0.39923095703125, 0.4527740478515625, 0.506317138671875, 0.5598602294921875, 0.6134033203125, 0.6669464111328125, 0.720489501953125, 0.7740325927734375, 0.82757568359375, 0.8811187744140625, 0.934661865234375, 0.9882049560546875, 1.041748046875, 1.0952911376953125, 1.148834228515625, 1.2023773193359375, 1.25592041015625, 1.3094635009765625, 1.363006591796875, 1.4165496826171875, 1.4700927734375, 1.5236358642578125, 1.577178955078125, 1.6307220458984375, 1.68426513671875, 1.7378082275390625, 1.791351318359375, 1.8448944091796875, 1.8984375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 0.0, 3.0, 4.0, 7.0, 2.0, 6.0, 8.0, 9.0, 12.0, 18.0, 23.0, 28.0, 64.0, 108.0, 161.0, 165.0, 134.0, 87.0, 64.0, 25.0, 17.0, 8.0, 7.0, 6.0, 4.0, 6.0, 5.0, 0.0, 3.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.54296875, -1.5025787353515625, -1.462188720703125, -1.4217987060546875, -1.38140869140625, -1.3410186767578125, -1.300628662109375, -1.2602386474609375, -1.2198486328125, -1.1794586181640625, -1.139068603515625, -1.0986785888671875, -1.05828857421875, -1.0178985595703125, -0.977508544921875, -0.9371185302734375, -0.896728515625, -0.8563385009765625, -0.815948486328125, -0.7755584716796875, -0.73516845703125, -0.6947784423828125, -0.654388427734375, -0.6139984130859375, -0.5736083984375, -0.5332183837890625, -0.492828369140625, -0.4524383544921875, -0.41204833984375, -0.3716583251953125, -0.331268310546875, -0.2908782958984375, -0.25048828125, -0.2100982666015625, -0.169708251953125, -0.1293182373046875, -0.08892822265625, -0.0485382080078125, -0.008148193359375, 0.0322418212890625, 0.0726318359375, 0.1130218505859375, 0.153411865234375, 0.1938018798828125, 0.23419189453125, 0.2745819091796875, 0.314971923828125, 0.3553619384765625, 0.395751953125, 0.4361419677734375, 0.476531982421875, 0.5169219970703125, 0.55731201171875, 0.5977020263671875, 0.638092041015625, 0.6784820556640625, 0.7188720703125, 0.7592620849609375, 0.799652099609375, 0.8400421142578125, 0.88043212890625, 0.9208221435546875, 0.961212158203125, 1.0016021728515625, 1.0419921875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 18.0, 49.0, 107.0, 230.0, 333.0, 139.0, 55.0, 30.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.32586097717285, -20.44742202758789, -19.56898307800293, -18.69054412841797, -17.812105178833008, -16.933666229248047, -16.05522918701172, -15.176789283752441, -14.29835033416748, -13.41991138458252, -12.541472434997559, -11.663034439086914, -10.784595489501953, -9.906156539916992, -9.027717590332031, -8.14927864074707, -7.270839691162109, -6.392400741577148, -5.5139617919921875, -4.635523319244385, -3.757084369659424, -2.878645420074463, -2.00020694732666, -1.1217679977416992, -0.24332904815673828, 0.6351097822189331, 1.5135486125946045, 2.3919873237609863, 3.2704262733459473, 4.148865222930908, 5.027303695678711, 5.905742645263672, 6.784183502197266, 7.662622451782227, 8.541061401367188, 9.419500350952148, 10.29793930053711, 11.17637825012207, 12.054816246032715, 12.933255195617676, 13.811694145202637, 14.690133094787598, 15.568572044372559, 16.447010040283203, 17.325448989868164, 18.203887939453125, 19.082326889038086, 19.960765838623047, 20.839204788208008, 21.71764373779297, 22.59608268737793, 23.47452163696289, 24.35296058654785, 25.231399536132812, 26.10983657836914, 26.988277435302734, 27.866714477539062, 28.745153427124023, 29.623592376708984, 30.502031326293945, 31.380470275878906, 32.258907318115234, 33.13734817504883, 34.015785217285156, 34.89422607421875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 6.0, 4.0, 6.0, 11.0, 7.0, 8.0, 12.0, 23.0, 18.0, 25.0, 20.0, 17.0, 24.0, 26.0, 22.0, 25.0, 33.0, 35.0, 43.0, 46.0, 69.0, 69.0, 61.0, 42.0, 40.0, 30.0, 39.0, 23.0, 22.0, 21.0, 23.0, 18.0, 18.0, 21.0, 13.0, 11.0, 15.0, 13.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.533464431762695, -16.980764389038086, -16.428062438964844, -15.875362396240234, -15.322662353515625, -14.769962310791016, -14.21726131439209, -13.664560317993164, -13.111860275268555, -12.559160232543945, -12.00645923614502, -11.453758239746094, -10.901058197021484, -10.348358154296875, -9.79565715789795, -9.242956161499023, -8.690256118774414, -8.137556076049805, -7.584855079650879, -7.032154560089111, -6.479454040527344, -5.926753520965576, -5.374053001403809, -4.821352481842041, -4.268651962280273, -3.715951442718506, -3.1632509231567383, -2.6105504035949707, -2.057849884033203, -1.5051493644714355, -0.952448844909668, -0.3997483253479004, 0.1529541015625, 0.7056546211242676, 1.2583551406860352, 1.8110556602478027, 2.3637561798095703, 2.916456699371338, 3.4691572189331055, 4.021857738494873, 4.574558258056641, 5.127258777618408, 5.679959297180176, 6.232659816741943, 6.785360336303711, 7.3380608558654785, 7.890761375427246, 8.443462371826172, 8.996162414550781, 9.54886245727539, 10.101563453674316, 10.654264450073242, 11.206964492797852, 11.759664535522461, 12.312365531921387, 12.865066528320312, 13.417766571044922, 13.970466613769531, 14.523167610168457, 15.075868606567383, 15.628568649291992, 16.1812686920166, 16.733970642089844, 17.286670684814453, 17.839370727539062]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 4.0, 15.0, 15.0, 27.0, 44.0, 50.0, 65.0, 93.0, 146.0, 210.0, 393.0, 657.0, 1236.0, 3017.0, 10371.0, 52644.0, 394565.0, 2164245.0, 1344653.0, 183518.0, 26077.0, 6489.0, 2701.0, 1353.0, 715.0, 362.0, 211.0, 138.0, 87.0, 43.0, 38.0, 24.0, 16.0, 17.0, 8.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79541015625, -0.7695999145507812, -0.7437896728515625, -0.7179794311523438, -0.692169189453125, -0.6663589477539062, -0.6405487060546875, -0.6147384643554688, -0.58892822265625, -0.5631179809570312, -0.5373077392578125, -0.5114974975585938, -0.485687255859375, -0.45987701416015625, -0.4340667724609375, -0.40825653076171875, -0.3824462890625, -0.35663604736328125, -0.3308258056640625, -0.30501556396484375, -0.279205322265625, -0.25339508056640625, -0.2275848388671875, -0.20177459716796875, -0.17596435546875, -0.15015411376953125, -0.1243438720703125, -0.09853363037109375, -0.072723388671875, -0.04691314697265625, -0.0211029052734375, 0.00470733642578125, 0.030517578125, 0.05632781982421875, 0.0821380615234375, 0.10794830322265625, 0.133758544921875, 0.15956878662109375, 0.1853790283203125, 0.21118927001953125, 0.23699951171875, 0.26280975341796875, 0.2886199951171875, 0.31443023681640625, 0.340240478515625, 0.36605072021484375, 0.3918609619140625, 0.41767120361328125, 0.4434814453125, 0.46929168701171875, 0.4951019287109375, 0.5209121704101562, 0.546722412109375, 0.5725326538085938, 0.5983428955078125, 0.6241531372070312, 0.64996337890625, 0.6757736206054688, 0.7015838623046875, 0.7273941040039062, 0.753204345703125, 0.7790145874023438, 0.8048248291015625, 0.8306350708007812, 0.8564453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 4.0, 10.0, 15.0, 19.0, 21.0, 30.0, 37.0, 40.0, 57.0, 62.0, 64.0, 83.0, 61.0, 79.0, 68.0, 66.0, 63.0, 40.0, 50.0, 30.0, 24.0, 22.0, 20.0, 9.0, 12.0, 7.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7861328125, -1.7434158325195312, -1.7006988525390625, -1.6579818725585938, -1.615264892578125, -1.5725479125976562, -1.5298309326171875, -1.4871139526367188, -1.44439697265625, -1.4016799926757812, -1.3589630126953125, -1.3162460327148438, -1.273529052734375, -1.2308120727539062, -1.1880950927734375, -1.1453781127929688, -1.1026611328125, -1.0599441528320312, -1.0172271728515625, -0.9745101928710938, -0.931793212890625, -0.8890762329101562, -0.8463592529296875, -0.8036422729492188, -0.76092529296875, -0.7182083129882812, -0.6754913330078125, -0.6327743530273438, -0.590057373046875, -0.5473403930664062, -0.5046234130859375, -0.46190643310546875, -0.419189453125, -0.37647247314453125, -0.3337554931640625, -0.29103851318359375, -0.248321533203125, -0.20560455322265625, -0.1628875732421875, -0.12017059326171875, -0.07745361328125, -0.03473663330078125, 0.0079803466796875, 0.05069732666015625, 0.093414306640625, 0.13613128662109375, 0.1788482666015625, 0.22156524658203125, 0.2642822265625, 0.30699920654296875, 0.3497161865234375, 0.39243316650390625, 0.435150146484375, 0.47786712646484375, 0.5205841064453125, 0.5633010864257812, 0.60601806640625, 0.6487350463867188, 0.6914520263671875, 0.7341690063476562, 0.776885986328125, 0.8196029663085938, 0.8623199462890625, 0.9050369262695312, 0.94775390625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 5.0, 14.0, 15.0, 19.0, 32.0, 69.0, 109.0, 180.0, 414.0, 895.0, 2662.0, 11303.0, 97659.0, 3815672.0, 241335.0, 17857.0, 3486.0, 1172.0, 555.0, 320.0, 187.0, 114.0, 74.0, 45.0, 31.0, 17.0, 15.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.888671875, -1.8289642333984375, -1.769256591796875, -1.7095489501953125, -1.64984130859375, -1.5901336669921875, -1.530426025390625, -1.4707183837890625, -1.4110107421875, -1.3513031005859375, -1.291595458984375, -1.2318878173828125, -1.17218017578125, -1.1124725341796875, -1.052764892578125, -0.9930572509765625, -0.933349609375, -0.8736419677734375, -0.813934326171875, -0.7542266845703125, -0.69451904296875, -0.6348114013671875, -0.575103759765625, -0.5153961181640625, -0.4556884765625, -0.3959808349609375, -0.336273193359375, -0.2765655517578125, -0.21685791015625, -0.1571502685546875, -0.097442626953125, -0.0377349853515625, 0.02197265625, 0.0816802978515625, 0.141387939453125, 0.2010955810546875, 0.26080322265625, 0.3205108642578125, 0.380218505859375, 0.4399261474609375, 0.4996337890625, 0.5593414306640625, 0.619049072265625, 0.6787567138671875, 0.73846435546875, 0.7981719970703125, 0.857879638671875, 0.9175872802734375, 0.977294921875, 1.0370025634765625, 1.096710205078125, 1.1564178466796875, 1.21612548828125, 1.2758331298828125, 1.335540771484375, 1.3952484130859375, 1.4549560546875, 1.5146636962890625, 1.574371337890625, 1.6340789794921875, 1.69378662109375, 1.7534942626953125, 1.813201904296875, 1.8729095458984375, 1.9326171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 16.0, 19.0, 29.0, 44.0, 65.0, 158.0, 474.0, 1275.0, 1238.0, 436.0, 140.0, 55.0, 31.0, 18.0, 21.0, 18.0, 8.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.091827392578125, -2.00787353515625, -1.923919677734375, -1.8399658203125, -1.756011962890625, -1.67205810546875, -1.588104248046875, -1.504150390625, -1.420196533203125, -1.33624267578125, -1.252288818359375, -1.1683349609375, -1.084381103515625, -1.00042724609375, -0.916473388671875, -0.83251953125, -0.748565673828125, -0.66461181640625, -0.580657958984375, -0.4967041015625, -0.412750244140625, -0.32879638671875, -0.244842529296875, -0.160888671875, -0.076934814453125, 0.00701904296875, 0.090972900390625, 0.1749267578125, 0.258880615234375, 0.34283447265625, 0.426788330078125, 0.5107421875, 0.594696044921875, 0.67864990234375, 0.762603759765625, 0.8465576171875, 0.930511474609375, 1.01446533203125, 1.098419189453125, 1.182373046875, 1.266326904296875, 1.35028076171875, 1.434234619140625, 1.5181884765625, 1.602142333984375, 1.68609619140625, 1.770050048828125, 1.85400390625, 1.937957763671875, 2.02191162109375, 2.105865478515625, 2.1898193359375, 2.273773193359375, 2.35772705078125, 2.441680908203125, 2.525634765625, 2.609588623046875, 2.69354248046875, 2.777496337890625, 2.8614501953125, 2.945404052734375, 3.02935791015625, 3.113311767578125, 3.197265625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 55.0, 273.0, 448.0, 153.0, 29.0, 8.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.36346435546875, -31.420207977294922, -30.47694969177246, -29.53369140625, -28.590435028076172, -27.647178649902344, -26.703920364379883, -25.760662078857422, -24.817405700683594, -23.874149322509766, -22.930891036987305, -21.987632751464844, -21.044376373291016, -20.101119995117188, -19.157861709594727, -18.214603424072266, -17.271347045898438, -16.32809066772461, -15.384832382202148, -14.441575050354004, -13.49831771850586, -12.555060386657715, -11.61180305480957, -10.668545722961426, -9.725288391113281, -8.782031059265137, -7.838773727416992, -6.895516395568848, -5.952259063720703, -5.009001731872559, -4.065744400024414, -3.1224870681762695, -2.179231643676758, -1.2359743118286133, -0.29271697998046875, 0.6505403518676758, 1.5937976837158203, 2.537055015563965, 3.4803123474121094, 4.423569679260254, 5.366827011108398, 6.310084342956543, 7.2533416748046875, 8.196599006652832, 9.139856338500977, 10.083113670349121, 11.026371002197266, 11.96962833404541, 12.912885665893555, 13.8561429977417, 14.799400329589844, 15.742657661437988, 16.685914993286133, 17.629173278808594, 18.572429656982422, 19.51568603515625, 20.45894432067871, 21.402202606201172, 22.345458984375, 23.288715362548828, 24.23197364807129, 25.17523193359375, 26.118488311767578, 27.061744689941406, 28.005002975463867]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 16.0, 12.0, 23.0, 40.0, 34.0, 39.0, 61.0, 86.0, 75.0, 80.0, 67.0, 82.0, 64.0, 82.0, 51.0, 38.0, 31.0, 38.0, 26.0, 17.0, 15.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.638966083526611, -7.22601842880249, -6.813070774078369, -6.400123596191406, -5.987175941467285, -5.574228286743164, -5.161280632019043, -4.748332977294922, -4.335385322570801, -3.9224376678466797, -3.5094900131225586, -3.0965425968170166, -2.6835949420928955, -2.2706472873687744, -1.8576998710632324, -1.4447522163391113, -1.0318045616149902, -0.6188569664955139, -0.2059093713760376, 0.20703816413879395, 0.619985818862915, 1.0329334735870361, 1.4458808898925781, 1.8588285446166992, 2.2717761993408203, 2.6847238540649414, 3.0976715087890625, 3.5106189250946045, 3.9235665798187256, 4.336514472961426, 4.749461650848389, 5.16240930557251, 5.575357437133789, 5.98830509185791, 6.401252746582031, 6.814200401306152, 7.227148056030273, 7.6400957107543945, 8.053043365478516, 8.46599006652832, 8.878938674926758, 9.291886329650879, 9.704833984375, 10.117781639099121, 10.530729293823242, 10.943676948547363, 11.356624603271484, 11.769571304321289, 12.18251895904541, 12.595466613769531, 13.008414268493652, 13.421361923217773, 13.834309577941895, 14.247257232666016, 14.66020393371582, 15.073152542114258, 15.486099243164062, 15.899046897888184, 16.311994552612305, 16.72494125366211, 17.137889862060547, 17.55083656311035, 17.96378517150879, 18.376731872558594, 18.78968048095703]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 6.0, 20.0, 30.0, 43.0, 53.0, 96.0, 133.0, 224.0, 320.0, 553.0, 938.0, 1650.0, 2891.0, 5606.0, 11132.0, 23268.0, 49647.0, 110700.0, 241029.0, 303263.0, 160809.0, 71886.0, 32162.0, 15274.0, 7576.0, 3872.0, 2209.0, 1242.0, 729.0, 408.0, 307.0, 158.0, 104.0, 79.0, 38.0, 36.0, 18.0, 14.0, 8.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8480148315429688, -0.8224945068359375, -0.7969741821289062, -0.771453857421875, -0.7459335327148438, -0.7204132080078125, -0.6948928833007812, -0.66937255859375, -0.6438522338867188, -0.6183319091796875, -0.5928115844726562, -0.567291259765625, -0.5417709350585938, -0.5162506103515625, -0.49073028564453125, -0.4652099609375, -0.43968963623046875, -0.4141693115234375, -0.38864898681640625, -0.363128662109375, -0.33760833740234375, -0.3120880126953125, -0.28656768798828125, -0.26104736328125, -0.23552703857421875, -0.2100067138671875, -0.18448638916015625, -0.158966064453125, -0.13344573974609375, -0.1079254150390625, -0.08240509033203125, -0.056884765625, -0.03136444091796875, -0.0058441162109375, 0.01967620849609375, 0.045196533203125, 0.07071685791015625, 0.0962371826171875, 0.12175750732421875, 0.14727783203125, 0.17279815673828125, 0.1983184814453125, 0.22383880615234375, 0.249359130859375, 0.27487945556640625, 0.3003997802734375, 0.32592010498046875, 0.3514404296875, 0.37696075439453125, 0.4024810791015625, 0.42800140380859375, 0.453521728515625, 0.47904205322265625, 0.5045623779296875, 0.5300827026367188, 0.55560302734375, 0.5811233520507812, 0.6066436767578125, 0.6321640014648438, 0.657684326171875, 0.6832046508789062, 0.7087249755859375, 0.7342453002929688, 0.759765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 4.0, 6.0, 8.0, 5.0, 11.0, 16.0, 10.0, 15.0, 19.0, 22.0, 22.0, 34.0, 30.0, 36.0, 31.0, 50.0, 31.0, 49.0, 46.0, 50.0, 52.0, 39.0, 36.0, 32.0, 50.0, 39.0, 32.0, 36.0, 24.0, 23.0, 22.0, 16.0, 18.0, 18.0, 9.0, 12.0, 9.0, 7.0, 11.0, 4.0, 3.0, 5.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6865234375, -0.6621627807617188, -0.6378021240234375, -0.6134414672851562, -0.589080810546875, -0.5647201538085938, -0.5403594970703125, -0.5159988403320312, -0.49163818359375, -0.46727752685546875, -0.4429168701171875, -0.41855621337890625, -0.394195556640625, -0.36983489990234375, -0.3454742431640625, -0.32111358642578125, -0.2967529296875, -0.27239227294921875, -0.2480316162109375, -0.22367095947265625, -0.199310302734375, -0.17494964599609375, -0.1505889892578125, -0.12622833251953125, -0.10186767578125, -0.07750701904296875, -0.0531463623046875, -0.02878570556640625, -0.004425048828125, 0.01993560791015625, 0.0442962646484375, 0.06865692138671875, 0.093017578125, 0.11737823486328125, 0.1417388916015625, 0.16609954833984375, 0.190460205078125, 0.21482086181640625, 0.2391815185546875, 0.26354217529296875, 0.28790283203125, 0.31226348876953125, 0.3366241455078125, 0.36098480224609375, 0.385345458984375, 0.40970611572265625, 0.4340667724609375, 0.45842742919921875, 0.4827880859375, 0.5071487426757812, 0.5315093994140625, 0.5558700561523438, 0.580230712890625, 0.6045913696289062, 0.6289520263671875, 0.6533126831054688, 0.67767333984375, 0.7020339965820312, 0.7263946533203125, 0.7507553100585938, 0.775115966796875, 0.7994766235351562, 0.8238372802734375, 0.8481979370117188, 0.87255859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 6.0, 10.0, 10.0, 16.0, 16.0, 23.0, 27.0, 39.0, 48.0, 62.0, 92.0, 116.0, 164.0, 240.0, 301.0, 431.0, 711.0, 1245.0, 2544.0, 7021.0, 35032.0, 297084.0, 627940.0, 58112.0, 10208.0, 3170.0, 1351.0, 791.0, 499.0, 342.0, 248.0, 171.0, 117.0, 99.0, 62.0, 43.0, 43.0, 30.0, 21.0, 16.0, 14.0, 13.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9100189208984375, -1.844451904296875, -1.7788848876953125, -1.71331787109375, -1.6477508544921875, -1.582183837890625, -1.5166168212890625, -1.4510498046875, -1.3854827880859375, -1.319915771484375, -1.2543487548828125, -1.18878173828125, -1.1232147216796875, -1.057647705078125, -0.9920806884765625, -0.926513671875, -0.8609466552734375, -0.795379638671875, -0.7298126220703125, -0.66424560546875, -0.5986785888671875, -0.533111572265625, -0.4675445556640625, -0.4019775390625, -0.3364105224609375, -0.270843505859375, -0.2052764892578125, -0.13970947265625, -0.0741424560546875, -0.008575439453125, 0.0569915771484375, 0.12255859375, 0.1881256103515625, 0.253692626953125, 0.3192596435546875, 0.38482666015625, 0.4503936767578125, 0.515960693359375, 0.5815277099609375, 0.6470947265625, 0.7126617431640625, 0.778228759765625, 0.8437957763671875, 0.90936279296875, 0.9749298095703125, 1.040496826171875, 1.1060638427734375, 1.171630859375, 1.2371978759765625, 1.302764892578125, 1.3683319091796875, 1.43389892578125, 1.4994659423828125, 1.565032958984375, 1.6305999755859375, 1.6961669921875, 1.7617340087890625, 1.827301025390625, 1.8928680419921875, 1.95843505859375, 2.0240020751953125, 2.089569091796875, 2.1551361083984375, 2.220703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 8.0, 5.0, 5.0, 12.0, 10.0, 8.0, 11.0, 11.0, 18.0, 23.0, 25.0, 19.0, 33.0, 33.0, 26.0, 35.0, 42.0, 38.0, 53.0, 56.0, 44.0, 51.0, 58.0, 43.0, 38.0, 40.0, 32.0, 29.0, 25.0, 33.0, 28.0, 21.0, 10.0, 15.0, 15.0, 10.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.67431640625, -2.5810546875, -2.48779296875, -2.39453125, -2.30126953125, -2.2080078125, -2.11474609375, -2.021484375, -1.92822265625, -1.8349609375, -1.74169921875, -1.6484375, -1.55517578125, -1.4619140625, -1.36865234375, -1.275390625, -1.18212890625, -1.0888671875, -0.99560546875, -0.90234375, -0.80908203125, -0.7158203125, -0.62255859375, -0.529296875, -0.43603515625, -0.3427734375, -0.24951171875, -0.15625, -0.06298828125, 0.0302734375, 0.12353515625, 0.216796875, 0.31005859375, 0.4033203125, 0.49658203125, 0.58984375, 0.68310546875, 0.7763671875, 0.86962890625, 0.962890625, 1.05615234375, 1.1494140625, 1.24267578125, 1.3359375, 1.42919921875, 1.5224609375, 1.61572265625, 1.708984375, 1.80224609375, 1.8955078125, 1.98876953125, 2.08203125, 2.17529296875, 2.2685546875, 2.36181640625, 2.455078125, 2.54833984375, 2.6416015625, 2.73486328125, 2.828125, 2.92138671875, 3.0146484375, 3.10791015625, 3.201171875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 4.0, 13.0, 10.0, 20.0, 43.0, 44.0, 109.0, 146.0, 223.0, 375.0, 779.0, 1722.0, 4278.0, 11925.0, 44584.0, 357317.0, 555475.0, 50224.0, 13074.0, 4404.0, 1799.0, 840.0, 445.0, 238.0, 138.0, 98.0, 73.0, 38.0, 31.0, 22.0, 12.0, 10.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5286865234375, -0.507568359375, -0.4864501953125, -0.46533203125, -0.4442138671875, -0.423095703125, -0.4019775390625, -0.380859375, -0.3597412109375, -0.338623046875, -0.3175048828125, -0.29638671875, -0.2752685546875, -0.254150390625, -0.2330322265625, -0.2119140625, -0.1907958984375, -0.169677734375, -0.1485595703125, -0.12744140625, -0.1063232421875, -0.085205078125, -0.0640869140625, -0.04296875, -0.0218505859375, -0.000732421875, 0.0203857421875, 0.04150390625, 0.0626220703125, 0.083740234375, 0.1048583984375, 0.1259765625, 0.1470947265625, 0.168212890625, 0.1893310546875, 0.21044921875, 0.2315673828125, 0.252685546875, 0.2738037109375, 0.294921875, 0.3160400390625, 0.337158203125, 0.3582763671875, 0.37939453125, 0.4005126953125, 0.421630859375, 0.4427490234375, 0.4638671875, 0.4849853515625, 0.506103515625, 0.5272216796875, 0.54833984375, 0.5694580078125, 0.590576171875, 0.6116943359375, 0.6328125, 0.6539306640625, 0.675048828125, 0.6961669921875, 0.71728515625, 0.7384033203125, 0.759521484375, 0.7806396484375, 0.8017578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 9.0, 5.0, 5.0, 6.0, 15.0, 24.0, 28.0, 30.0, 52.0, 86.0, 132.0, 158.0, 142.0, 105.0, 61.0, 31.0, 30.0, 24.0, 15.0, 13.0, 12.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001838207244873047, -0.00017686188220977783, -0.00016990303993225098, -0.00016294419765472412, -0.00015598535537719727, -0.0001490265130996704, -0.00014206767082214355, -0.0001351088285446167, -0.00012814998626708984, -0.00012119114398956299, -0.00011423230171203613, -0.00010727345943450928, -0.00010031461715698242, -9.335577487945557e-05, -8.639693260192871e-05, -7.943809032440186e-05, -7.2479248046875e-05, -6.552040576934814e-05, -5.856156349182129e-05, -5.1602721214294434e-05, -4.464387893676758e-05, -3.768503665924072e-05, -3.072619438171387e-05, -2.3767352104187012e-05, -1.6808509826660156e-05, -9.8496675491333e-06, -2.8908252716064453e-06, 4.06801700592041e-06, 1.1026859283447266e-05, 1.798570156097412e-05, 2.4944543838500977e-05, 3.190338611602783e-05, 3.886222839355469e-05, 4.582107067108154e-05, 5.27799129486084e-05, 5.9738755226135254e-05, 6.669759750366211e-05, 7.365643978118896e-05, 8.061528205871582e-05, 8.757412433624268e-05, 9.453296661376953e-05, 0.00010149180889129639, 0.00010845065116882324, 0.0001154094934463501, 0.00012236833572387695, 0.0001293271780014038, 0.00013628602027893066, 0.00014324486255645752, 0.00015020370483398438, 0.00015716254711151123, 0.00016412138938903809, 0.00017108023166656494, 0.0001780390739440918, 0.00018499791622161865, 0.0001919567584991455, 0.00019891560077667236, 0.00020587444305419922, 0.00021283328533172607, 0.00021979212760925293, 0.00022675096988677979, 0.00023370981216430664, 0.0002406686544418335, 0.00024762749671936035, 0.0002545863389968872, 0.00026154518127441406]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 9.0, 4.0, 9.0, 10.0, 23.0, 32.0, 52.0, 70.0, 160.0, 275.0, 627.0, 1659.0, 5596.0, 30433.0, 661518.0, 319074.0, 21905.0, 4602.0, 1355.0, 597.0, 253.0, 107.0, 68.0, 40.0, 23.0, 14.0, 7.0, 9.0, 10.0, 3.0, 5.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -1.0034866333007812, -0.9747467041015625, -0.9460067749023438, -0.917266845703125, -0.8885269165039062, -0.8597869873046875, -0.8310470581054688, -0.80230712890625, -0.7735671997070312, -0.7448272705078125, -0.7160873413085938, -0.687347412109375, -0.6586074829101562, -0.6298675537109375, -0.6011276245117188, -0.5723876953125, -0.5436477661132812, -0.5149078369140625, -0.48616790771484375, -0.457427978515625, -0.42868804931640625, -0.3999481201171875, -0.37120819091796875, -0.34246826171875, -0.31372833251953125, -0.2849884033203125, -0.25624847412109375, -0.227508544921875, -0.19876861572265625, -0.1700286865234375, -0.14128875732421875, -0.112548828125, -0.08380889892578125, -0.0550689697265625, -0.02632904052734375, 0.002410888671875, 0.03115081787109375, 0.0598907470703125, 0.08863067626953125, 0.11737060546875, 0.14611053466796875, 0.1748504638671875, 0.20359039306640625, 0.232330322265625, 0.26107025146484375, 0.2898101806640625, 0.31855010986328125, 0.3472900390625, 0.37602996826171875, 0.4047698974609375, 0.43350982666015625, 0.462249755859375, 0.49098968505859375, 0.5197296142578125, 0.5484695434570312, 0.57720947265625, 0.6059494018554688, 0.6346893310546875, 0.6634292602539062, 0.692169189453125, 0.7209091186523438, 0.7496490478515625, 0.7783889770507812, 0.80712890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 7.0, 5.0, 9.0, 18.0, 17.0, 28.0, 43.0, 49.0, 67.0, 69.0, 87.0, 94.0, 94.0, 93.0, 58.0, 67.0, 51.0, 33.0, 24.0, 25.0, 11.0, 15.0, 7.0, 6.0, 4.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5266876220703125, -0.504547119140625, -0.4824066162109375, -0.46026611328125, -0.4381256103515625, -0.415985107421875, -0.3938446044921875, -0.3717041015625, -0.3495635986328125, -0.327423095703125, -0.3052825927734375, -0.28314208984375, -0.2610015869140625, -0.238861083984375, -0.2167205810546875, -0.194580078125, -0.1724395751953125, -0.150299072265625, -0.1281585693359375, -0.10601806640625, -0.0838775634765625, -0.061737060546875, -0.0395965576171875, -0.0174560546875, 0.0046844482421875, 0.026824951171875, 0.0489654541015625, 0.07110595703125, 0.0932464599609375, 0.115386962890625, 0.1375274658203125, 0.15966796875, 0.1818084716796875, 0.203948974609375, 0.2260894775390625, 0.24822998046875, 0.2703704833984375, 0.292510986328125, 0.3146514892578125, 0.3367919921875, 0.3589324951171875, 0.381072998046875, 0.4032135009765625, 0.42535400390625, 0.4474945068359375, 0.469635009765625, 0.4917755126953125, 0.513916015625, 0.5360565185546875, 0.558197021484375, 0.5803375244140625, 0.60247802734375, 0.6246185302734375, 0.646759033203125, 0.6688995361328125, 0.6910400390625, 0.7131805419921875, 0.735321044921875, 0.7574615478515625, 0.77960205078125, 0.8017425537109375, 0.823883056640625, 0.8460235595703125, 0.8681640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 12.0, 18.0, 36.0, 70.0, 153.0, 270.0, 281.0, 103.0, 29.0, 10.0, 7.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.917949676513672, -19.180561065673828, -18.443174362182617, -17.705787658691406, -16.968399047851562, -16.23101043701172, -15.493623733520508, -14.75623607635498, -14.018848419189453, -13.281460762023926, -12.544073104858398, -11.806685447692871, -11.069297790527344, -10.331910133361816, -9.594522476196289, -8.857134819030762, -8.119747161865234, -7.382359504699707, -6.64497184753418, -5.907584190368652, -5.170196533203125, -4.432808876037598, -3.6954212188720703, -2.958033561706543, -2.2206459045410156, -1.4832582473754883, -0.7458705902099609, -0.008482933044433594, 0.7289047241210938, 1.466292381286621, 2.2036800384521484, 2.941067695617676, 3.678455352783203, 4.4158430099487305, 5.153230667114258, 5.890618324279785, 6.6280059814453125, 7.36539363861084, 8.102781295776367, 8.840168952941895, 9.577556610107422, 10.31494426727295, 11.052331924438477, 11.789719581604004, 12.527107238769531, 13.264494895935059, 14.001882553100586, 14.739270210266113, 15.47665786743164, 16.214046478271484, 16.951433181762695, 17.688819885253906, 18.42620849609375, 19.163597106933594, 19.900983810424805, 20.638370513916016, 21.37575912475586, 22.113147735595703, 22.850534439086914, 23.587921142578125, 24.32530975341797, 25.062698364257812, 25.800085067749023, 26.537471771240234, 27.274860382080078]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 9.0, 11.0, 12.0, 19.0, 18.0, 22.0, 29.0, 22.0, 26.0, 38.0, 34.0, 54.0, 50.0, 76.0, 73.0, 74.0, 47.0, 47.0, 40.0, 32.0, 30.0, 34.0, 26.0, 21.0, 20.0, 24.0, 20.0, 9.0, 17.0, 6.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.846213340759277, -12.441523551940918, -12.036832809448242, -11.632143020629883, -11.227452278137207, -10.822762489318848, -10.418071746826172, -10.013381958007812, -9.608692169189453, -9.204002380371094, -8.799311637878418, -8.394621849060059, -7.989931106567383, -7.585241317749023, -7.180551052093506, -6.775860786437988, -6.3711700439453125, -5.966479778289795, -5.561789512634277, -5.157099723815918, -4.752408981323242, -4.347719192504883, -3.9430289268493652, -3.5383386611938477, -3.13364839553833, -2.7289581298828125, -2.324267864227295, -1.9195778369903564, -1.5148875713348389, -1.1101973056793213, -0.7055072784423828, -0.30081701278686523, 0.10387229919433594, 0.5085625052452087, 0.9132527112960815, 1.3179428577423096, 1.7226331233978271, 2.1273233890533447, 2.532013416290283, 2.936703681945801, 3.3413939476013184, 3.746084213256836, 4.1507744789123535, 4.555464744567871, 4.9601545333862305, 5.364845275878906, 5.769535064697266, 6.174225330352783, 6.578915596008301, 6.983605861663818, 7.388296127319336, 7.792985916137695, 8.197676658630371, 8.60236644744873, 9.007057189941406, 9.411746978759766, 9.816436767578125, 10.221126556396484, 10.62581729888916, 11.03050708770752, 11.435197830200195, 11.839887619018555, 12.244577407836914, 12.64926815032959, 13.053958892822266]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 7.0, 9.0, 8.0, 20.0, 31.0, 46.0, 55.0, 81.0, 137.0, 203.0, 345.0, 673.0, 1840.0, 6810.0, 77591.0, 1777544.0, 2213455.0, 103583.0, 7827.0, 2149.0, 854.0, 402.0, 224.0, 129.0, 100.0, 51.0, 37.0, 26.0, 21.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91357421875, -0.8755874633789062, -0.8376007080078125, -0.7996139526367188, -0.761627197265625, -0.7236404418945312, -0.6856536865234375, -0.6476669311523438, -0.60968017578125, -0.5716934204101562, -0.5337066650390625, -0.49571990966796875, -0.457733154296875, -0.41974639892578125, -0.3817596435546875, -0.34377288818359375, -0.3057861328125, -0.26779937744140625, -0.2298126220703125, -0.19182586669921875, -0.153839111328125, -0.11585235595703125, -0.0778656005859375, -0.03987884521484375, -0.00189208984375, 0.03609466552734375, 0.0740814208984375, 0.11206817626953125, 0.150054931640625, 0.18804168701171875, 0.2260284423828125, 0.26401519775390625, 0.302001953125, 0.33998870849609375, 0.3779754638671875, 0.41596221923828125, 0.453948974609375, 0.49193572998046875, 0.5299224853515625, 0.5679092407226562, 0.60589599609375, 0.6438827514648438, 0.6818695068359375, 0.7198562622070312, 0.757843017578125, 0.7958297729492188, 0.8338165283203125, 0.8718032836914062, 0.9097900390625, 0.9477767944335938, 0.9857635498046875, 1.0237503051757812, 1.061737060546875, 1.0997238159179688, 1.1377105712890625, 1.1756973266601562, 1.21368408203125, 1.2516708374023438, 1.2896575927734375, 1.3276443481445312, 1.365631103515625, 1.4036178588867188, 1.4416046142578125, 1.4795913696289062, 1.517578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 9.0, 2.0, 7.0, 9.0, 13.0, 20.0, 10.0, 22.0, 20.0, 23.0, 17.0, 24.0, 25.0, 33.0, 35.0, 40.0, 22.0, 47.0, 44.0, 37.0, 43.0, 48.0, 47.0, 30.0, 35.0, 30.0, 40.0, 25.0, 30.0, 26.0, 32.0, 27.0, 22.0, 17.0, 12.0, 15.0, 9.0, 7.0, 6.0, 12.0, 7.0, 6.0, 5.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.69921875, -0.677947998046875, -0.65667724609375, -0.635406494140625, -0.6141357421875, -0.592864990234375, -0.57159423828125, -0.550323486328125, -0.529052734375, -0.507781982421875, -0.48651123046875, -0.465240478515625, -0.4439697265625, -0.422698974609375, -0.40142822265625, -0.380157470703125, -0.35888671875, -0.337615966796875, -0.31634521484375, -0.295074462890625, -0.2738037109375, -0.252532958984375, -0.23126220703125, -0.209991455078125, -0.188720703125, -0.167449951171875, -0.14617919921875, -0.124908447265625, -0.1036376953125, -0.082366943359375, -0.06109619140625, -0.039825439453125, -0.0185546875, 0.002716064453125, 0.02398681640625, 0.045257568359375, 0.0665283203125, 0.087799072265625, 0.10906982421875, 0.130340576171875, 0.151611328125, 0.172882080078125, 0.19415283203125, 0.215423583984375, 0.2366943359375, 0.257965087890625, 0.27923583984375, 0.300506591796875, 0.32177734375, 0.343048095703125, 0.36431884765625, 0.385589599609375, 0.4068603515625, 0.428131103515625, 0.44940185546875, 0.470672607421875, 0.491943359375, 0.513214111328125, 0.53448486328125, 0.555755615234375, 0.5770263671875, 0.598297119140625, 0.61956787109375, 0.640838623046875, 0.662109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 16.0, 33.0, 70.0, 266.0, 1002.0, 4906.0, 4053357.0, 132177.0, 1719.0, 443.0, 163.0, 74.0, 32.0, 14.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.71099853515625, -5.5469970703125, -5.38299560546875, -5.218994140625, -5.05499267578125, -4.8909912109375, -4.72698974609375, -4.56298828125, -4.39898681640625, -4.2349853515625, -4.07098388671875, -3.906982421875, -3.74298095703125, -3.5789794921875, -3.41497802734375, -3.2509765625, -3.08697509765625, -2.9229736328125, -2.75897216796875, -2.594970703125, -2.43096923828125, -2.2669677734375, -2.10296630859375, -1.93896484375, -1.77496337890625, -1.6109619140625, -1.44696044921875, -1.282958984375, -1.11895751953125, -0.9549560546875, -0.79095458984375, -0.626953125, -0.46295166015625, -0.2989501953125, -0.13494873046875, 0.029052734375, 0.19305419921875, 0.3570556640625, 0.52105712890625, 0.68505859375, 0.84906005859375, 1.0130615234375, 1.17706298828125, 1.341064453125, 1.50506591796875, 1.6690673828125, 1.83306884765625, 1.9970703125, 2.16107177734375, 2.3250732421875, 2.48907470703125, 2.653076171875, 2.81707763671875, 2.9810791015625, 3.14508056640625, 3.30908203125, 3.47308349609375, 3.6370849609375, 3.80108642578125, 3.965087890625, 4.12908935546875, 4.2930908203125, 4.45709228515625, 4.62109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 7.0, 13.0, 23.0, 41.0, 171.0, 1095.0, 2088.0, 489.0, 84.0, 28.0, 19.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.83160400390625, -2.7100830078125, -2.58856201171875, -2.467041015625, -2.34552001953125, -2.2239990234375, -2.10247802734375, -1.98095703125, -1.85943603515625, -1.7379150390625, -1.61639404296875, -1.494873046875, -1.37335205078125, -1.2518310546875, -1.13031005859375, -1.0087890625, -0.88726806640625, -0.7657470703125, -0.64422607421875, -0.522705078125, -0.40118408203125, -0.2796630859375, -0.15814208984375, -0.03662109375, 0.08489990234375, 0.2064208984375, 0.32794189453125, 0.449462890625, 0.57098388671875, 0.6925048828125, 0.81402587890625, 0.935546875, 1.05706787109375, 1.1785888671875, 1.30010986328125, 1.421630859375, 1.54315185546875, 1.6646728515625, 1.78619384765625, 1.90771484375, 2.02923583984375, 2.1507568359375, 2.27227783203125, 2.393798828125, 2.51531982421875, 2.6368408203125, 2.75836181640625, 2.8798828125, 3.00140380859375, 3.1229248046875, 3.24444580078125, 3.365966796875, 3.48748779296875, 3.6090087890625, 3.73052978515625, 3.85205078125, 3.97357177734375, 4.0950927734375, 4.21661376953125, 4.338134765625, 4.45965576171875, 4.5811767578125, 4.70269775390625, 4.82421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 26.0, 213.0, 639.0, 92.0, 22.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.84754180908203, -46.53004455566406, -45.21255111694336, -43.89505386352539, -42.57756042480469, -41.26006317138672, -39.942569732666016, -38.62507247924805, -37.307579040527344, -35.990081787109375, -34.67258834838867, -33.3550910949707, -32.03759765625, -30.72010040283203, -29.402605056762695, -28.08510971069336, -26.76761245727539, -25.450117111206055, -24.13262176513672, -22.815126419067383, -21.497631072998047, -20.180133819580078, -18.862638473510742, -17.545143127441406, -16.22764778137207, -14.910152435302734, -13.592657089233398, -12.275160789489746, -10.95766544342041, -9.640170097351074, -8.322673797607422, -7.005178451538086, -5.687679290771484, -4.370183944702148, -3.0526881217956543, -1.7351925373077393, -0.4176969528198242, 0.8997983932495117, 2.217294216156006, 3.5347900390625, 4.852285385131836, 6.169780731201172, 7.487276554107666, 8.80477237701416, 10.122267723083496, 11.439763069152832, 12.757259368896484, 14.07475471496582, 15.392250061035156, 16.709745407104492, 18.027240753173828, 19.344736099243164, 20.6622314453125, 21.97972869873047, 23.297224044799805, 24.61471939086914, 25.932214736938477, 27.249710083007812, 28.56720542907715, 29.884700775146484, 31.202198028564453, 32.519691467285156, 33.837188720703125, 35.154685974121094, 36.4721794128418]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 7.0, 9.0, 15.0, 19.0, 21.0, 36.0, 41.0, 86.0, 70.0, 71.0, 82.0, 90.0, 71.0, 76.0, 74.0, 57.0, 43.0, 44.0, 26.0, 16.0, 13.0, 11.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.046524047851562, -13.661247253417969, -13.275970458984375, -12.890694618225098, -12.505417823791504, -12.12014102935791, -11.734864234924316, -11.349588394165039, -10.964311599731445, -10.579034805297852, -10.193758010864258, -9.80848217010498, -9.423205375671387, -9.037928581237793, -8.6526517868042, -8.267375946044922, -7.88209867477417, -7.496821880340576, -7.111545562744141, -6.726268768310547, -6.340992450714111, -5.955715656280518, -5.570439338684082, -5.185162544250488, -4.7998857498168945, -4.414608955383301, -4.029332637786865, -3.6440558433532715, -3.258779525756836, -2.873502731323242, -2.4882261753082275, -2.102949619293213, -1.7176733016967773, -1.3323967456817627, -0.9471201300621033, -0.5618435144424438, -0.1765669584274292, 0.20870959758758545, 0.5939862728118896, 0.9792628288269043, 1.364539384841919, 1.7498159408569336, 2.1350924968719482, 2.520369052886963, 2.9056458473205566, 3.290922164916992, 3.676198959350586, 4.06147575378418, 4.446752071380615, 4.832028865814209, 5.2173051834106445, 5.602581977844238, 5.987858295440674, 6.373135089874268, 6.758411407470703, 7.143688201904297, 7.528964996337891, 7.914241790771484, 8.299518585205078, 8.684794425964355, 9.07007122039795, 9.455348014831543, 9.840624809265137, 10.225900650024414, 10.611177444458008]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 5.0, 9.0, 13.0, 29.0, 43.0, 55.0, 96.0, 132.0, 164.0, 246.0, 349.0, 530.0, 847.0, 1311.0, 2063.0, 3181.0, 4971.0, 8207.0, 13769.0, 23122.0, 39852.0, 68664.0, 115301.0, 174431.0, 197658.0, 154650.0, 98291.0, 57342.0, 33237.0, 19466.0, 11592.0, 7035.0, 4254.0, 2729.0, 1707.0, 1119.0, 692.0, 450.0, 285.0, 178.0, 145.0, 96.0, 73.0, 42.0, 34.0, 21.0, 16.0, 15.0, 11.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0], "bins": [-0.4794921875, -0.4651069641113281, -0.45072174072265625, -0.4363365173339844, -0.4219512939453125, -0.4075660705566406, -0.39318084716796875, -0.3787956237792969, -0.364410400390625, -0.3500251770019531, -0.33563995361328125, -0.3212547302246094, -0.3068695068359375, -0.2924842834472656, -0.27809906005859375, -0.2637138366699219, -0.24932861328125, -0.23494338989257812, -0.22055816650390625, -0.20617294311523438, -0.1917877197265625, -0.17740249633789062, -0.16301727294921875, -0.14863204956054688, -0.134246826171875, -0.11986160278320312, -0.10547637939453125, -0.09109115600585938, -0.0767059326171875, -0.062320709228515625, -0.04793548583984375, -0.033550262451171875, -0.0191650390625, -0.004779815673828125, 0.00960540771484375, 0.023990631103515625, 0.0383758544921875, 0.052761077880859375, 0.06714630126953125, 0.08153152465820312, 0.095916748046875, 0.11030197143554688, 0.12468719482421875, 0.13907241821289062, 0.1534576416015625, 0.16784286499023438, 0.18222808837890625, 0.19661331176757812, 0.21099853515625, 0.22538375854492188, 0.23976898193359375, 0.2541542053222656, 0.2685394287109375, 0.2829246520996094, 0.29730987548828125, 0.3116950988769531, 0.326080322265625, 0.3404655456542969, 0.35485076904296875, 0.3692359924316406, 0.3836212158203125, 0.3980064392089844, 0.41239166259765625, 0.4267768859863281, 0.441162109375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 11.0, 7.0, 16.0, 9.0, 16.0, 21.0, 16.0, 24.0, 30.0, 20.0, 31.0, 30.0, 40.0, 50.0, 41.0, 31.0, 35.0, 42.0, 35.0, 38.0, 47.0, 37.0, 36.0, 37.0, 33.0, 38.0, 27.0, 27.0, 32.0, 32.0, 10.0, 13.0, 6.0, 14.0, 10.0, 8.0, 4.0, 6.0, 5.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.74365234375, -0.7215423583984375, -0.699432373046875, -0.6773223876953125, -0.65521240234375, -0.6331024169921875, -0.610992431640625, -0.5888824462890625, -0.5667724609375, -0.5446624755859375, -0.522552490234375, -0.5004425048828125, -0.47833251953125, -0.4562225341796875, -0.434112548828125, -0.4120025634765625, -0.389892578125, -0.3677825927734375, -0.345672607421875, -0.3235626220703125, -0.30145263671875, -0.2793426513671875, -0.257232666015625, -0.2351226806640625, -0.2130126953125, -0.1909027099609375, -0.168792724609375, -0.1466827392578125, -0.12457275390625, -0.1024627685546875, -0.080352783203125, -0.0582427978515625, -0.0361328125, -0.0140228271484375, 0.008087158203125, 0.0301971435546875, 0.05230712890625, 0.0744171142578125, 0.096527099609375, 0.1186370849609375, 0.1407470703125, 0.1628570556640625, 0.184967041015625, 0.2070770263671875, 0.22918701171875, 0.2512969970703125, 0.273406982421875, 0.2955169677734375, 0.317626953125, 0.3397369384765625, 0.361846923828125, 0.3839569091796875, 0.40606689453125, 0.4281768798828125, 0.450286865234375, 0.4723968505859375, 0.4945068359375, 0.5166168212890625, 0.538726806640625, 0.5608367919921875, 0.58294677734375, 0.6050567626953125, 0.627166748046875, 0.6492767333984375, 0.67138671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 5.0, 4.0, 9.0, 11.0, 13.0, 14.0, 16.0, 34.0, 56.0, 81.0, 123.0, 188.0, 345.0, 865.0, 2429.0, 10546.0, 70587.0, 638114.0, 280084.0, 35726.0, 6230.0, 1659.0, 618.0, 315.0, 158.0, 102.0, 62.0, 43.0, 29.0, 17.0, 17.0, 16.0, 11.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.037109375, -1.9786224365234375, -1.920135498046875, -1.8616485595703125, -1.80316162109375, -1.7446746826171875, -1.686187744140625, -1.6277008056640625, -1.5692138671875, -1.5107269287109375, -1.452239990234375, -1.3937530517578125, -1.33526611328125, -1.2767791748046875, -1.218292236328125, -1.1598052978515625, -1.101318359375, -1.0428314208984375, -0.984344482421875, -0.9258575439453125, -0.86737060546875, -0.8088836669921875, -0.750396728515625, -0.6919097900390625, -0.6334228515625, -0.5749359130859375, -0.516448974609375, -0.4579620361328125, -0.39947509765625, -0.3409881591796875, -0.282501220703125, -0.2240142822265625, -0.16552734375, -0.1070404052734375, -0.048553466796875, 0.0099334716796875, 0.06842041015625, 0.1269073486328125, 0.185394287109375, 0.2438812255859375, 0.3023681640625, 0.3608551025390625, 0.419342041015625, 0.4778289794921875, 0.53631591796875, 0.5948028564453125, 0.653289794921875, 0.7117767333984375, 0.770263671875, 0.8287506103515625, 0.887237548828125, 0.9457244873046875, 1.00421142578125, 1.0626983642578125, 1.121185302734375, 1.1796722412109375, 1.2381591796875, 1.2966461181640625, 1.355133056640625, 1.4136199951171875, 1.47210693359375, 1.5305938720703125, 1.589080810546875, 1.6475677490234375, 1.7060546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 13.0, 18.0, 18.0, 26.0, 28.0, 26.0, 30.0, 31.0, 32.0, 39.0, 39.0, 41.0, 52.0, 46.0, 50.0, 54.0, 41.0, 41.0, 41.0, 46.0, 45.0, 37.0, 23.0, 38.0, 20.0, 19.0, 19.0, 13.0, 15.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.6328125, -2.546905517578125, -2.46099853515625, -2.375091552734375, -2.2891845703125, -2.203277587890625, -2.11737060546875, -2.031463623046875, -1.945556640625, -1.859649658203125, -1.77374267578125, -1.687835693359375, -1.6019287109375, -1.516021728515625, -1.43011474609375, -1.344207763671875, -1.25830078125, -1.172393798828125, -1.08648681640625, -1.000579833984375, -0.9146728515625, -0.828765869140625, -0.74285888671875, -0.656951904296875, -0.571044921875, -0.485137939453125, -0.39923095703125, -0.313323974609375, -0.2274169921875, -0.141510009765625, -0.05560302734375, 0.030303955078125, 0.1162109375, 0.202117919921875, 0.28802490234375, 0.373931884765625, 0.4598388671875, 0.545745849609375, 0.63165283203125, 0.717559814453125, 0.803466796875, 0.889373779296875, 0.97528076171875, 1.061187744140625, 1.1470947265625, 1.233001708984375, 1.31890869140625, 1.404815673828125, 1.49072265625, 1.576629638671875, 1.66253662109375, 1.748443603515625, 1.8343505859375, 1.920257568359375, 2.00616455078125, 2.092071533203125, 2.177978515625, 2.263885498046875, 2.34979248046875, 2.435699462890625, 2.5216064453125, 2.607513427734375, 2.69342041015625, 2.779327392578125, 2.865234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 3.0, 6.0, 14.0, 16.0, 21.0, 42.0, 68.0, 91.0, 151.0, 231.0, 401.0, 633.0, 1202.0, 2253.0, 4658.0, 10123.0, 24078.0, 61860.0, 172050.0, 508251.0, 162112.0, 58617.0, 22636.0, 9529.0, 4464.0, 2147.0, 1175.0, 651.0, 361.0, 241.0, 145.0, 106.0, 68.0, 37.0, 36.0, 19.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2491455078125, -0.2409687042236328, -0.23279190063476562, -0.22461509704589844, -0.21643829345703125, -0.20826148986816406, -0.20008468627929688, -0.1919078826904297, -0.1837310791015625, -0.1755542755126953, -0.16737747192382812, -0.15920066833496094, -0.15102386474609375, -0.14284706115722656, -0.13467025756835938, -0.1264934539794922, -0.118316650390625, -0.11013984680175781, -0.10196304321289062, -0.09378623962402344, -0.08560943603515625, -0.07743263244628906, -0.06925582885742188, -0.06107902526855469, -0.0529022216796875, -0.04472541809082031, -0.036548614501953125, -0.028371810913085938, -0.02019500732421875, -0.012018203735351562, -0.003841400146484375, 0.0043354034423828125, 0.01251220703125, 0.020689010620117188, 0.028865814208984375, 0.03704261779785156, 0.04521942138671875, 0.05339622497558594, 0.061573028564453125, 0.06974983215332031, 0.0779266357421875, 0.08610343933105469, 0.09428024291992188, 0.10245704650878906, 0.11063385009765625, 0.11881065368652344, 0.12698745727539062, 0.1351642608642578, 0.143341064453125, 0.1515178680419922, 0.15969467163085938, 0.16787147521972656, 0.17604827880859375, 0.18422508239746094, 0.19240188598632812, 0.2005786895751953, 0.2087554931640625, 0.2169322967529297, 0.22510910034179688, 0.23328590393066406, 0.24146270751953125, 0.24963951110839844, 0.2578163146972656, 0.2659931182861328, 0.274169921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 4.0, 7.0, 14.0, 12.0, 14.0, 26.0, 23.0, 30.0, 45.0, 59.0, 87.0, 103.0, 91.0, 88.0, 82.0, 69.0, 56.0, 45.0, 36.0, 29.0, 15.0, 12.0, 11.0, 9.0, 8.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013113021850585938, -0.00012723542749881744, -0.0001233406364917755, -0.00011944584548473358, -0.00011555105447769165, -0.00011165626347064972, -0.00010776147246360779, -0.00010386668145656586, -9.997189044952393e-05, -9.6077099442482e-05, -9.218230843544006e-05, -8.828751742839813e-05, -8.43927264213562e-05, -8.049793541431427e-05, -7.660314440727234e-05, -7.270835340023041e-05, -6.881356239318848e-05, -6.491877138614655e-05, -6.1023980379104614e-05, -5.712918937206268e-05, -5.323439836502075e-05, -4.933960735797882e-05, -4.544481635093689e-05, -4.155002534389496e-05, -3.765523433685303e-05, -3.3760443329811096e-05, -2.9865652322769165e-05, -2.5970861315727234e-05, -2.2076070308685303e-05, -1.818127930164337e-05, -1.428648829460144e-05, -1.039169728755951e-05, -6.496906280517578e-06, -2.602115273475647e-06, 1.2926757335662842e-06, 5.187466740608215e-06, 9.082257747650146e-06, 1.2977048754692078e-05, 1.687183976173401e-05, 2.076663076877594e-05, 2.466142177581787e-05, 2.8556212782859802e-05, 3.2451003789901733e-05, 3.6345794796943665e-05, 4.0240585803985596e-05, 4.413537681102753e-05, 4.803016781806946e-05, 5.192495882511139e-05, 5.581974983215332e-05, 5.971454083919525e-05, 6.360933184623718e-05, 6.750412285327911e-05, 7.139891386032104e-05, 7.529370486736298e-05, 7.918849587440491e-05, 8.308328688144684e-05, 8.697807788848877e-05, 9.08728688955307e-05, 9.476765990257263e-05, 9.866245090961456e-05, 0.0001025572419166565, 0.00010645203292369843, 0.00011034682393074036, 0.00011424161493778229, 0.00011813640594482422]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 5.0, 9.0, 9.0, 20.0, 28.0, 25.0, 66.0, 108.0, 184.0, 322.0, 778.0, 2110.0, 6778.0, 27587.0, 136189.0, 632547.0, 190330.0, 38166.0, 8905.0, 2586.0, 892.0, 380.0, 203.0, 121.0, 73.0, 28.0, 31.0, 26.0, 9.0, 14.0, 7.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.50390625, -0.49085235595703125, -0.4777984619140625, -0.46474456787109375, -0.451690673828125, -0.43863677978515625, -0.4255828857421875, -0.41252899169921875, -0.39947509765625, -0.38642120361328125, -0.3733673095703125, -0.36031341552734375, -0.347259521484375, -0.33420562744140625, -0.3211517333984375, -0.30809783935546875, -0.2950439453125, -0.28199005126953125, -0.2689361572265625, -0.25588226318359375, -0.242828369140625, -0.22977447509765625, -0.2167205810546875, -0.20366668701171875, -0.19061279296875, -0.17755889892578125, -0.1645050048828125, -0.15145111083984375, -0.138397216796875, -0.12534332275390625, -0.1122894287109375, -0.09923553466796875, -0.086181640625, -0.07312774658203125, -0.0600738525390625, -0.04701995849609375, -0.033966064453125, -0.02091217041015625, -0.0078582763671875, 0.00519561767578125, 0.01824951171875, 0.03130340576171875, 0.0443572998046875, 0.05741119384765625, 0.070465087890625, 0.08351898193359375, 0.0965728759765625, 0.10962677001953125, 0.1226806640625, 0.13573455810546875, 0.1487884521484375, 0.16184234619140625, 0.174896240234375, 0.18795013427734375, 0.2010040283203125, 0.21405792236328125, 0.22711181640625, 0.24016571044921875, 0.2532196044921875, 0.26627349853515625, 0.279327392578125, 0.29238128662109375, 0.3054351806640625, 0.31848907470703125, 0.33154296875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 3.0, 6.0, 12.0, 5.0, 10.0, 21.0, 14.0, 32.0, 23.0, 44.0, 36.0, 34.0, 55.0, 53.0, 79.0, 59.0, 69.0, 72.0, 58.0, 56.0, 37.0, 48.0, 33.0, 28.0, 24.0, 17.0, 17.0, 10.0, 9.0, 7.0, 5.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.458984375, -0.4465827941894531, -0.43418121337890625, -0.4217796325683594, -0.4093780517578125, -0.3969764709472656, -0.38457489013671875, -0.3721733093261719, -0.359771728515625, -0.3473701477050781, -0.33496856689453125, -0.3225669860839844, -0.3101654052734375, -0.2977638244628906, -0.28536224365234375, -0.2729606628417969, -0.26055908203125, -0.24815750122070312, -0.23575592041015625, -0.22335433959960938, -0.2109527587890625, -0.19855117797851562, -0.18614959716796875, -0.17374801635742188, -0.161346435546875, -0.14894485473632812, -0.13654327392578125, -0.12414169311523438, -0.1117401123046875, -0.09933853149414062, -0.08693695068359375, -0.07453536987304688, -0.0621337890625, -0.049732208251953125, -0.03733062744140625, -0.024929046630859375, -0.0125274658203125, -0.000125885009765625, 0.01227569580078125, 0.024677276611328125, 0.037078857421875, 0.049480438232421875, 0.06188201904296875, 0.07428359985351562, 0.0866851806640625, 0.09908676147460938, 0.11148834228515625, 0.12388992309570312, 0.13629150390625, 0.14869308471679688, 0.16109466552734375, 0.17349624633789062, 0.1858978271484375, 0.19829940795898438, 0.21070098876953125, 0.22310256958007812, 0.235504150390625, 0.24790573120117188, 0.26030731201171875, 0.2727088928222656, 0.2851104736328125, 0.2975120544433594, 0.30991363525390625, 0.3223152160644531, 0.334716796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 10.0, 6.0, 12.0, 34.0, 70.0, 114.0, 243.0, 258.0, 139.0, 53.0, 27.0, 9.0, 12.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.426286697387695, -20.980152130126953, -20.534015655517578, -20.087881088256836, -19.641746520996094, -19.19561004638672, -18.749475479125977, -18.303340911865234, -17.857206344604492, -17.41107177734375, -16.964935302734375, -16.518800735473633, -16.07266616821289, -15.626530647277832, -15.180395126342773, -14.734260559082031, -14.288124084472656, -13.841988563537598, -13.395853996276855, -12.949718475341797, -12.503583908081055, -12.057448387145996, -11.611312866210938, -11.165178298950195, -10.719043731689453, -10.272908210754395, -9.826773643493652, -9.380638122558594, -8.934503555297852, -8.488368034362793, -8.042232513427734, -7.596097946166992, -7.149962902069092, -6.703827857971191, -6.257692813873291, -5.811557769775391, -5.365422248840332, -4.919287204742432, -4.473152160644531, -4.027016639709473, -3.5808818340301514, -3.134746789932251, -2.6886115074157715, -2.242476463317871, -1.7963413000106812, -1.3502061367034912, -0.9040710926055908, -0.45793581008911133, -0.011800765991210938, 0.4343343675136566, 0.8804695010185242, 1.3266046047210693, 1.7727397680282593, 2.218874931335449, 2.6650099754333496, 3.111145257949829, 3.5572803020477295, 4.003415584564209, 4.449550628662109, 4.89568567276001, 5.34182071685791, 5.787956237792969, 6.234090805053711, 6.6802263259887695, 7.12636137008667]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 10.0, 16.0, 15.0, 20.0, 28.0, 17.0, 22.0, 36.0, 39.0, 27.0, 27.0, 50.0, 53.0, 74.0, 84.0, 82.0, 59.0, 34.0, 38.0, 37.0, 30.0, 33.0, 26.0, 20.0, 17.0, 13.0, 8.0, 20.0, 10.0, 6.0, 5.0, 6.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.30596923828125, -12.929471969604492, -12.55297565460205, -12.176478385925293, -11.799982070922852, -11.423484802246094, -11.046987533569336, -10.670491218566895, -10.293994903564453, -9.917497634887695, -9.541001319885254, -9.164504051208496, -8.788007736206055, -8.411510467529297, -8.035013198852539, -7.658516883850098, -7.28201961517334, -6.90552282333374, -6.529026031494141, -6.152528762817383, -5.776032447814941, -5.399535179138184, -5.023038387298584, -4.646541595458984, -4.270044803619385, -3.893548011779785, -3.5170512199401855, -3.140554189682007, -2.7640573978424072, -2.3875606060028076, -2.011063575744629, -1.6345667839050293, -1.2580690383911133, -0.8815721869468689, -0.5050753355026245, -0.12857842445373535, 0.24791836738586426, 0.6244151592254639, 1.0009121894836426, 1.3774089813232422, 1.7539057731628418, 2.1304025650024414, 2.506899356842041, 2.8833963871002197, 3.2598931789398193, 3.636389970779419, 4.012887001037598, 4.389383792877197, 4.765880584716797, 5.1423773765563965, 5.518874168395996, 5.895371437072754, 6.271867752075195, 6.648365020751953, 7.024861812591553, 7.401358604431152, 7.777855396270752, 8.154352188110352, 8.53084945678711, 8.90734577178955, 9.283843040466309, 9.66033935546875, 10.036836624145508, 10.413333892822266, 10.789830207824707]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 14.0, 13.0, 17.0, 17.0, 22.0, 28.0, 56.0, 58.0, 88.0, 155.0, 254.0, 363.0, 699.0, 1430.0, 3162.0, 8168.0, 33958.0, 188740.0, 1014218.0, 2084151.0, 710856.0, 115405.0, 21214.0, 5914.0, 2407.0, 1187.0, 617.0, 341.0, 214.0, 143.0, 78.0, 62.0, 49.0, 33.0, 27.0, 22.0, 10.0, 17.0, 6.0, 6.0, 8.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0], "bins": [-0.62841796875, -0.6083908081054688, -0.5883636474609375, -0.5683364868164062, -0.548309326171875, -0.5282821655273438, -0.5082550048828125, -0.48822784423828125, -0.46820068359375, -0.44817352294921875, -0.4281463623046875, -0.40811920166015625, -0.388092041015625, -0.36806488037109375, -0.3480377197265625, -0.32801055908203125, -0.3079833984375, -0.28795623779296875, -0.2679290771484375, -0.24790191650390625, -0.227874755859375, -0.20784759521484375, -0.1878204345703125, -0.16779327392578125, -0.14776611328125, -0.12773895263671875, -0.1077117919921875, -0.08768463134765625, -0.067657470703125, -0.04763031005859375, -0.0276031494140625, -0.00757598876953125, 0.012451171875, 0.03247833251953125, 0.0525054931640625, 0.07253265380859375, 0.092559814453125, 0.11258697509765625, 0.1326141357421875, 0.15264129638671875, 0.17266845703125, 0.19269561767578125, 0.2127227783203125, 0.23274993896484375, 0.252777099609375, 0.27280426025390625, 0.2928314208984375, 0.31285858154296875, 0.3328857421875, 0.35291290283203125, 0.3729400634765625, 0.39296722412109375, 0.412994384765625, 0.43302154541015625, 0.4530487060546875, 0.47307586669921875, 0.49310302734375, 0.5131301879882812, 0.5331573486328125, 0.5531845092773438, 0.573211669921875, 0.5932388305664062, 0.6132659912109375, 0.6332931518554688, 0.6533203125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 9.0, 8.0, 10.0, 13.0, 11.0, 16.0, 20.0, 27.0, 21.0, 30.0, 29.0, 35.0, 50.0, 46.0, 41.0, 42.0, 40.0, 37.0, 52.0, 43.0, 37.0, 32.0, 28.0, 40.0, 37.0, 24.0, 41.0, 30.0, 24.0, 17.0, 19.0, 15.0, 11.0, 12.0, 8.0, 5.0, 8.0, 5.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.72119140625, -0.6995468139648438, -0.6779022216796875, -0.6562576293945312, -0.634613037109375, -0.6129684448242188, -0.5913238525390625, -0.5696792602539062, -0.54803466796875, -0.5263900756835938, -0.5047454833984375, -0.48310089111328125, -0.461456298828125, -0.43981170654296875, -0.4181671142578125, -0.39652252197265625, -0.3748779296875, -0.35323333740234375, -0.3315887451171875, -0.30994415283203125, -0.288299560546875, -0.26665496826171875, -0.2450103759765625, -0.22336578369140625, -0.20172119140625, -0.18007659912109375, -0.1584320068359375, -0.13678741455078125, -0.115142822265625, -0.09349822998046875, -0.0718536376953125, -0.05020904541015625, -0.028564453125, -0.00691986083984375, 0.0147247314453125, 0.03636932373046875, 0.058013916015625, 0.07965850830078125, 0.1013031005859375, 0.12294769287109375, 0.14459228515625, 0.16623687744140625, 0.1878814697265625, 0.20952606201171875, 0.231170654296875, 0.25281524658203125, 0.2744598388671875, 0.29610443115234375, 0.3177490234375, 0.33939361572265625, 0.3610382080078125, 0.38268280029296875, 0.404327392578125, 0.42597198486328125, 0.4476165771484375, 0.46926116943359375, 0.49090576171875, 0.5125503540039062, 0.5341949462890625, 0.5558395385742188, 0.577484130859375, 0.5991287231445312, 0.6207733154296875, 0.6424179077148438, 0.6640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 8.0, 16.0, 25.0, 37.0, 60.0, 168.0, 487.0, 2074.0, 22792.0, 3977354.0, 184984.0, 4921.0, 839.0, 263.0, 125.0, 47.0, 29.0, 17.0, 10.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.959686279296875, -2.87445068359375, -2.789215087890625, -2.7039794921875, -2.618743896484375, -2.53350830078125, -2.448272705078125, -2.363037109375, -2.277801513671875, -2.19256591796875, -2.107330322265625, -2.0220947265625, -1.936859130859375, -1.85162353515625, -1.766387939453125, -1.68115234375, -1.595916748046875, -1.51068115234375, -1.425445556640625, -1.3402099609375, -1.254974365234375, -1.16973876953125, -1.084503173828125, -0.999267578125, -0.914031982421875, -0.82879638671875, -0.743560791015625, -0.6583251953125, -0.573089599609375, -0.48785400390625, -0.402618408203125, -0.3173828125, -0.232147216796875, -0.14691162109375, -0.061676025390625, 0.0235595703125, 0.108795166015625, 0.19403076171875, 0.279266357421875, 0.364501953125, 0.449737548828125, 0.53497314453125, 0.620208740234375, 0.7054443359375, 0.790679931640625, 0.87591552734375, 0.961151123046875, 1.04638671875, 1.131622314453125, 1.21685791015625, 1.302093505859375, 1.3873291015625, 1.472564697265625, 1.55780029296875, 1.643035888671875, 1.728271484375, 1.813507080078125, 1.89874267578125, 1.983978271484375, 2.0692138671875, 2.154449462890625, 2.23968505859375, 2.324920654296875, 2.41015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 12.0, 7.0, 20.0, 29.0, 49.0, 69.0, 155.0, 326.0, 586.0, 826.0, 834.0, 508.0, 287.0, 150.0, 83.0, 42.0, 25.0, 15.0, 11.0, 15.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.236053466796875, -1.19183349609375, -1.147613525390625, -1.1033935546875, -1.059173583984375, -1.01495361328125, -0.970733642578125, -0.926513671875, -0.882293701171875, -0.83807373046875, -0.793853759765625, -0.7496337890625, -0.705413818359375, -0.66119384765625, -0.616973876953125, -0.57275390625, -0.528533935546875, -0.48431396484375, -0.440093994140625, -0.3958740234375, -0.351654052734375, -0.30743408203125, -0.263214111328125, -0.218994140625, -0.174774169921875, -0.13055419921875, -0.086334228515625, -0.0421142578125, 0.002105712890625, 0.04632568359375, 0.090545654296875, 0.134765625, 0.178985595703125, 0.22320556640625, 0.267425537109375, 0.3116455078125, 0.355865478515625, 0.40008544921875, 0.444305419921875, 0.488525390625, 0.532745361328125, 0.57696533203125, 0.621185302734375, 0.6654052734375, 0.709625244140625, 0.75384521484375, 0.798065185546875, 0.84228515625, 0.886505126953125, 0.93072509765625, 0.974945068359375, 1.0191650390625, 1.063385009765625, 1.10760498046875, 1.151824951171875, 1.196044921875, 1.240264892578125, 1.28448486328125, 1.328704833984375, 1.3729248046875, 1.417144775390625, 1.46136474609375, 1.505584716796875, 1.5498046875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 10.0, 8.0, 15.0, 28.0, 50.0, 94.0, 136.0, 187.0, 178.0, 135.0, 72.0, 41.0, 18.0, 13.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.531072616577148, -6.243812561035156, -5.956552028656006, -5.6692914962768555, -5.382031440734863, -5.094771385192871, -4.807510852813721, -4.52025032043457, -4.232990264892578, -3.945729970932007, -3.6584696769714355, -3.3712093830108643, -3.083949089050293, -2.7966887950897217, -2.5094285011291504, -2.222168207168579, -1.9349079132080078, -1.6476476192474365, -1.3603873252868652, -1.073127031326294, -0.7858667373657227, -0.49860644340515137, -0.21134614944458008, 0.07591414451599121, 0.3631744384765625, 0.6504347324371338, 0.9376950263977051, 1.2249553203582764, 1.5122156143188477, 1.799475908279419, 2.0867362022399902, 2.3739964962005615, 2.661256790161133, 2.948517084121704, 3.2357773780822754, 3.5230376720428467, 3.810297966003418, 4.09755802154541, 4.3848185539245605, 4.672079086303711, 4.959339141845703, 5.246599197387695, 5.533859729766846, 5.821120262145996, 6.108380317687988, 6.3956403732299805, 6.682900905609131, 6.970161437988281, 7.257421493530273, 7.544681549072266, 7.831942081451416, 8.119202613830566, 8.406462669372559, 8.69372272491455, 8.98098373413086, 9.268243789672852, 9.555503845214844, 9.842763900756836, 10.130023956298828, 10.417284965515137, 10.704545021057129, 10.991805076599121, 11.27906608581543, 11.566326141357422, 11.853586196899414]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 7.0, 9.0, 10.0, 19.0, 21.0, 21.0, 27.0, 26.0, 30.0, 37.0, 44.0, 43.0, 56.0, 55.0, 41.0, 60.0, 59.0, 38.0, 58.0, 44.0, 35.0, 32.0, 33.0, 26.0, 35.0, 18.0, 23.0, 16.0, 10.0, 13.0, 11.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.750917434692383, -4.580790996551514, -4.4106645584106445, -4.240538120269775, -4.070411682128906, -3.900285243988037, -3.730158567428589, -3.5600321292877197, -3.3899056911468506, -3.2197792530059814, -3.0496528148651123, -2.879526138305664, -2.709399700164795, -2.539273262023926, -2.3691468238830566, -2.1990203857421875, -2.0288939476013184, -1.8587675094604492, -1.68864107131958, -1.5185145139694214, -1.3483880758285522, -1.178261637687683, -1.0081350803375244, -0.8380086421966553, -0.6678822040557861, -0.4977557361125946, -0.3276292681694031, -0.15750277042388916, 0.01262366771697998, 0.18275010585784912, 0.3528766632080078, 0.523003101348877, 0.6931295394897461, 0.8632559776306152, 1.0333824157714844, 1.203508973121643, 1.3736354112625122, 1.5437618494033813, 1.71388840675354, 1.8840148448944092, 2.0541412830352783, 2.2242677211761475, 2.3943941593170166, 2.564520835876465, 2.734647274017334, 2.904773712158203, 3.0749001502990723, 3.2450265884399414, 3.4151530265808105, 3.5852794647216797, 3.755405902862549, 3.925532341003418, 4.095658779144287, 4.265785217285156, 4.435912132263184, 4.6060380935668945, 4.776165008544922, 4.946291446685791, 5.11641788482666, 5.286544322967529, 5.456670761108398, 5.626797199249268, 5.796923637390137, 5.967050552368164, 6.137176513671875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 7.0, 7.0, 15.0, 17.0, 18.0, 42.0, 50.0, 81.0, 126.0, 207.0, 304.0, 458.0, 775.0, 1191.0, 1861.0, 3169.0, 5061.0, 9008.0, 15686.0, 28179.0, 52291.0, 98586.0, 177618.0, 240454.0, 184469.0, 103816.0, 55608.0, 29973.0, 16310.0, 9311.0, 5285.0, 3271.0, 1985.0, 1209.0, 719.0, 481.0, 317.0, 219.0, 127.0, 90.0, 68.0, 31.0, 23.0, 11.0, 16.0, 7.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.42148590087890625, -0.4049835205078125, -0.38848114013671875, -0.371978759765625, -0.35547637939453125, -0.3389739990234375, -0.32247161865234375, -0.30596923828125, -0.28946685791015625, -0.2729644775390625, -0.25646209716796875, -0.239959716796875, -0.22345733642578125, -0.2069549560546875, -0.19045257568359375, -0.1739501953125, -0.15744781494140625, -0.1409454345703125, -0.12444305419921875, -0.107940673828125, -0.09143829345703125, -0.0749359130859375, -0.05843353271484375, -0.04193115234375, -0.02542877197265625, -0.0089263916015625, 0.00757598876953125, 0.024078369140625, 0.04058074951171875, 0.0570831298828125, 0.07358551025390625, 0.090087890625, 0.10659027099609375, 0.1230926513671875, 0.13959503173828125, 0.156097412109375, 0.17259979248046875, 0.1891021728515625, 0.20560455322265625, 0.22210693359375, 0.23860931396484375, 0.2551116943359375, 0.27161407470703125, 0.288116455078125, 0.30461883544921875, 0.3211212158203125, 0.33762359619140625, 0.3541259765625, 0.37062835693359375, 0.3871307373046875, 0.40363311767578125, 0.420135498046875, 0.43663787841796875, 0.4531402587890625, 0.46964263916015625, 0.48614501953125, 0.5026473999023438, 0.5191497802734375, 0.5356521606445312, 0.552154541015625, 0.5686569213867188, 0.5851593017578125, 0.6016616821289062, 0.6181640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 11.0, 12.0, 14.0, 19.0, 20.0, 34.0, 27.0, 30.0, 32.0, 44.0, 40.0, 54.0, 46.0, 47.0, 36.0, 47.0, 38.0, 37.0, 33.0, 36.0, 46.0, 41.0, 34.0, 30.0, 31.0, 17.0, 15.0, 19.0, 16.0, 11.0, 11.0, 9.0, 8.0, 8.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.74267578125, -0.7204360961914062, -0.6981964111328125, -0.6759567260742188, -0.653717041015625, -0.6314773559570312, -0.6092376708984375, -0.5869979858398438, -0.56475830078125, -0.5425186157226562, -0.5202789306640625, -0.49803924560546875, -0.475799560546875, -0.45355987548828125, -0.4313201904296875, -0.40908050537109375, -0.3868408203125, -0.36460113525390625, -0.3423614501953125, -0.32012176513671875, -0.297882080078125, -0.27564239501953125, -0.2534027099609375, -0.23116302490234375, -0.20892333984375, -0.18668365478515625, -0.1644439697265625, -0.14220428466796875, -0.119964599609375, -0.09772491455078125, -0.0754852294921875, -0.05324554443359375, -0.031005859375, -0.00876617431640625, 0.0134735107421875, 0.03571319580078125, 0.057952880859375, 0.08019256591796875, 0.1024322509765625, 0.12467193603515625, 0.14691162109375, 0.16915130615234375, 0.1913909912109375, 0.21363067626953125, 0.235870361328125, 0.25811004638671875, 0.2803497314453125, 0.30258941650390625, 0.3248291015625, 0.34706878662109375, 0.3693084716796875, 0.39154815673828125, 0.413787841796875, 0.43602752685546875, 0.4582672119140625, 0.48050689697265625, 0.50274658203125, 0.5249862670898438, 0.5472259521484375, 0.5694656372070312, 0.591705322265625, 0.6139450073242188, 0.6361846923828125, 0.6584243774414062, 0.6806640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 8.0, 24.0, 22.0, 22.0, 34.0, 40.0, 55.0, 81.0, 102.0, 132.0, 232.0, 354.0, 610.0, 1221.0, 3384.0, 13719.0, 86053.0, 726584.0, 181863.0, 24817.0, 5309.0, 1760.0, 815.0, 438.0, 242.0, 170.0, 113.0, 87.0, 76.0, 53.0, 32.0, 30.0, 20.0, 13.0, 10.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40625, -1.3535308837890625, -1.300811767578125, -1.2480926513671875, -1.19537353515625, -1.1426544189453125, -1.089935302734375, -1.0372161865234375, -0.9844970703125, -0.9317779541015625, -0.879058837890625, -0.8263397216796875, -0.77362060546875, -0.7209014892578125, -0.668182373046875, -0.6154632568359375, -0.562744140625, -0.5100250244140625, -0.457305908203125, -0.4045867919921875, -0.35186767578125, -0.2991485595703125, -0.246429443359375, -0.1937103271484375, -0.1409912109375, -0.0882720947265625, -0.035552978515625, 0.0171661376953125, 0.06988525390625, 0.1226043701171875, 0.175323486328125, 0.2280426025390625, 0.28076171875, 0.3334808349609375, 0.386199951171875, 0.4389190673828125, 0.49163818359375, 0.5443572998046875, 0.597076416015625, 0.6497955322265625, 0.7025146484375, 0.7552337646484375, 0.807952880859375, 0.8606719970703125, 0.91339111328125, 0.9661102294921875, 1.018829345703125, 1.0715484619140625, 1.124267578125, 1.1769866943359375, 1.229705810546875, 1.2824249267578125, 1.33514404296875, 1.3878631591796875, 1.440582275390625, 1.4933013916015625, 1.5460205078125, 1.5987396240234375, 1.651458740234375, 1.7041778564453125, 1.75689697265625, 1.8096160888671875, 1.862335205078125, 1.9150543212890625, 1.9677734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 5.0, 8.0, 4.0, 11.0, 13.0, 13.0, 24.0, 12.0, 19.0, 28.0, 28.0, 46.0, 54.0, 46.0, 50.0, 56.0, 39.0, 53.0, 54.0, 48.0, 50.0, 53.0, 35.0, 41.0, 26.0, 42.0, 20.0, 16.0, 17.0, 9.0, 18.0, 11.0, 6.0, 5.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.292694091796875, -2.21624755859375, -2.139801025390625, -2.0633544921875, -1.986907958984375, -1.91046142578125, -1.834014892578125, -1.757568359375, -1.681121826171875, -1.60467529296875, -1.528228759765625, -1.4517822265625, -1.375335693359375, -1.29888916015625, -1.222442626953125, -1.14599609375, -1.069549560546875, -0.99310302734375, -0.916656494140625, -0.8402099609375, -0.763763427734375, -0.68731689453125, -0.610870361328125, -0.534423828125, -0.457977294921875, -0.38153076171875, -0.305084228515625, -0.2286376953125, -0.152191162109375, -0.07574462890625, 0.000701904296875, 0.0771484375, 0.153594970703125, 0.23004150390625, 0.306488037109375, 0.3829345703125, 0.459381103515625, 0.53582763671875, 0.612274169921875, 0.688720703125, 0.765167236328125, 0.84161376953125, 0.918060302734375, 0.9945068359375, 1.070953369140625, 1.14739990234375, 1.223846435546875, 1.30029296875, 1.376739501953125, 1.45318603515625, 1.529632568359375, 1.6060791015625, 1.682525634765625, 1.75897216796875, 1.835418701171875, 1.911865234375, 1.988311767578125, 2.06475830078125, 2.141204833984375, 2.2176513671875, 2.294097900390625, 2.37054443359375, 2.446990966796875, 2.5234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 7.0, 2.0, 8.0, 14.0, 14.0, 26.0, 56.0, 89.0, 142.0, 325.0, 968.0, 3334.0, 20748.0, 378343.0, 616827.0, 22385.0, 3560.0, 960.0, 343.0, 164.0, 80.0, 50.0, 27.0, 25.0, 8.0, 9.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76953125, -0.7462234497070312, -0.7229156494140625, -0.6996078491210938, -0.676300048828125, -0.6529922485351562, -0.6296844482421875, -0.6063766479492188, -0.58306884765625, -0.5597610473632812, -0.5364532470703125, -0.5131454467773438, -0.489837646484375, -0.46652984619140625, -0.4432220458984375, -0.41991424560546875, -0.3966064453125, -0.37329864501953125, -0.3499908447265625, -0.32668304443359375, -0.303375244140625, -0.28006744384765625, -0.2567596435546875, -0.23345184326171875, -0.21014404296875, -0.18683624267578125, -0.1635284423828125, -0.14022064208984375, -0.116912841796875, -0.09360504150390625, -0.0702972412109375, -0.04698944091796875, -0.023681640625, -0.00037384033203125, 0.0229339599609375, 0.04624176025390625, 0.069549560546875, 0.09285736083984375, 0.1161651611328125, 0.13947296142578125, 0.16278076171875, 0.18608856201171875, 0.2093963623046875, 0.23270416259765625, 0.256011962890625, 0.27931976318359375, 0.3026275634765625, 0.32593536376953125, 0.3492431640625, 0.37255096435546875, 0.3958587646484375, 0.41916656494140625, 0.442474365234375, 0.46578216552734375, 0.4890899658203125, 0.5123977661132812, 0.53570556640625, 0.5590133666992188, 0.5823211669921875, 0.6056289672851562, 0.628936767578125, 0.6522445678710938, 0.6755523681640625, 0.6988601684570312, 0.72216796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 8.0, 6.0, 5.0, 5.0, 5.0, 9.0, 8.0, 15.0, 18.0, 26.0, 32.0, 38.0, 42.0, 64.0, 83.0, 110.0, 108.0, 101.0, 79.0, 59.0, 40.0, 37.0, 19.0, 8.0, 13.0, 12.0, 14.0, 12.0, 5.0, 4.0, 6.0, 6.0, 1.0, 3.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011354684829711914, -0.00011004973202943802, -0.0001065526157617569, -0.00010305549949407578, -9.955838322639465e-05, -9.606126695871353e-05, -9.256415069103241e-05, -8.906703442335129e-05, -8.556991815567017e-05, -8.207280188798904e-05, -7.857568562030792e-05, -7.50785693526268e-05, -7.158145308494568e-05, -6.808433681726456e-05, -6.458722054958344e-05, -6.109010428190231e-05, -5.759298801422119e-05, -5.409587174654007e-05, -5.059875547885895e-05, -4.7101639211177826e-05, -4.3604522943496704e-05, -4.010740667581558e-05, -3.661029040813446e-05, -3.311317414045334e-05, -2.9616057872772217e-05, -2.6118941605091095e-05, -2.2621825337409973e-05, -1.912470906972885e-05, -1.562759280204773e-05, -1.2130476534366608e-05, -8.633360266685486e-06, -5.136243999004364e-06, -1.6391277313232422e-06, 1.8579885363578796e-06, 5.3551048040390015e-06, 8.852221071720123e-06, 1.2349337339401245e-05, 1.5846453607082367e-05, 1.934356987476349e-05, 2.284068614244461e-05, 2.6337802410125732e-05, 2.9834918677806854e-05, 3.3332034945487976e-05, 3.68291512131691e-05, 4.032626748085022e-05, 4.382338374853134e-05, 4.732050001621246e-05, 5.0817616283893585e-05, 5.431473255157471e-05, 5.781184881925583e-05, 6.130896508693695e-05, 6.480608135461807e-05, 6.83031976222992e-05, 7.180031388998032e-05, 7.529743015766144e-05, 7.879454642534256e-05, 8.229166269302368e-05, 8.57887789607048e-05, 8.928589522838593e-05, 9.278301149606705e-05, 9.628012776374817e-05, 9.977724403142929e-05, 0.00010327436029911041, 0.00010677147656679153, 0.00011026859283447266]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 3.0, 9.0, 4.0, 7.0, 19.0, 25.0, 43.0, 68.0, 185.0, 427.0, 1275.0, 6405.0, 142734.0, 875447.0, 18377.0, 2407.0, 622.0, 233.0, 121.0, 47.0, 28.0, 22.0, 13.0, 12.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.025390625, -0.993560791015625, -0.96173095703125, -0.929901123046875, -0.8980712890625, -0.866241455078125, -0.83441162109375, -0.802581787109375, -0.770751953125, -0.738922119140625, -0.70709228515625, -0.675262451171875, -0.6434326171875, -0.611602783203125, -0.57977294921875, -0.547943115234375, -0.51611328125, -0.484283447265625, -0.45245361328125, -0.420623779296875, -0.3887939453125, -0.356964111328125, -0.32513427734375, -0.293304443359375, -0.261474609375, -0.229644775390625, -0.19781494140625, -0.165985107421875, -0.1341552734375, -0.102325439453125, -0.07049560546875, -0.038665771484375, -0.0068359375, 0.024993896484375, 0.05682373046875, 0.088653564453125, 0.1204833984375, 0.152313232421875, 0.18414306640625, 0.215972900390625, 0.247802734375, 0.279632568359375, 0.31146240234375, 0.343292236328125, 0.3751220703125, 0.406951904296875, 0.43878173828125, 0.470611572265625, 0.50244140625, 0.534271240234375, 0.56610107421875, 0.597930908203125, 0.6297607421875, 0.661590576171875, 0.69342041015625, 0.725250244140625, 0.757080078125, 0.788909912109375, 0.82073974609375, 0.852569580078125, 0.8843994140625, 0.916229248046875, 0.94805908203125, 0.979888916015625, 1.01171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 17.0, 14.0, 25.0, 30.0, 37.0, 77.0, 126.0, 164.0, 151.0, 131.0, 79.0, 46.0, 31.0, 25.0, 12.0, 14.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.70751953125, -0.686767578125, -0.666015625, -0.645263671875, -0.62451171875, -0.603759765625, -0.5830078125, -0.562255859375, -0.54150390625, -0.520751953125, -0.5, -0.479248046875, -0.45849609375, -0.437744140625, -0.4169921875, -0.396240234375, -0.37548828125, -0.354736328125, -0.333984375, -0.313232421875, -0.29248046875, -0.271728515625, -0.2509765625, -0.230224609375, -0.20947265625, -0.188720703125, -0.16796875, -0.147216796875, -0.12646484375, -0.105712890625, -0.0849609375, -0.064208984375, -0.04345703125, -0.022705078125, -0.001953125, 0.018798828125, 0.03955078125, 0.060302734375, 0.0810546875, 0.101806640625, 0.12255859375, 0.143310546875, 0.1640625, 0.184814453125, 0.20556640625, 0.226318359375, 0.2470703125, 0.267822265625, 0.28857421875, 0.309326171875, 0.330078125, 0.350830078125, 0.37158203125, 0.392333984375, 0.4130859375, 0.433837890625, 0.45458984375, 0.475341796875, 0.49609375, 0.516845703125, 0.53759765625, 0.558349609375, 0.5791015625, 0.599853515625, 0.62060546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 10.0, 8.0, 19.0, 23.0, 54.0, 68.0, 85.0, 193.0, 234.0, 113.0, 66.0, 57.0, 18.0, 20.0, 12.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.690298080444336, -7.406672477722168, -7.123046875, -6.839421272277832, -6.555795669555664, -6.272170066833496, -5.988544464111328, -5.70491886138916, -5.421293258666992, -5.137667655944824, -4.854042053222656, -4.570416450500488, -4.28679084777832, -4.003165245056152, -3.7195394039154053, -3.4359138011932373, -3.1522879600524902, -2.8686623573303223, -2.5850367546081543, -2.3014111518859863, -2.0177855491638184, -1.7341598272323608, -1.4505341053009033, -1.1669085025787354, -0.8832828998565674, -0.5996572971343994, -0.31603163480758667, -0.032405972480773926, 0.25121963024139404, 0.534845232963562, 0.8184709548950195, 1.1020965576171875, 1.3857221603393555, 1.6693477630615234, 1.9529733657836914, 2.2365989685058594, 2.5202245712280273, 2.8038501739501953, 3.0874760150909424, 3.3711016178131104, 3.6547272205352783, 3.9383528232574463, 4.221978664398193, 4.505604267120361, 4.789229869842529, 5.072855472564697, 5.356481075286865, 5.640106678009033, 5.923732280731201, 6.207357883453369, 6.490983486175537, 6.774609088897705, 7.058234691619873, 7.341860294342041, 7.625486373901367, 7.909111976623535, 8.192737579345703, 8.476363182067871, 8.759988784790039, 9.043614387512207, 9.327239990234375, 9.610865592956543, 9.894491195678711, 10.178116798400879, 10.461742401123047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 7.0, 8.0, 3.0, 9.0, 8.0, 12.0, 16.0, 18.0, 29.0, 19.0, 33.0, 34.0, 30.0, 41.0, 52.0, 101.0, 116.0, 108.0, 45.0, 33.0, 50.0, 41.0, 32.0, 26.0, 17.0, 26.0, 13.0, 13.0, 16.0, 8.0, 9.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.586888313293457, -8.25255012512207, -7.918211936950684, -7.583873748779297, -7.24953556060791, -6.915197372436523, -6.580859661102295, -6.246521472930908, -5.9121832847595215, -5.577845096588135, -5.243506908416748, -4.9091691970825195, -4.574831008911133, -4.240492820739746, -3.9061546325683594, -3.5718164443969727, -3.237478256225586, -2.903140068054199, -2.5688018798828125, -2.234463930130005, -1.9001257419586182, -1.5657875537872314, -1.2314496040344238, -0.8971114158630371, -0.5627732276916504, -0.22843509912490845, 0.1059030294418335, 0.44024109840393066, 0.7745792865753174, 1.108917474746704, 1.4432554244995117, 1.7775936126708984, 2.1119308471679688, 2.4462690353393555, 2.780607223510742, 3.11494517326355, 3.4492833614349365, 3.7836215496063232, 4.117959499359131, 4.452297687530518, 4.786635875701904, 5.120974063873291, 5.455312252044678, 5.789649963378906, 6.123988151550293, 6.45832633972168, 6.792664527893066, 7.127002716064453, 7.46134090423584, 7.795679092407227, 8.130017280578613, 8.46435546875, 8.798693656921387, 9.133031845092773, 9.467369079589844, 9.801708221435547, 10.136045455932617, 10.470383644104004, 10.80472183227539, 11.139060020446777, 11.473398208618164, 11.80773639678955, 12.142074584960938, 12.476411819458008, 12.810750961303711]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 7.0, 10.0, 16.0, 28.0, 35.0, 62.0, 77.0, 104.0, 193.0, 287.0, 537.0, 956.0, 1710.0, 4036.0, 11020.0, 37266.0, 151041.0, 653087.0, 1795357.0, 1167246.0, 285946.0, 59946.0, 14928.0, 5191.0, 2300.0, 1154.0, 631.0, 380.0, 250.0, 154.0, 101.0, 65.0, 54.0, 34.0, 22.0, 17.0, 10.0, 7.0, 11.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5263671875, -0.5086517333984375, -0.490936279296875, -0.4732208251953125, -0.45550537109375, -0.4377899169921875, -0.420074462890625, -0.4023590087890625, -0.3846435546875, -0.3669281005859375, -0.349212646484375, -0.3314971923828125, -0.31378173828125, -0.2960662841796875, -0.278350830078125, -0.2606353759765625, -0.242919921875, -0.2252044677734375, -0.207489013671875, -0.1897735595703125, -0.17205810546875, -0.1543426513671875, -0.136627197265625, -0.1189117431640625, -0.1011962890625, -0.0834808349609375, -0.065765380859375, -0.0480499267578125, -0.03033447265625, -0.0126190185546875, 0.005096435546875, 0.0228118896484375, 0.04052734375, 0.0582427978515625, 0.075958251953125, 0.0936737060546875, 0.11138916015625, 0.1291046142578125, 0.146820068359375, 0.1645355224609375, 0.1822509765625, 0.1999664306640625, 0.217681884765625, 0.2353973388671875, 0.25311279296875, 0.2708282470703125, 0.288543701171875, 0.3062591552734375, 0.323974609375, 0.3416900634765625, 0.359405517578125, 0.3771209716796875, 0.39483642578125, 0.4125518798828125, 0.430267333984375, 0.4479827880859375, 0.4656982421875, 0.4834136962890625, 0.501129150390625, 0.5188446044921875, 0.53656005859375, 0.5542755126953125, 0.571990966796875, 0.5897064208984375, 0.607421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 6.0, 10.0, 11.0, 12.0, 8.0, 21.0, 18.0, 22.0, 23.0, 27.0, 34.0, 44.0, 45.0, 46.0, 50.0, 47.0, 50.0, 41.0, 42.0, 42.0, 45.0, 47.0, 40.0, 31.0, 42.0, 32.0, 21.0, 23.0, 21.0, 21.0, 14.0, 7.0, 13.0, 8.0, 6.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.76513671875, -0.7425003051757812, -0.7198638916015625, -0.6972274780273438, -0.674591064453125, -0.6519546508789062, -0.6293182373046875, -0.6066818237304688, -0.58404541015625, -0.5614089965820312, -0.5387725830078125, -0.5161361694335938, -0.493499755859375, -0.47086334228515625, -0.4482269287109375, -0.42559051513671875, -0.4029541015625, -0.38031768798828125, -0.3576812744140625, -0.33504486083984375, -0.312408447265625, -0.28977203369140625, -0.2671356201171875, -0.24449920654296875, -0.22186279296875, -0.19922637939453125, -0.1765899658203125, -0.15395355224609375, -0.131317138671875, -0.10868072509765625, -0.0860443115234375, -0.06340789794921875, -0.040771484375, -0.01813507080078125, 0.0045013427734375, 0.02713775634765625, 0.049774169921875, 0.07241058349609375, 0.0950469970703125, 0.11768341064453125, 0.14031982421875, 0.16295623779296875, 0.1855926513671875, 0.20822906494140625, 0.230865478515625, 0.25350189208984375, 0.2761383056640625, 0.29877471923828125, 0.3214111328125, 0.34404754638671875, 0.3666839599609375, 0.38932037353515625, 0.411956787109375, 0.43459320068359375, 0.4572296142578125, 0.47986602783203125, 0.50250244140625, 0.5251388549804688, 0.5477752685546875, 0.5704116821289062, 0.593048095703125, 0.6156845092773438, 0.6383209228515625, 0.6609573364257812, 0.68359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 10.0, 4.0, 15.0, 14.0, 16.0, 33.0, 51.0, 112.0, 220.0, 650.0, 2483.0, 20751.0, 3566821.0, 591693.0, 9138.0, 1510.0, 423.0, 164.0, 64.0, 31.0, 19.0, 18.0, 12.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.90625, -2.827392578125, -2.74853515625, -2.669677734375, -2.5908203125, -2.511962890625, -2.43310546875, -2.354248046875, -2.275390625, -2.196533203125, -2.11767578125, -2.038818359375, -1.9599609375, -1.881103515625, -1.80224609375, -1.723388671875, -1.64453125, -1.565673828125, -1.48681640625, -1.407958984375, -1.3291015625, -1.250244140625, -1.17138671875, -1.092529296875, -1.013671875, -0.934814453125, -0.85595703125, -0.777099609375, -0.6982421875, -0.619384765625, -0.54052734375, -0.461669921875, -0.3828125, -0.303955078125, -0.22509765625, -0.146240234375, -0.0673828125, 0.011474609375, 0.09033203125, 0.169189453125, 0.248046875, 0.326904296875, 0.40576171875, 0.484619140625, 0.5634765625, 0.642333984375, 0.72119140625, 0.800048828125, 0.87890625, 0.957763671875, 1.03662109375, 1.115478515625, 1.1943359375, 1.273193359375, 1.35205078125, 1.430908203125, 1.509765625, 1.588623046875, 1.66748046875, 1.746337890625, 1.8251953125, 1.904052734375, 1.98291015625, 2.061767578125, 2.140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 7.0, 11.0, 24.0, 45.0, 51.0, 101.0, 167.0, 382.0, 655.0, 925.0, 784.0, 431.0, 199.0, 108.0, 57.0, 32.0, 19.0, 14.0, 12.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.662109375, -1.6141204833984375, -1.566131591796875, -1.5181427001953125, -1.47015380859375, -1.4221649169921875, -1.374176025390625, -1.3261871337890625, -1.2781982421875, -1.2302093505859375, -1.182220458984375, -1.1342315673828125, -1.08624267578125, -1.0382537841796875, -0.990264892578125, -0.9422760009765625, -0.894287109375, -0.8462982177734375, -0.798309326171875, -0.7503204345703125, -0.70233154296875, -0.6543426513671875, -0.606353759765625, -0.5583648681640625, -0.5103759765625, -0.4623870849609375, -0.414398193359375, -0.3664093017578125, -0.31842041015625, -0.2704315185546875, -0.222442626953125, -0.1744537353515625, -0.12646484375, -0.0784759521484375, -0.030487060546875, 0.0175018310546875, 0.06549072265625, 0.1134796142578125, 0.161468505859375, 0.2094573974609375, 0.2574462890625, 0.3054351806640625, 0.353424072265625, 0.4014129638671875, 0.44940185546875, 0.4973907470703125, 0.545379638671875, 0.5933685302734375, 0.641357421875, 0.6893463134765625, 0.737335205078125, 0.7853240966796875, 0.83331298828125, 0.8813018798828125, 0.929290771484375, 0.9772796630859375, 1.0252685546875, 1.0732574462890625, 1.121246337890625, 1.1692352294921875, 1.21722412109375, 1.2652130126953125, 1.313201904296875, 1.3611907958984375, 1.4091796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 5.0, 7.0, 4.0, 8.0, 20.0, 41.0, 52.0, 116.0, 245.0, 205.0, 167.0, 71.0, 33.0, 12.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.540128707885742, -19.15174674987793, -18.76336669921875, -18.374984741210938, -17.986602783203125, -17.598220825195312, -17.2098388671875, -16.82145881652832, -16.433076858520508, -16.044694900512695, -15.6563138961792, -15.267932891845703, -14.87955093383789, -14.491168975830078, -14.102787971496582, -13.714406967163086, -13.326025009155273, -12.937643051147461, -12.549262046813965, -12.160881042480469, -11.772499084472656, -11.384117126464844, -10.995736122131348, -10.607355117797852, -10.218973159790039, -9.830591201782227, -9.44221019744873, -9.053829193115234, -8.665447235107422, -8.27706527709961, -7.888684272766113, -7.500302791595459, -7.111921310424805, -6.72353982925415, -6.335158348083496, -5.946776866912842, -5.5583953857421875, -5.170013904571533, -4.781632423400879, -4.393250942230225, -4.00486946105957, -3.616487979888916, -3.2281064987182617, -2.8397250175476074, -2.451343536376953, -2.062962055206299, -1.6745805740356445, -1.2861990928649902, -0.8978176116943359, -0.5094361305236816, -0.12105464935302734, 0.26732683181762695, 0.6557083129882812, 1.0440897941589355, 1.4324712753295898, 1.8208527565002441, 2.2092342376708984, 2.5976157188415527, 2.985997200012207, 3.3743786811828613, 3.7627601623535156, 4.15114164352417, 4.539523124694824, 4.9279046058654785, 5.316286087036133]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 4.0, 7.0, 9.0, 13.0, 8.0, 21.0, 21.0, 32.0, 23.0, 39.0, 23.0, 35.0, 36.0, 36.0, 41.0, 53.0, 49.0, 49.0, 33.0, 34.0, 44.0, 40.0, 37.0, 42.0, 25.0, 43.0, 23.0, 30.0, 27.0, 24.0, 13.0, 16.0, 11.0, 9.0, 9.0, 13.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98276424407959, -4.801346778869629, -4.619929313659668, -4.438512325286865, -4.257094860076904, -4.075677394866943, -3.8942601680755615, -3.7128429412841797, -3.5314254760742188, -3.350008010864258, -3.168590784072876, -2.987173557281494, -2.805756092071533, -2.6243386268615723, -2.4429214000701904, -2.2615041732788086, -2.0800867080688477, -1.8986693620681763, -1.7172520160675049, -1.5358346700668335, -1.354417324066162, -1.1729999780654907, -0.9915826320648193, -0.810165286064148, -0.6287479400634766, -0.4473305940628052, -0.2659132480621338, -0.0844959020614624, 0.09692144393920898, 0.27833878993988037, 0.45975613594055176, 0.6411734819412231, 0.8225908279418945, 1.004008173942566, 1.1854255199432373, 1.3668428659439087, 1.54826021194458, 1.7296775579452515, 1.9110949039459229, 2.0925121307373047, 2.2739295959472656, 2.4553470611572266, 2.6367642879486084, 2.8181815147399902, 2.999598979949951, 3.181016445159912, 3.362433671951294, 3.543850898742676, 3.7252683639526367, 3.9066858291625977, 4.088103294372559, 4.269520282745361, 4.450937747955322, 4.632355213165283, 4.813772201538086, 4.995189666748047, 5.176607131958008, 5.358024597167969, 5.53944206237793, 5.720859050750732, 5.902276515960693, 6.083693981170654, 6.265110969543457, 6.446528434753418, 6.627945899963379]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 12.0, 14.0, 24.0, 35.0, 65.0, 101.0, 122.0, 216.0, 340.0, 522.0, 904.0, 1546.0, 2821.0, 5614.0, 11699.0, 26743.0, 70099.0, 209611.0, 409898.0, 194319.0, 65368.0, 25330.0, 11246.0, 5373.0, 2745.0, 1568.0, 871.0, 504.0, 316.0, 193.0, 90.0, 76.0, 48.0, 36.0, 22.0, 18.0, 7.0, 11.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1357421875, -1.1027908325195312, -1.0698394775390625, -1.0368881225585938, -1.003936767578125, -0.9709854125976562, -0.9380340576171875, -0.9050827026367188, -0.87213134765625, -0.8391799926757812, -0.8062286376953125, -0.7732772827148438, -0.740325927734375, -0.7073745727539062, -0.6744232177734375, -0.6414718627929688, -0.6085205078125, -0.5755691528320312, -0.5426177978515625, -0.5096664428710938, -0.476715087890625, -0.44376373291015625, -0.4108123779296875, -0.37786102294921875, -0.34490966796875, -0.31195831298828125, -0.2790069580078125, -0.24605560302734375, -0.213104248046875, -0.18015289306640625, -0.1472015380859375, -0.11425018310546875, -0.081298828125, -0.04834747314453125, -0.0153961181640625, 0.01755523681640625, 0.050506591796875, 0.08345794677734375, 0.1164093017578125, 0.14936065673828125, 0.18231201171875, 0.21526336669921875, 0.2482147216796875, 0.28116607666015625, 0.314117431640625, 0.34706878662109375, 0.3800201416015625, 0.41297149658203125, 0.4459228515625, 0.47887420654296875, 0.5118255615234375, 0.5447769165039062, 0.577728271484375, 0.6106796264648438, 0.6436309814453125, 0.6765823364257812, 0.70953369140625, 0.7424850463867188, 0.7754364013671875, 0.8083877563476562, 0.841339111328125, 0.8742904663085938, 0.9072418212890625, 0.9401931762695312, 0.97314453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 11.0, 12.0, 8.0, 9.0, 12.0, 20.0, 18.0, 21.0, 26.0, 35.0, 39.0, 47.0, 35.0, 54.0, 45.0, 56.0, 45.0, 57.0, 34.0, 52.0, 46.0, 48.0, 33.0, 37.0, 34.0, 36.0, 22.0, 21.0, 13.0, 11.0, 12.0, 8.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.6949996948242188, -0.6712493896484375, -0.6474990844726562, -0.623748779296875, -0.5999984741210938, -0.5762481689453125, -0.5524978637695312, -0.52874755859375, -0.5049972534179688, -0.4812469482421875, -0.45749664306640625, -0.433746337890625, -0.40999603271484375, -0.3862457275390625, -0.36249542236328125, -0.3387451171875, -0.31499481201171875, -0.2912445068359375, -0.26749420166015625, -0.243743896484375, -0.21999359130859375, -0.1962432861328125, -0.17249298095703125, -0.14874267578125, -0.12499237060546875, -0.1012420654296875, -0.07749176025390625, -0.053741455078125, -0.02999114990234375, -0.0062408447265625, 0.01750946044921875, 0.041259765625, 0.06501007080078125, 0.0887603759765625, 0.11251068115234375, 0.136260986328125, 0.16001129150390625, 0.1837615966796875, 0.20751190185546875, 0.23126220703125, 0.25501251220703125, 0.2787628173828125, 0.30251312255859375, 0.326263427734375, 0.35001373291015625, 0.3737640380859375, 0.39751434326171875, 0.4212646484375, 0.44501495361328125, 0.4687652587890625, 0.49251556396484375, 0.516265869140625, 0.5400161743164062, 0.5637664794921875, 0.5875167846679688, 0.61126708984375, 0.6350173950195312, 0.6587677001953125, 0.6825180053710938, 0.706268310546875, 0.7300186157226562, 0.7537689208984375, 0.7775192260742188, 0.80126953125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 7.0, 15.0, 16.0, 28.0, 37.0, 45.0, 43.0, 82.0, 95.0, 128.0, 166.0, 264.0, 396.0, 620.0, 1015.0, 2024.0, 6153.0, 33066.0, 582565.0, 379306.0, 31502.0, 6051.0, 2001.0, 966.0, 577.0, 404.0, 252.0, 188.0, 127.0, 90.0, 88.0, 62.0, 47.0, 33.0, 27.0, 10.0, 17.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-2.095703125, -2.0340423583984375, -1.972381591796875, -1.9107208251953125, -1.84906005859375, -1.7873992919921875, -1.725738525390625, -1.6640777587890625, -1.6024169921875, -1.5407562255859375, -1.479095458984375, -1.4174346923828125, -1.35577392578125, -1.2941131591796875, -1.232452392578125, -1.1707916259765625, -1.109130859375, -1.0474700927734375, -0.985809326171875, -0.9241485595703125, -0.86248779296875, -0.8008270263671875, -0.739166259765625, -0.6775054931640625, -0.6158447265625, -0.5541839599609375, -0.492523193359375, -0.4308624267578125, -0.36920166015625, -0.3075408935546875, -0.245880126953125, -0.1842193603515625, -0.12255859375, -0.0608978271484375, 0.000762939453125, 0.0624237060546875, 0.12408447265625, 0.1857452392578125, 0.247406005859375, 0.3090667724609375, 0.3707275390625, 0.4323883056640625, 0.494049072265625, 0.5557098388671875, 0.61737060546875, 0.6790313720703125, 0.740692138671875, 0.8023529052734375, 0.864013671875, 0.9256744384765625, 0.987335205078125, 1.0489959716796875, 1.11065673828125, 1.1723175048828125, 1.233978271484375, 1.2956390380859375, 1.3572998046875, 1.4189605712890625, 1.480621337890625, 1.5422821044921875, 1.60394287109375, 1.6656036376953125, 1.727264404296875, 1.7889251708984375, 1.8505859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 6.0, 3.0, 19.0, 12.0, 7.0, 16.0, 14.0, 23.0, 24.0, 27.0, 37.0, 53.0, 41.0, 46.0, 58.0, 62.0, 66.0, 54.0, 49.0, 57.0, 44.0, 49.0, 36.0, 41.0, 31.0, 17.0, 14.0, 19.0, 11.0, 10.0, 10.0, 11.0, 9.0, 8.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.582916259765625, -2.49591064453125, -2.408905029296875, -2.3218994140625, -2.234893798828125, -2.14788818359375, -2.060882568359375, -1.973876953125, -1.886871337890625, -1.79986572265625, -1.712860107421875, -1.6258544921875, -1.538848876953125, -1.45184326171875, -1.364837646484375, -1.27783203125, -1.190826416015625, -1.10382080078125, -1.016815185546875, -0.9298095703125, -0.842803955078125, -0.75579833984375, -0.668792724609375, -0.581787109375, -0.494781494140625, -0.40777587890625, -0.320770263671875, -0.2337646484375, -0.146759033203125, -0.05975341796875, 0.027252197265625, 0.1142578125, 0.201263427734375, 0.28826904296875, 0.375274658203125, 0.4622802734375, 0.549285888671875, 0.63629150390625, 0.723297119140625, 0.810302734375, 0.897308349609375, 0.98431396484375, 1.071319580078125, 1.1583251953125, 1.245330810546875, 1.33233642578125, 1.419342041015625, 1.50634765625, 1.593353271484375, 1.68035888671875, 1.767364501953125, 1.8543701171875, 1.941375732421875, 2.02838134765625, 2.115386962890625, 2.202392578125, 2.289398193359375, 2.37640380859375, 2.463409423828125, 2.5504150390625, 2.637420654296875, 2.72442626953125, 2.811431884765625, 2.8984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 8.0, 6.0, 18.0, 21.0, 27.0, 48.0, 104.0, 236.0, 459.0, 1180.0, 5276.0, 55813.0, 899478.0, 76954.0, 6450.0, 1409.0, 532.0, 245.0, 115.0, 56.0, 36.0, 28.0, 14.0, 14.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6005859375, -0.5795516967773438, -0.5585174560546875, -0.5374832153320312, -0.516448974609375, -0.49541473388671875, -0.4743804931640625, -0.45334625244140625, -0.43231201171875, -0.41127777099609375, -0.3902435302734375, -0.36920928955078125, -0.348175048828125, -0.32714080810546875, -0.3061065673828125, -0.28507232666015625, -0.2640380859375, -0.24300384521484375, -0.2219696044921875, -0.20093536376953125, -0.179901123046875, -0.15886688232421875, -0.1378326416015625, -0.11679840087890625, -0.09576416015625, -0.07472991943359375, -0.0536956787109375, -0.03266143798828125, -0.011627197265625, 0.00940704345703125, 0.0304412841796875, 0.05147552490234375, 0.072509765625, 0.09354400634765625, 0.1145782470703125, 0.13561248779296875, 0.156646728515625, 0.17768096923828125, 0.1987152099609375, 0.21974945068359375, 0.24078369140625, 0.26181793212890625, 0.2828521728515625, 0.30388641357421875, 0.324920654296875, 0.34595489501953125, 0.3669891357421875, 0.38802337646484375, 0.4090576171875, 0.43009185791015625, 0.4511260986328125, 0.47216033935546875, 0.493194580078125, 0.5142288208007812, 0.5352630615234375, 0.5562973022460938, 0.57733154296875, 0.5983657836914062, 0.6194000244140625, 0.6404342651367188, 0.661468505859375, 0.6825027465820312, 0.7035369873046875, 0.7245712280273438, 0.74560546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 0.0, 3.0, 7.0, 4.0, 13.0, 16.0, 17.0, 34.0, 39.0, 45.0, 53.0, 87.0, 131.0, 142.0, 123.0, 81.0, 62.0, 39.0, 35.0, 14.0, 9.0, 7.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00013875961303710938, -0.00013402849435806274, -0.0001292973756790161, -0.00012456625699996948, -0.00011983513832092285, -0.00011510401964187622, -0.00011037290096282959, -0.00010564178228378296, -0.00010091066360473633, -9.61795449256897e-05, -9.144842624664307e-05, -8.671730756759644e-05, -8.19861888885498e-05, -7.725507020950317e-05, -7.252395153045654e-05, -6.779283285140991e-05, -6.306171417236328e-05, -5.833059549331665e-05, -5.359947681427002e-05, -4.886835813522339e-05, -4.413723945617676e-05, -3.940612077713013e-05, -3.4675002098083496e-05, -2.9943883419036865e-05, -2.5212764739990234e-05, -2.0481646060943604e-05, -1.5750527381896973e-05, -1.1019408702850342e-05, -6.288290023803711e-06, -1.55717134475708e-06, 3.1739473342895508e-06, 7.905066013336182e-06, 1.2636184692382812e-05, 1.7367303371429443e-05, 2.2098422050476074e-05, 2.6829540729522705e-05, 3.1560659408569336e-05, 3.629177808761597e-05, 4.10228967666626e-05, 4.575401544570923e-05, 5.048513412475586e-05, 5.521625280380249e-05, 5.994737148284912e-05, 6.467849016189575e-05, 6.940960884094238e-05, 7.414072751998901e-05, 7.887184619903564e-05, 8.360296487808228e-05, 8.83340835571289e-05, 9.306520223617554e-05, 9.779632091522217e-05, 0.0001025274395942688, 0.00010725855827331543, 0.00011198967695236206, 0.00011672079563140869, 0.00012145191431045532, 0.00012618303298950195, 0.00013091415166854858, 0.00013564527034759521, 0.00014037638902664185, 0.00014510750770568848, 0.0001498386263847351, 0.00015456974506378174, 0.00015930086374282837, 0.000164031982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 11.0, 21.0, 34.0, 55.0, 97.0, 192.0, 362.0, 725.0, 2402.0, 13183.0, 203790.0, 791150.0, 30372.0, 4009.0, 1127.0, 484.0, 211.0, 114.0, 64.0, 55.0, 28.0, 19.0, 7.0, 10.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5801162719726562, -0.5620880126953125, -0.5440597534179688, -0.526031494140625, -0.5080032348632812, -0.4899749755859375, -0.47194671630859375, -0.45391845703125, -0.43589019775390625, -0.4178619384765625, -0.39983367919921875, -0.381805419921875, -0.36377716064453125, -0.3457489013671875, -0.32772064208984375, -0.3096923828125, -0.29166412353515625, -0.2736358642578125, -0.25560760498046875, -0.237579345703125, -0.21955108642578125, -0.2015228271484375, -0.18349456787109375, -0.16546630859375, -0.14743804931640625, -0.1294097900390625, -0.11138153076171875, -0.093353271484375, -0.07532501220703125, -0.0572967529296875, -0.03926849365234375, -0.021240234375, -0.00321197509765625, 0.0148162841796875, 0.03284454345703125, 0.050872802734375, 0.06890106201171875, 0.0869293212890625, 0.10495758056640625, 0.12298583984375, 0.14101409912109375, 0.1590423583984375, 0.17707061767578125, 0.195098876953125, 0.21312713623046875, 0.2311553955078125, 0.24918365478515625, 0.2672119140625, 0.28524017333984375, 0.3032684326171875, 0.32129669189453125, 0.339324951171875, 0.35735321044921875, 0.3753814697265625, 0.39340972900390625, 0.41143798828125, 0.42946624755859375, 0.4474945068359375, 0.46552276611328125, 0.483551025390625, 0.5015792846679688, 0.5196075439453125, 0.5376358032226562, 0.5556640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 13.0, 19.0, 30.0, 55.0, 96.0, 102.0, 164.0, 144.0, 115.0, 89.0, 50.0, 38.0, 22.0, 16.0, 10.0, 8.0, 10.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.5220260620117188, -0.5020599365234375, -0.48209381103515625, -0.462127685546875, -0.44216156005859375, -0.4221954345703125, -0.40222930908203125, -0.38226318359375, -0.36229705810546875, -0.3423309326171875, -0.32236480712890625, -0.302398681640625, -0.28243255615234375, -0.2624664306640625, -0.24250030517578125, -0.2225341796875, -0.20256805419921875, -0.1826019287109375, -0.16263580322265625, -0.142669677734375, -0.12270355224609375, -0.1027374267578125, -0.08277130126953125, -0.06280517578125, -0.04283905029296875, -0.0228729248046875, -0.00290679931640625, 0.017059326171875, 0.03702545166015625, 0.0569915771484375, 0.07695770263671875, 0.096923828125, 0.11688995361328125, 0.1368560791015625, 0.15682220458984375, 0.176788330078125, 0.19675445556640625, 0.2167205810546875, 0.23668670654296875, 0.25665283203125, 0.27661895751953125, 0.2965850830078125, 0.31655120849609375, 0.336517333984375, 0.35648345947265625, 0.3764495849609375, 0.39641571044921875, 0.4163818359375, 0.43634796142578125, 0.4563140869140625, 0.47628021240234375, 0.496246337890625, 0.5162124633789062, 0.5361785888671875, 0.5561447143554688, 0.57611083984375, 0.5960769653320312, 0.6160430908203125, 0.6360092163085938, 0.655975341796875, 0.6759414672851562, 0.6959075927734375, 0.7158737182617188, 0.73583984375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 25.0, 86.0, 286.0, 405.0, 110.0, 55.0, 13.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.710681915283203, -17.05512237548828, -16.39956283569336, -15.744002342224121, -15.0884428024292, -14.432882308959961, -13.777322769165039, -13.121763229370117, -12.466203689575195, -11.810644149780273, -11.155083656311035, -10.499524116516113, -9.843964576721191, -9.188404083251953, -8.532844543457031, -7.877285003662109, -7.221724510192871, -6.566164493560791, -5.910604953765869, -5.255044937133789, -4.599485397338867, -3.943925380706787, -3.288365364074707, -2.632805824279785, -1.977245807647705, -1.321686029434204, -0.6661261320114136, -0.010566234588623047, 0.6449935436248779, 1.300553321838379, 1.956113338470459, 2.611672878265381, 3.267232894897461, 3.922792673110962, 4.578352451324463, 5.233912467956543, 5.889472007751465, 6.545032024383545, 7.200592041015625, 7.856151580810547, 8.511711120605469, 9.16727066040039, 9.822831153869629, 10.47839069366455, 11.133950233459473, 11.789510726928711, 12.445070266723633, 13.100629806518555, 13.756190299987793, 14.411749839782715, 15.067310333251953, 15.722869873046875, 16.378429412841797, 17.03398895263672, 17.68954849243164, 18.345108032226562, 19.000669479370117, 19.65622901916504, 20.31178855895996, 20.967350006103516, 21.622909545898438, 22.27846908569336, 22.93402862548828, 23.589588165283203, 24.245147705078125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 9.0, 15.0, 19.0, 16.0, 10.0, 18.0, 26.0, 37.0, 34.0, 27.0, 34.0, 41.0, 48.0, 76.0, 158.0, 93.0, 25.0, 25.0, 22.0, 23.0, 34.0, 28.0, 26.0, 20.0, 27.0, 13.0, 11.0, 10.0, 6.0, 8.0, 8.0, 4.0, 12.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.109341621398926, -9.798173904418945, -9.487005233764648, -9.175836563110352, -8.864668846130371, -8.55350112915039, -8.242332458496094, -7.931164264678955, -7.619996070861816, -7.308827877044678, -6.997659683227539, -6.6864914894104, -6.375323295593262, -6.064155101776123, -5.752986907958984, -5.441818714141846, -5.130650520324707, -4.819482326507568, -4.50831413269043, -4.197145938873291, -3.8859777450561523, -3.5748095512390137, -3.263641357421875, -2.9524731636047363, -2.6413049697875977, -2.330136775970459, -2.0189685821533203, -1.7078003883361816, -1.396632194519043, -1.0854640007019043, -0.7742958068847656, -0.46312761306762695, -0.1519603729248047, 0.15920782089233398, 0.47037601470947266, 0.7815442085266113, 1.09271240234375, 1.4038805961608887, 1.7150487899780273, 2.026216983795166, 2.3373851776123047, 2.6485533714294434, 2.959721565246582, 3.2708897590637207, 3.5820579528808594, 3.893226146697998, 4.204394340515137, 4.515562534332275, 4.826730728149414, 5.137898921966553, 5.449067115783691, 5.76023530960083, 6.071403503417969, 6.382571697235107, 6.693739891052246, 7.004908084869385, 7.316076278686523, 7.627244472503662, 7.938412666320801, 8.249580383300781, 8.560749053955078, 8.871917724609375, 9.183085441589355, 9.494253158569336, 9.805421829223633]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 22.0, 12.0, 24.0, 41.0, 56.0, 106.0, 133.0, 203.0, 260.0, 462.0, 839.0, 2005.0, 5248.0, 17168.0, 108779.0, 1024656.0, 2439782.0, 528723.0, 49517.0, 9450.0, 3300.0, 1459.0, 747.0, 430.0, 256.0, 175.0, 130.0, 95.0, 58.0, 38.0, 36.0, 17.0, 19.0, 8.0, 6.0, 8.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7958984375, -0.7602691650390625, -0.724639892578125, -0.6890106201171875, -0.65338134765625, -0.6177520751953125, -0.582122802734375, -0.5464935302734375, -0.5108642578125, -0.4752349853515625, -0.439605712890625, -0.4039764404296875, -0.36834716796875, -0.3327178955078125, -0.297088623046875, -0.2614593505859375, -0.225830078125, -0.1902008056640625, -0.154571533203125, -0.1189422607421875, -0.08331298828125, -0.0476837158203125, -0.012054443359375, 0.0235748291015625, 0.0592041015625, 0.0948333740234375, 0.130462646484375, 0.1660919189453125, 0.20172119140625, 0.2373504638671875, 0.272979736328125, 0.3086090087890625, 0.34423828125, 0.3798675537109375, 0.415496826171875, 0.4511260986328125, 0.48675537109375, 0.5223846435546875, 0.558013916015625, 0.5936431884765625, 0.6292724609375, 0.6649017333984375, 0.700531005859375, 0.7361602783203125, 0.77178955078125, 0.8074188232421875, 0.843048095703125, 0.8786773681640625, 0.914306640625, 0.9499359130859375, 0.985565185546875, 1.0211944580078125, 1.05682373046875, 1.0924530029296875, 1.128082275390625, 1.1637115478515625, 1.1993408203125, 1.2349700927734375, 1.270599365234375, 1.3062286376953125, 1.34185791015625, 1.3774871826171875, 1.413116455078125, 1.4487457275390625, 1.484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 9.0, 10.0, 6.0, 17.0, 13.0, 20.0, 32.0, 39.0, 42.0, 40.0, 56.0, 63.0, 64.0, 60.0, 60.0, 66.0, 57.0, 49.0, 60.0, 40.0, 46.0, 30.0, 34.0, 24.0, 20.0, 12.0, 9.0, 8.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.6522140502929688, -0.6232757568359375, -0.5943374633789062, -0.565399169921875, -0.5364608764648438, -0.5075225830078125, -0.47858428955078125, -0.44964599609375, -0.42070770263671875, -0.3917694091796875, -0.36283111572265625, -0.333892822265625, -0.30495452880859375, -0.2760162353515625, -0.24707794189453125, -0.2181396484375, -0.18920135498046875, -0.1602630615234375, -0.13132476806640625, -0.102386474609375, -0.07344818115234375, -0.0445098876953125, -0.01557159423828125, 0.01336669921875, 0.04230499267578125, 0.0712432861328125, 0.10018157958984375, 0.129119873046875, 0.15805816650390625, 0.1869964599609375, 0.21593475341796875, 0.244873046875, 0.27381134033203125, 0.3027496337890625, 0.33168792724609375, 0.360626220703125, 0.38956451416015625, 0.4185028076171875, 0.44744110107421875, 0.47637939453125, 0.5053176879882812, 0.5342559814453125, 0.5631942749023438, 0.592132568359375, 0.6210708618164062, 0.6500091552734375, 0.6789474487304688, 0.7078857421875, 0.7368240356445312, 0.7657623291015625, 0.7947006225585938, 0.823638916015625, 0.8525772094726562, 0.8815155029296875, 0.9104537963867188, 0.93939208984375, 0.9683303833007812, 0.9972686767578125, 1.0262069702148438, 1.055145263671875, 1.0840835571289062, 1.1130218505859375, 1.1419601440429688, 1.1708984375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 6.0, 8.0, 18.0, 36.0, 100.0, 408.0, 1965.0, 276874.0, 3910955.0, 3073.0, 586.0, 142.0, 58.0, 19.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.859619140625, -9.57861328125, -9.297607421875, -9.0166015625, -8.735595703125, -8.45458984375, -8.173583984375, -7.892578125, -7.611572265625, -7.33056640625, -7.049560546875, -6.7685546875, -6.487548828125, -6.20654296875, -5.925537109375, -5.64453125, -5.363525390625, -5.08251953125, -4.801513671875, -4.5205078125, -4.239501953125, -3.95849609375, -3.677490234375, -3.396484375, -3.115478515625, -2.83447265625, -2.553466796875, -2.2724609375, -1.991455078125, -1.71044921875, -1.429443359375, -1.1484375, -0.867431640625, -0.58642578125, -0.305419921875, -0.0244140625, 0.256591796875, 0.53759765625, 0.818603515625, 1.099609375, 1.380615234375, 1.66162109375, 1.942626953125, 2.2236328125, 2.504638671875, 2.78564453125, 3.066650390625, 3.34765625, 3.628662109375, 3.90966796875, 4.190673828125, 4.4716796875, 4.752685546875, 5.03369140625, 5.314697265625, 5.595703125, 5.876708984375, 6.15771484375, 6.438720703125, 6.7197265625, 7.000732421875, 7.28173828125, 7.562744140625, 7.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 18.0, 48.0, 102.0, 225.0, 585.0, 1387.0, 1046.0, 376.0, 152.0, 65.0, 31.0, 11.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.081146240234375, -1.94940185546875, -1.817657470703125, -1.6859130859375, -1.554168701171875, -1.42242431640625, -1.290679931640625, -1.158935546875, -1.027191162109375, -0.89544677734375, -0.763702392578125, -0.6319580078125, -0.500213623046875, -0.36846923828125, -0.236724853515625, -0.10498046875, 0.026763916015625, 0.15850830078125, 0.290252685546875, 0.4219970703125, 0.553741455078125, 0.68548583984375, 0.817230224609375, 0.948974609375, 1.080718994140625, 1.21246337890625, 1.344207763671875, 1.4759521484375, 1.607696533203125, 1.73944091796875, 1.871185302734375, 2.0029296875, 2.134674072265625, 2.26641845703125, 2.398162841796875, 2.5299072265625, 2.661651611328125, 2.79339599609375, 2.925140380859375, 3.056884765625, 3.188629150390625, 3.32037353515625, 3.452117919921875, 3.5838623046875, 3.715606689453125, 3.84735107421875, 3.979095458984375, 4.11083984375, 4.242584228515625, 4.37432861328125, 4.506072998046875, 4.6378173828125, 4.769561767578125, 4.90130615234375, 5.033050537109375, 5.164794921875, 5.296539306640625, 5.42828369140625, 5.560028076171875, 5.6917724609375, 5.823516845703125, 5.95526123046875, 6.087005615234375, 6.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 29.0, 147.0, 552.0, 221.0, 38.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.905344009399414, -27.04261016845703, -25.17987632751465, -23.317142486572266, -21.45440673828125, -19.591672897338867, -17.728939056396484, -15.866204261779785, -14.003470420837402, -12.14073657989502, -10.27800178527832, -8.415267944335938, -6.5525336265563965, -4.6897993087768555, -2.8270654678344727, -0.9643306732177734, 0.8984031677246094, 2.7611374855041504, 4.623871803283691, 6.486605644226074, 8.349340438842773, 10.212074279785156, 12.074808120727539, 13.937542915344238, 15.800276756286621, 17.66301155090332, 19.525745391845703, 21.388479232788086, 23.25121307373047, 25.113948822021484, 26.976680755615234, 28.83941650390625, 30.702152252197266, 32.56488800048828, 34.42761993408203, 36.29035568237305, 38.1530876159668, 40.01582336425781, 41.87855529785156, 43.74129104614258, 45.604026794433594, 47.46676254272461, 49.32949447631836, 51.192230224609375, 53.054962158203125, 54.91769790649414, 56.780433654785156, 58.643165588378906, 60.505897521972656, 62.36863327026367, 64.23136901855469, 66.09410095214844, 67.95683288574219, 69.81956481933594, 71.68230438232422, 73.54503631591797, 75.40777587890625, 77.2705078125, 79.13324737548828, 80.99597930908203, 82.85871124267578, 84.72145080566406, 86.58418273925781, 88.44691467285156, 90.30964660644531]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 13.0, 12.0, 23.0, 28.0, 40.0, 46.0, 57.0, 64.0, 79.0, 98.0, 117.0, 88.0, 77.0, 63.0, 56.0, 38.0, 33.0, 17.0, 18.0, 10.0, 13.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.595842361450195, -15.97778606414795, -15.359729766845703, -14.74167251586914, -14.123616218566895, -13.505559921264648, -12.887503623962402, -12.269447326660156, -11.651390075683594, -11.033333778381348, -10.415277481079102, -9.797220230102539, -9.179163932800293, -8.561107635498047, -7.943051338195801, -7.3249945640563965, -6.706938743591309, -6.0888824462890625, -5.470825672149658, -4.852769374847412, -4.234712600708008, -3.6166563034057617, -2.9986000061035156, -2.3805432319641113, -1.7624869346618652, -1.14443039894104, -0.5263739824295044, 0.09168243408203125, 0.7097389698028564, 1.3277955055236816, 1.9458518028259277, 2.563908576965332, 3.181964874267578, 3.8000214099884033, 4.4180779457092285, 5.036134243011475, 5.654191017150879, 6.272247314453125, 6.890303611755371, 7.508360385894775, 8.12641716003418, 8.744473457336426, 9.362529754638672, 9.980587005615234, 10.59864330291748, 11.216699600219727, 11.834755897521973, 12.452812194824219, 13.070868492126465, 13.688924789428711, 14.306981086730957, 14.925037384033203, 15.543094635009766, 16.161151885986328, 16.779207229614258, 17.39726448059082, 18.01531982421875, 18.633377075195312, 19.251432418823242, 19.869489669799805, 20.487545013427734, 21.105602264404297, 21.72365951538086, 22.34171485900879, 22.95977210998535]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 10.0, 5.0, 14.0, 16.0, 29.0, 51.0, 71.0, 129.0, 191.0, 394.0, 673.0, 1436.0, 3413.0, 9796.0, 45926.0, 523772.0, 407619.0, 39868.0, 9133.0, 3097.0, 1386.0, 695.0, 376.0, 179.0, 84.0, 58.0, 49.0, 21.0, 12.0, 11.0, 7.0, 7.0, 2.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.4994964599609375, -1.439422607421875, -1.3793487548828125, -1.31927490234375, -1.2592010498046875, -1.199127197265625, -1.1390533447265625, -1.0789794921875, -1.0189056396484375, -0.958831787109375, -0.8987579345703125, -0.83868408203125, -0.7786102294921875, -0.718536376953125, -0.6584625244140625, -0.598388671875, -0.5383148193359375, -0.478240966796875, -0.4181671142578125, -0.35809326171875, -0.2980194091796875, -0.237945556640625, -0.1778717041015625, -0.1177978515625, -0.0577239990234375, 0.002349853515625, 0.0624237060546875, 0.12249755859375, 0.1825714111328125, 0.242645263671875, 0.3027191162109375, 0.36279296875, 0.4228668212890625, 0.482940673828125, 0.5430145263671875, 0.60308837890625, 0.6631622314453125, 0.723236083984375, 0.7833099365234375, 0.8433837890625, 0.9034576416015625, 0.963531494140625, 1.0236053466796875, 1.08367919921875, 1.1437530517578125, 1.203826904296875, 1.2639007568359375, 1.323974609375, 1.3840484619140625, 1.444122314453125, 1.5041961669921875, 1.56427001953125, 1.6243438720703125, 1.684417724609375, 1.7444915771484375, 1.8045654296875, 1.8646392822265625, 1.924713134765625, 1.9847869873046875, 2.04486083984375, 2.1049346923828125, 2.165008544921875, 2.2250823974609375, 2.28515625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 9.0, 15.0, 11.0, 14.0, 29.0, 29.0, 29.0, 36.0, 42.0, 67.0, 53.0, 67.0, 57.0, 66.0, 69.0, 71.0, 67.0, 47.0, 53.0, 29.0, 32.0, 31.0, 24.0, 9.0, 11.0, 6.0, 7.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8427734375, -0.808135986328125, -0.77349853515625, -0.738861083984375, -0.7042236328125, -0.669586181640625, -0.63494873046875, -0.600311279296875, -0.565673828125, -0.531036376953125, -0.49639892578125, -0.461761474609375, -0.4271240234375, -0.392486572265625, -0.35784912109375, -0.323211669921875, -0.28857421875, -0.253936767578125, -0.21929931640625, -0.184661865234375, -0.1500244140625, -0.115386962890625, -0.08074951171875, -0.046112060546875, -0.011474609375, 0.023162841796875, 0.05780029296875, 0.092437744140625, 0.1270751953125, 0.161712646484375, 0.19635009765625, 0.230987548828125, 0.265625, 0.300262451171875, 0.33489990234375, 0.369537353515625, 0.4041748046875, 0.438812255859375, 0.47344970703125, 0.508087158203125, 0.542724609375, 0.577362060546875, 0.61199951171875, 0.646636962890625, 0.6812744140625, 0.715911865234375, 0.75054931640625, 0.785186767578125, 0.81982421875, 0.854461669921875, 0.88909912109375, 0.923736572265625, 0.9583740234375, 0.993011474609375, 1.02764892578125, 1.062286376953125, 1.096923828125, 1.131561279296875, 1.16619873046875, 1.200836181640625, 1.2354736328125, 1.270111083984375, 1.30474853515625, 1.339385986328125, 1.3740234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 15.0, 18.0, 19.0, 25.0, 37.0, 55.0, 73.0, 128.0, 215.0, 351.0, 641.0, 1829.0, 6951.0, 71887.0, 927752.0, 31364.0, 4380.0, 1347.0, 631.0, 318.0, 159.0, 106.0, 63.0, 60.0, 29.0, 19.0, 15.0, 15.0, 10.0, 9.0, 6.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158203125, -2.084686279296875, -2.01116943359375, -1.937652587890625, -1.8641357421875, -1.790618896484375, -1.71710205078125, -1.643585205078125, -1.570068359375, -1.496551513671875, -1.42303466796875, -1.349517822265625, -1.2760009765625, -1.202484130859375, -1.12896728515625, -1.055450439453125, -0.98193359375, -0.908416748046875, -0.83489990234375, -0.761383056640625, -0.6878662109375, -0.614349365234375, -0.54083251953125, -0.467315673828125, -0.393798828125, -0.320281982421875, -0.24676513671875, -0.173248291015625, -0.0997314453125, -0.026214599609375, 0.04730224609375, 0.120819091796875, 0.1943359375, 0.267852783203125, 0.34136962890625, 0.414886474609375, 0.4884033203125, 0.561920166015625, 0.63543701171875, 0.708953857421875, 0.782470703125, 0.855987548828125, 0.92950439453125, 1.003021240234375, 1.0765380859375, 1.150054931640625, 1.22357177734375, 1.297088623046875, 1.37060546875, 1.444122314453125, 1.51763916015625, 1.591156005859375, 1.6646728515625, 1.738189697265625, 1.81170654296875, 1.885223388671875, 1.958740234375, 2.032257080078125, 2.10577392578125, 2.179290771484375, 2.2528076171875, 2.326324462890625, 2.39984130859375, 2.473358154296875, 2.546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 6.0, 11.0, 12.0, 10.0, 26.0, 23.0, 43.0, 52.0, 54.0, 95.0, 131.0, 123.0, 102.0, 80.0, 64.0, 49.0, 26.0, 25.0, 20.0, 13.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.91552734375, -4.7412109375, -4.56689453125, -4.392578125, -4.21826171875, -4.0439453125, -3.86962890625, -3.6953125, -3.52099609375, -3.3466796875, -3.17236328125, -2.998046875, -2.82373046875, -2.6494140625, -2.47509765625, -2.30078125, -2.12646484375, -1.9521484375, -1.77783203125, -1.603515625, -1.42919921875, -1.2548828125, -1.08056640625, -0.90625, -0.73193359375, -0.5576171875, -0.38330078125, -0.208984375, -0.03466796875, 0.1396484375, 0.31396484375, 0.48828125, 0.66259765625, 0.8369140625, 1.01123046875, 1.185546875, 1.35986328125, 1.5341796875, 1.70849609375, 1.8828125, 2.05712890625, 2.2314453125, 2.40576171875, 2.580078125, 2.75439453125, 2.9287109375, 3.10302734375, 3.27734375, 3.45166015625, 3.6259765625, 3.80029296875, 3.974609375, 4.14892578125, 4.3232421875, 4.49755859375, 4.671875, 4.84619140625, 5.0205078125, 5.19482421875, 5.369140625, 5.54345703125, 5.7177734375, 5.89208984375, 6.06640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 12.0, 6.0, 6.0, 11.0, 14.0, 22.0, 30.0, 51.0, 65.0, 88.0, 136.0, 224.0, 492.0, 1038.0, 2823.0, 11191.0, 108684.0, 889921.0, 25863.0, 4868.0, 1505.0, 671.0, 282.0, 180.0, 115.0, 67.0, 47.0, 29.0, 28.0, 22.0, 21.0, 10.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.471435546875, -0.45633697509765625, -0.4412384033203125, -0.42613983154296875, -0.411041259765625, -0.39594268798828125, -0.3808441162109375, -0.36574554443359375, -0.35064697265625, -0.33554840087890625, -0.3204498291015625, -0.30535125732421875, -0.290252685546875, -0.27515411376953125, -0.2600555419921875, -0.24495697021484375, -0.2298583984375, -0.21475982666015625, -0.1996612548828125, -0.18456268310546875, -0.169464111328125, -0.15436553955078125, -0.1392669677734375, -0.12416839599609375, -0.10906982421875, -0.09397125244140625, -0.0788726806640625, -0.06377410888671875, -0.048675537109375, -0.03357696533203125, -0.0184783935546875, -0.00337982177734375, 0.01171875, 0.02681732177734375, 0.0419158935546875, 0.05701446533203125, 0.072113037109375, 0.08721160888671875, 0.1023101806640625, 0.11740875244140625, 0.13250732421875, 0.14760589599609375, 0.1627044677734375, 0.17780303955078125, 0.192901611328125, 0.20800018310546875, 0.2230987548828125, 0.23819732666015625, 0.2532958984375, 0.26839447021484375, 0.2834930419921875, 0.29859161376953125, 0.313690185546875, 0.32878875732421875, 0.3438873291015625, 0.35898590087890625, 0.37408447265625, 0.38918304443359375, 0.4042816162109375, 0.41938018798828125, 0.434478759765625, 0.44957733154296875, 0.4646759033203125, 0.47977447509765625, 0.494873046875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 9.0, 5.0, 10.0, 17.0, 14.0, 15.0, 27.0, 33.0, 45.0, 62.0, 92.0, 106.0, 119.0, 105.0, 77.0, 55.0, 50.0, 25.0, 17.0, 21.0, 18.0, 16.0, 9.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.416175842285156e-05, -8.07046890258789e-05, -7.724761962890625e-05, -7.37905502319336e-05, -7.033348083496094e-05, -6.687641143798828e-05, -6.341934204101562e-05, -5.996227264404297e-05, -5.650520324707031e-05, -5.3048133850097656e-05, -4.9591064453125e-05, -4.6133995056152344e-05, -4.267692565917969e-05, -3.921985626220703e-05, -3.5762786865234375e-05, -3.230571746826172e-05, -2.8848648071289062e-05, -2.5391578674316406e-05, -2.193450927734375e-05, -1.8477439880371094e-05, -1.5020370483398438e-05, -1.1563301086425781e-05, -8.106231689453125e-06, -4.649162292480469e-06, -1.1920928955078125e-06, 2.2649765014648438e-06, 5.7220458984375e-06, 9.179115295410156e-06, 1.2636184692382812e-05, 1.609325408935547e-05, 1.9550323486328125e-05, 2.300739288330078e-05, 2.6464462280273438e-05, 2.9921531677246094e-05, 3.337860107421875e-05, 3.6835670471191406e-05, 4.029273986816406e-05, 4.374980926513672e-05, 4.7206878662109375e-05, 5.066394805908203e-05, 5.412101745605469e-05, 5.7578086853027344e-05, 6.103515625e-05, 6.449222564697266e-05, 6.794929504394531e-05, 7.140636444091797e-05, 7.486343383789062e-05, 7.832050323486328e-05, 8.177757263183594e-05, 8.52346420288086e-05, 8.869171142578125e-05, 9.21487808227539e-05, 9.560585021972656e-05, 9.906291961669922e-05, 0.00010251998901367188, 0.00010597705841064453, 0.00010943412780761719, 0.00011289119720458984, 0.0001163482666015625, 0.00011980533599853516, 0.0001232624053955078, 0.00012671947479248047, 0.00013017654418945312, 0.00013363361358642578, 0.00013709068298339844]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 8.0, 12.0, 12.0, 15.0, 11.0, 26.0, 45.0, 62.0, 123.0, 216.0, 411.0, 953.0, 2668.0, 9443.0, 58422.0, 903574.0, 58354.0, 9580.0, 2682.0, 975.0, 404.0, 219.0, 123.0, 75.0, 39.0, 28.0, 19.0, 17.0, 5.0, 12.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.4599609375, -0.44887733459472656, -0.4377937316894531, -0.4267101287841797, -0.41562652587890625, -0.4045429229736328, -0.3934593200683594, -0.38237571716308594, -0.3712921142578125, -0.36020851135253906, -0.3491249084472656, -0.3380413055419922, -0.32695770263671875, -0.3158740997314453, -0.3047904968261719, -0.29370689392089844, -0.282623291015625, -0.27153968811035156, -0.2604560852050781, -0.2493724822998047, -0.23828887939453125, -0.2272052764892578, -0.21612167358398438, -0.20503807067871094, -0.1939544677734375, -0.18287086486816406, -0.17178726196289062, -0.1607036590576172, -0.14962005615234375, -0.1385364532470703, -0.12745285034179688, -0.11636924743652344, -0.10528564453125, -0.09420204162597656, -0.08311843872070312, -0.07203483581542969, -0.06095123291015625, -0.04986763000488281, -0.038784027099609375, -0.027700424194335938, -0.0166168212890625, -0.0055332183837890625, 0.005550384521484375, 0.016633987426757812, 0.02771759033203125, 0.03880119323730469, 0.049884796142578125, 0.06096839904785156, 0.072052001953125, 0.08313560485839844, 0.09421920776367188, 0.10530281066894531, 0.11638641357421875, 0.1274700164794922, 0.13855361938476562, 0.14963722229003906, 0.1607208251953125, 0.17180442810058594, 0.18288803100585938, 0.1939716339111328, 0.20505523681640625, 0.2161388397216797, 0.22722244262695312, 0.23830604553222656, 0.2493896484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 15.0, 13.0, 26.0, 37.0, 58.0, 93.0, 122.0, 153.0, 138.0, 108.0, 76.0, 51.0, 47.0, 25.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5480690002441406, -0.5346145629882812, -0.5211601257324219, -0.5077056884765625, -0.4942512512207031, -0.48079681396484375, -0.4673423767089844, -0.453887939453125, -0.4404335021972656, -0.42697906494140625, -0.4135246276855469, -0.4000701904296875, -0.3866157531738281, -0.37316131591796875, -0.3597068786621094, -0.34625244140625, -0.3327980041503906, -0.31934356689453125, -0.3058891296386719, -0.2924346923828125, -0.2789802551269531, -0.26552581787109375, -0.2520713806152344, -0.238616943359375, -0.22516250610351562, -0.21170806884765625, -0.19825363159179688, -0.1847991943359375, -0.17134475708007812, -0.15789031982421875, -0.14443588256835938, -0.1309814453125, -0.11752700805664062, -0.10407257080078125, -0.09061813354492188, -0.0771636962890625, -0.06370925903320312, -0.05025482177734375, -0.036800384521484375, -0.023345947265625, -0.009891510009765625, 0.00356292724609375, 0.017017364501953125, 0.0304718017578125, 0.043926239013671875, 0.05738067626953125, 0.07083511352539062, 0.08428955078125, 0.09774398803710938, 0.11119842529296875, 0.12465286254882812, 0.1381072998046875, 0.15156173706054688, 0.16501617431640625, 0.17847061157226562, 0.191925048828125, 0.20537948608398438, 0.21883392333984375, 0.23228836059570312, 0.2457427978515625, 0.2591972351074219, 0.27265167236328125, 0.2861061096191406, 0.299560546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 8.0, 7.0, 16.0, 41.0, 114.0, 630.0, 125.0, 44.0, 15.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.929229736328125, -5.129326820373535, -4.329423904418945, -3.5295205116271973, -2.7296175956726074, -1.9297146797180176, -1.1298112869262695, -0.3299083709716797, 0.46999454498291016, 1.2698975801467896, 2.069800615310669, 2.869703769683838, 3.6696066856384277, 4.469509601593018, 5.269412994384766, 6.0693159103393555, 6.869218826293945, 7.669121742248535, 8.469024658203125, 9.268928527832031, 10.068830490112305, 10.868734359741211, 11.6686372756958, 12.46854019165039, 13.26844310760498, 14.06834602355957, 14.86824893951416, 15.66815185546875, 16.468055725097656, 17.26795768737793, 18.067861557006836, 18.86776351928711, 19.667667388916016, 20.467571258544922, 21.267473220825195, 22.0673770904541, 22.867279052734375, 23.66718292236328, 24.467086791992188, 25.26698875427246, 26.066890716552734, 26.86679458618164, 27.666696548461914, 28.46660041809082, 29.266502380371094, 30.06640625, 30.866310119628906, 31.66621208190918, 32.46611785888672, 33.266021728515625, 34.06592559814453, 34.86582565307617, 35.66572952270508, 36.465633392333984, 37.26553726196289, 38.06543731689453, 38.86534118652344, 39.665245056152344, 40.46514892578125, 41.26504898071289, 42.0649528503418, 42.8648567199707, 43.66476058959961, 44.46466064453125, 45.264564514160156]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 12.0, 16.0, 22.0, 21.0, 33.0, 56.0, 69.0, 381.0, 194.0, 63.0, 38.0, 29.0, 26.0, 26.0, 11.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.485276222229004, -6.855204105377197, -6.225131511688232, -5.595059394836426, -4.964986801147461, -4.334914684295654, -3.7048425674438477, -3.074769973754883, -2.444697856903076, -1.8146255016326904, -1.1845532655715942, -0.554481029510498, 0.0755913257598877, 0.7056636810302734, 1.33573579788208, 1.965808391571045, 2.5958805084228516, 3.2259528636932373, 3.856025218963623, 4.48609733581543, 5.1161699295043945, 5.746242046356201, 6.376314163208008, 7.006386756896973, 7.636458873748779, 8.266530990600586, 8.89660358428955, 9.526676177978516, 10.156747817993164, 10.786820411682129, 11.416893005371094, 12.046964645385742, 12.677038192749023, 13.307110786437988, 13.937182426452637, 14.567255020141602, 15.197327613830566, 15.827400207519531, 16.45747184753418, 17.087543487548828, 17.71761703491211, 18.347688674926758, 18.97776222229004, 19.607833862304688, 20.237905502319336, 20.867979049682617, 21.498050689697266, 22.128124237060547, 22.758193969726562, 23.38826560974121, 24.018339157104492, 24.64841079711914, 25.27848243713379, 25.90855598449707, 26.53862762451172, 27.168701171875, 27.79877281188965, 28.428844451904297, 29.058917999267578, 29.688989639282227, 30.319061279296875, 30.949134826660156, 31.579206466674805, 32.20927810668945, 32.839351654052734]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 5.0, 4.0, 9.0, 10.0, 18.0, 28.0, 23.0, 20.0, 35.0, 33.0, 40.0, 69.0, 202.0, 265.0, 62.0, 45.0, 33.0, 31.0, 17.0, 14.0, 8.0, 8.0, 7.0, 2.0, 5.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8603515625, -0.8231201171875, -0.785888671875, -0.7486572265625, -0.71142578125, -0.6741943359375, -0.636962890625, -0.5997314453125, -0.5625, -0.5252685546875, -0.488037109375, -0.4508056640625, -0.41357421875, -0.3763427734375, -0.339111328125, -0.3018798828125, -0.2646484375, -0.2274169921875, -0.190185546875, -0.1529541015625, -0.11572265625, -0.0784912109375, -0.041259765625, -0.0040283203125, 0.033203125, 0.0704345703125, 0.107666015625, 0.1448974609375, 0.18212890625, 0.2193603515625, 0.256591796875, 0.2938232421875, 0.3310546875, 0.3682861328125, 0.405517578125, 0.4427490234375, 0.47998046875, 0.5172119140625, 0.554443359375, 0.5916748046875, 0.62890625, 0.6661376953125, 0.703369140625, 0.7406005859375, 0.77783203125, 0.8150634765625, 0.852294921875, 0.8895263671875, 0.9267578125, 0.9639892578125, 1.001220703125, 1.0384521484375, 1.07568359375, 1.1129150390625, 1.150146484375, 1.1873779296875, 1.224609375, 1.2618408203125, 1.299072265625, 1.3363037109375, 1.37353515625, 1.4107666015625, 1.447998046875, 1.4852294921875, 1.5224609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 10.0, 8.0, 6.0, 17.0, 20.0, 18.0, 35.0, 40.0, 131.0, 476.0, 10251.0, 8375698.0, 1436.0, 216.0, 74.0, 28.0, 22.0, 29.0, 7.0, 10.0, 11.0, 1.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.28751564025879, -23.59864044189453, -22.909765243530273, -22.220888137817383, -21.532012939453125, -20.843137741088867, -20.15426254272461, -19.46538543701172, -18.77651023864746, -18.087635040283203, -17.398759841918945, -16.709882736206055, -16.021007537841797, -15.332132339477539, -14.643257141113281, -13.954380989074707, -13.26550579071045, -12.576630592346191, -11.887754440307617, -11.19887924194336, -10.510003089904785, -9.821127891540527, -9.132251739501953, -8.443376541137695, -7.754500865936279, -7.065625190734863, -6.376749515533447, -5.687873840332031, -4.998998641967773, -4.310122489929199, -3.6212472915649414, -2.9323716163635254, -2.2434959411621094, -1.5546202659606934, -0.8657447099685669, -0.17686915397644043, 0.5120065212249756, 1.2008821964263916, 1.8897576332092285, 2.5786333084106445, 3.2675089836120605, 3.9563846588134766, 4.645260334014893, 5.334136009216309, 6.023011207580566, 6.711887359619141, 7.400762557983398, 8.089637756347656, 8.77851390838623, 9.467389106750488, 10.156265258789062, 10.84514045715332, 11.534016609191895, 12.222891807556152, 12.911767959594727, 13.600643157958984, 14.289518356323242, 14.9783935546875, 15.667269706726074, 16.35614585876465, 17.045021057128906, 17.733896255493164, 18.422771453857422, 19.111648559570312, 19.80052375793457]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 5.0, 7.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-11.602702140808105, -11.384727478027344, -11.166753768920898, -10.948779106140137, -10.730804443359375, -10.512829780578613, -10.294855117797852, -10.076881408691406, -9.858906745910645, -9.640932083129883, -9.422958374023438, -9.204983711242676, -8.987009048461914, -8.769034385681152, -8.55105972290039, -8.333086013793945, -8.115111351013184, -7.897136688232422, -7.679162502288818, -7.461188316345215, -7.243213653564453, -7.025238990783691, -6.807264804840088, -6.589290618896484, -6.371315956115723, -6.153341293334961, -5.935367107391357, -5.717392921447754, -5.499418258666992, -5.2814435958862305, -5.063469409942627, -4.845495223999023, -4.627520561218262, -4.4095458984375, -4.1915717124938965, -3.973597288131714, -3.7556228637695312, -3.5376484394073486, -3.319674015045166, -3.1016995906829834, -2.883725166320801, -2.665750741958618, -2.4477763175964355, -2.229801893234253, -2.0118274688720703, -1.7938530445098877, -1.575878620147705, -1.3579041957855225, -1.1399297714233398, -0.9219553470611572, -0.7039809226989746, -0.486006498336792, -0.2680320739746094, -0.05005764961242676, 0.16791677474975586, 0.3858911991119385, 0.6038656234741211, 0.8218400478363037, 1.0398144721984863, 1.257788896560669, 1.4757633209228516, 1.6937377452850342, 1.9117121696472168, 2.1296865940093994, 2.347661018371582]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 3.0, 11.0, 28.0, 24.0, 46.0, 73.0, 163.0, 274.0, 532.0, 1089.0, 2734.0, 7653.0, 26367.0, 107944.0, 247058.0, 92556.0, 24105.0, 7586.0, 2942.0, 1351.0, 662.0, 377.0, 236.0, 138.0, 91.0, 58.0, 47.0, 26.0, 18.0, 27.0, 18.0, 6.0, 3.0, 7.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.6583251953125, -4.488525390625, -4.3187255859375, -4.14892578125, -3.9791259765625, -3.809326171875, -3.6395263671875, -3.4697265625, -3.2999267578125, -3.130126953125, -2.9603271484375, -2.79052734375, -2.6207275390625, -2.450927734375, -2.2811279296875, -2.111328125, -1.9415283203125, -1.771728515625, -1.6019287109375, -1.43212890625, -1.2623291015625, -1.092529296875, -0.9227294921875, -0.7529296875, -0.5831298828125, -0.413330078125, -0.2435302734375, -0.07373046875, 0.0960693359375, 0.265869140625, 0.4356689453125, 0.60546875, 0.7752685546875, 0.945068359375, 1.1148681640625, 1.28466796875, 1.4544677734375, 1.624267578125, 1.7940673828125, 1.9638671875, 2.1336669921875, 2.303466796875, 2.4732666015625, 2.64306640625, 2.8128662109375, 2.982666015625, 3.1524658203125, 3.322265625, 3.4920654296875, 3.661865234375, 3.8316650390625, 4.00146484375, 4.1712646484375, 4.341064453125, 4.5108642578125, 4.6806640625, 4.8504638671875, 5.020263671875, 5.1900634765625, 5.35986328125, 5.5296630859375, 5.699462890625, 5.8692626953125, 6.0390625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 9.0, 16.0, 33.0, 43.0, 75.0, 76.0, 118.0, 120.0, 119.0, 112.0, 76.0, 58.0, 46.0, 26.0, 16.0, 14.0, 10.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.251953125, -1.196746826171875, -1.14154052734375, -1.086334228515625, -1.0311279296875, -0.975921630859375, -0.92071533203125, -0.865509033203125, -0.810302734375, -0.755096435546875, -0.69989013671875, -0.644683837890625, -0.5894775390625, -0.534271240234375, -0.47906494140625, -0.423858642578125, -0.36865234375, -0.313446044921875, -0.25823974609375, -0.203033447265625, -0.1478271484375, -0.092620849609375, -0.03741455078125, 0.017791748046875, 0.072998046875, 0.128204345703125, 0.18341064453125, 0.238616943359375, 0.2938232421875, 0.349029541015625, 0.40423583984375, 0.459442138671875, 0.5146484375, 0.569854736328125, 0.62506103515625, 0.680267333984375, 0.7354736328125, 0.790679931640625, 0.84588623046875, 0.901092529296875, 0.956298828125, 1.011505126953125, 1.06671142578125, 1.121917724609375, 1.1771240234375, 1.232330322265625, 1.28753662109375, 1.342742919921875, 1.39794921875, 1.453155517578125, 1.50836181640625, 1.563568115234375, 1.6187744140625, 1.673980712890625, 1.72918701171875, 1.784393310546875, 1.839599609375, 1.894805908203125, 1.95001220703125, 2.005218505859375, 2.0604248046875, 2.115631103515625, 2.17083740234375, 2.226043701171875, 2.28125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 8.0, 3.0, 11.0, 13.0, 17.0, 36.0, 111.0, 110.0, 74.0, 43.0, 24.0, 12.0, 9.0, 4.0, 2.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.786001205444336, -8.569734573364258, -8.353468894958496, -8.137202262878418, -7.92093563079834, -7.70466947555542, -7.488402843475342, -7.272136688232422, -7.055870056152344, -6.839603900909424, -6.623337268829346, -6.407071113586426, -6.190804481506348, -5.974538326263428, -5.75827169418335, -5.54200553894043, -5.325738906860352, -5.109472751617432, -4.8932061195373535, -4.676939964294434, -4.4606733322143555, -4.2444071769714355, -4.028140544891357, -3.8118743896484375, -3.5956082344055176, -3.3793418407440186, -3.1630754470825195, -2.9468090534210205, -2.7305426597595215, -2.5142765045166016, -2.2980098724365234, -2.0817437171936035, -1.8654770851135254, -1.6492106914520264, -1.4329442977905273, -1.2166779041290283, -1.0004115104675293, -0.7841452360153198, -0.5678788423538208, -0.3516124486923218, -0.13534605503082275, 0.08092032372951508, 0.2971867024898529, 0.5134530663490295, 0.7297194600105286, 0.9459857940673828, 1.1622521877288818, 1.3785185813903809, 1.5947849750518799, 1.811051368713379, 2.027317762374878, 2.243584156036377, 2.459850549697876, 2.676116943359375, 2.892383098602295, 3.108649730682373, 3.324915885925293, 3.541182279586792, 3.757448673248291, 3.97371506690979, 4.189981460571289, 4.406247615814209, 4.622514247894287, 4.838780403137207, 5.055047035217285]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 6.0, 10.0, 29.0, 78.0, 77.0, 73.0, 70.0, 38.0, 24.0, 7.0, 5.0, 9.0, 4.0, 3.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7920608520507812, -3.6617164611816406, -3.5313720703125, -3.4010276794433594, -3.2706832885742188, -3.140338897705078, -3.0099945068359375, -2.879650115966797, -2.7493057250976562, -2.6189613342285156, -2.488616943359375, -2.3582725524902344, -2.2279281616210938, -2.097583770751953, -1.9672393798828125, -1.8368949890136719, -1.7065505981445312, -1.5762062072753906, -1.44586181640625, -1.3155174255371094, -1.1851730346679688, -1.0548286437988281, -0.9244842529296875, -0.7941398620605469, -0.6637954711914062, -0.5334510803222656, -0.403106689453125, -0.2727622985839844, -0.14241790771484375, -0.012073516845703125, 0.1182708740234375, 0.24861526489257812, 0.37895965576171875, 0.5093040466308594, 0.6396484375, 0.7699928283691406, 0.9003372192382812, 1.0306816101074219, 1.1610260009765625, 1.2913703918457031, 1.4217147827148438, 1.5520591735839844, 1.682403564453125, 1.8127479553222656, 1.9430923461914062, 2.073436737060547, 2.2037811279296875, 2.334125518798828, 2.4644699096679688, 2.5948143005371094, 2.72515869140625, 2.8555030822753906, 2.9858474731445312, 3.116191864013672, 3.2465362548828125, 3.376880645751953, 3.5072250366210938, 3.6375694274902344, 3.767913818359375, 3.8982582092285156, 4.028602600097656, 4.158946990966797, 4.2892913818359375, 4.419635772705078, 4.549980163574219]}, "eval/loss": 4.16819953918457, "eval/wer": 1.9665807219357399, "eval/runtime": 794.4467, "eval/samples_per_second": 3.326, "eval/steps_per_second": 0.278} \ No newline at end of file +{"train/loss": 4.4211, "train/learning_rate": 5.805515239477504e-08, "train/epoch": 1.0, "train/global_step": 1189, "_runtime": 6756, "_timestamp": 1646072785, "_step": 1191, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 199.0, 773.0, 38.0, 3.0], "bins": [-638.4752197265625, -628.0576171875, -617.6399536132812, -607.2223510742188, -596.8046875, -586.3870849609375, -575.969482421875, -565.5518188476562, -555.1342163085938, -544.7166137695312, -534.2989501953125, -523.88134765625, -513.4636840820312, -503.04608154296875, -492.6284484863281, -482.2108154296875, -471.7931823730469, -461.37554931640625, -450.9579162597656, -440.5403137207031, -430.1226806640625, -419.7050476074219, -409.28741455078125, -398.8697814941406, -388.4521484375, -378.0345153808594, -367.61688232421875, -357.19927978515625, -346.7816467285156, -336.364013671875, -325.9463806152344, -315.52874755859375, -305.1111145019531, -294.6934814453125, -284.2758483886719, -273.8582458496094, -263.44061279296875, -253.02297973632812, -242.6053466796875, -232.18771362304688, -221.77011108398438, -211.35247802734375, -200.9348602294922, -190.51722717285156, -180.099609375, -169.68197631835938, -159.26434326171875, -148.84671020507812, -138.42909240722656, -128.01145935058594, -117.59384155273438, -107.17620849609375, -96.75858306884766, -86.34095764160156, -75.92332458496094, -65.50569915771484, -55.08807373046875, -44.670448303222656, -34.2528190612793, -23.83519172668457, -13.417564392089844, -2.99993896484375, 7.417690277099609, 17.83531951904297, 28.252946853637695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 7.0, 4.0, 3.0, 2.0, 12.0, 7.0, 9.0, 10.0, 13.0, 26.0, 23.0, 22.0, 24.0, 29.0, 36.0, 37.0, 45.0, 33.0, 39.0, 37.0, 61.0, 51.0, 50.0, 48.0, 51.0, 46.0, 37.0, 24.0, 35.0, 21.0, 27.0, 20.0, 19.0, 14.0, 16.0, 12.0, 13.0, 11.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.6351318359375, -54.82221984863281, -53.009307861328125, -51.19639587402344, -49.383480072021484, -47.5705680847168, -45.75765609741211, -43.94474411010742, -42.13182830810547, -40.31891632080078, -38.506004333496094, -36.693092346191406, -34.88017654418945, -33.067264556884766, -31.254352569580078, -29.44144058227539, -27.628528594970703, -25.815616607666016, -24.002702713012695, -22.189790725708008, -20.376876831054688, -18.56396484375, -16.751052856445312, -14.938139915466309, -13.125226974487305, -11.3123140335083, -9.499401092529297, -7.686489105224609, -5.8735761642456055, -4.060663223266602, -2.247751235961914, -0.43483829498291016, 1.3780746459960938, 3.1909873485565186, 5.003900051116943, 6.816812515258789, 8.629725456237793, 10.442638397216797, 12.255550384521484, 14.068463325500488, 15.881376266479492, 17.69428825378418, 19.5072021484375, 21.320114135742188, 23.133026123046875, 24.945940017700195, 26.758852005004883, 28.571765899658203, 30.38467788696289, 32.19758987426758, 34.010501861572266, 35.82341766357422, 37.636329650878906, 39.449241638183594, 41.26215362548828, 43.07506561279297, 44.887977600097656, 46.700889587402344, 48.51380157470703, 50.32671356201172, 52.13962936401367, 53.95254135131836, 55.76545333862305, 57.578365325927734, 59.39128112792969]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 12.0, 20.0, 15.0, 32.0, 45.0, 51.0, 46.0, 68.0, 78.0, 72.0, 86.0, 83.0, 89.0, 75.0, 51.0, 40.0, 31.0, 32.0, 19.0, 12.0, 10.0, 11.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.62652587890625, -9.3936767578125, -9.16082763671875, -8.927978515625, -8.69512939453125, -8.4622802734375, -8.22943115234375, -7.99658203125, -7.76373291015625, -7.5308837890625, -7.29803466796875, -7.065185546875, -6.83233642578125, -6.5994873046875, -6.36663818359375, -6.1337890625, -5.90093994140625, -5.6680908203125, -5.43524169921875, -5.202392578125, -4.96954345703125, -4.7366943359375, -4.50384521484375, -4.27099609375, -4.03814697265625, -3.8052978515625, -3.57244873046875, -3.339599609375, -3.10675048828125, -2.8739013671875, -2.64105224609375, -2.408203125, -2.17535400390625, -1.9425048828125, -1.70965576171875, -1.476806640625, -1.24395751953125, -1.0111083984375, -0.77825927734375, -0.54541015625, -0.31256103515625, -0.0797119140625, 0.15313720703125, 0.385986328125, 0.61883544921875, 0.8516845703125, 1.08453369140625, 1.3173828125, 1.55023193359375, 1.7830810546875, 2.01593017578125, 2.248779296875, 2.48162841796875, 2.7144775390625, 2.94732666015625, 3.18017578125, 3.41302490234375, 3.6458740234375, 3.87872314453125, 4.111572265625, 4.34442138671875, 4.5772705078125, 4.81011962890625, 5.04296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 5.0, 4.0, 8.0, 11.0, 13.0, 29.0, 34.0, 72.0, 89.0, 139.0, 212.0, 396.0, 735.0, 1454.0, 3154.0, 9650.0, 51280.0, 1266920.0, 2726149.0, 110410.0, 15390.0, 4333.0, 1812.0, 835.0, 446.0, 255.0, 145.0, 110.0, 66.0, 56.0, 31.0, 17.0, 14.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.0, -21.4381103515625, -20.876220703125, -20.3143310546875, -19.75244140625, -19.1905517578125, -18.628662109375, -18.0667724609375, -17.5048828125, -16.9429931640625, -16.381103515625, -15.8192138671875, -15.25732421875, -14.6954345703125, -14.133544921875, -13.5716552734375, -13.009765625, -12.4478759765625, -11.885986328125, -11.3240966796875, -10.76220703125, -10.2003173828125, -9.638427734375, -9.0765380859375, -8.5146484375, -7.9527587890625, -7.390869140625, -6.8289794921875, -6.26708984375, -5.7052001953125, -5.143310546875, -4.5814208984375, -4.01953125, -3.4576416015625, -2.895751953125, -2.3338623046875, -1.77197265625, -1.2100830078125, -0.648193359375, -0.0863037109375, 0.4755859375, 1.0374755859375, 1.599365234375, 2.1612548828125, 2.72314453125, 3.2850341796875, 3.846923828125, 4.4088134765625, 4.970703125, 5.5325927734375, 6.094482421875, 6.6563720703125, 7.21826171875, 7.7801513671875, 8.342041015625, 8.9039306640625, 9.4658203125, 10.0277099609375, 10.589599609375, 11.1514892578125, 11.71337890625, 12.2752685546875, 12.837158203125, 13.3990478515625, 13.9609375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 10.0, 13.0, 11.0, 32.0, 53.0, 49.0, 112.0, 172.0, 272.0, 472.0, 830.0, 815.0, 513.0, 268.0, 172.0, 85.0, 60.0, 42.0, 24.0, 20.0, 11.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.671875, -27.97314453125, -27.2744140625, -26.57568359375, -25.876953125, -25.17822265625, -24.4794921875, -23.78076171875, -23.08203125, -22.38330078125, -21.6845703125, -20.98583984375, -20.287109375, -19.58837890625, -18.8896484375, -18.19091796875, -17.4921875, -16.79345703125, -16.0947265625, -15.39599609375, -14.697265625, -13.99853515625, -13.2998046875, -12.60107421875, -11.90234375, -11.20361328125, -10.5048828125, -9.80615234375, -9.107421875, -8.40869140625, -7.7099609375, -7.01123046875, -6.3125, -5.61376953125, -4.9150390625, -4.21630859375, -3.517578125, -2.81884765625, -2.1201171875, -1.42138671875, -0.72265625, -0.02392578125, 0.6748046875, 1.37353515625, 2.072265625, 2.77099609375, 3.4697265625, 4.16845703125, 4.8671875, 5.56591796875, 6.2646484375, 6.96337890625, 7.662109375, 8.36083984375, 9.0595703125, 9.75830078125, 10.45703125, 11.15576171875, 11.8544921875, 12.55322265625, 13.251953125, 13.95068359375, 14.6494140625, 15.34814453125, 16.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 24.0, 31.0, 84.0, 145.0, 272.0, 602.0, 1688.0, 19694.0, 4153828.0, 15221.0, 1551.0, 584.0, 232.0, 132.0, 58.0, 40.0, 22.0, 19.0, 9.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.2548828125, -81.072265625, -77.8896484375, -74.70703125, -71.5244140625, -68.341796875, -65.1591796875, -61.9765625, -58.7939453125, -55.611328125, -52.4287109375, -49.24609375, -46.0634765625, -42.880859375, -39.6982421875, -36.515625, -33.3330078125, -30.150390625, -26.9677734375, -23.78515625, -20.6025390625, -17.419921875, -14.2373046875, -11.0546875, -7.8720703125, -4.689453125, -1.5068359375, 1.67578125, 4.8583984375, 8.041015625, 11.2236328125, 14.40625, 17.5888671875, 20.771484375, 23.9541015625, 27.13671875, 30.3193359375, 33.501953125, 36.6845703125, 39.8671875, 43.0498046875, 46.232421875, 49.4150390625, 52.59765625, 55.7802734375, 58.962890625, 62.1455078125, 65.328125, 68.5107421875, 71.693359375, 74.8759765625, 78.05859375, 81.2412109375, 84.423828125, 87.6064453125, 90.7890625, 93.9716796875, 97.154296875, 100.3369140625, 103.51953125, 106.7021484375, 109.884765625, 113.0673828125, 116.25]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 106.0, 600.0, 285.0, 12.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.01038360595703, -31.39297103881836, -24.775558471679688, -18.15814781188965, -11.540735244750977, -4.9233245849609375, 1.6940879821777344, 8.311500549316406, 14.928913116455078, 21.54632568359375, 28.163738250732422, 34.781150817871094, 41.3985595703125, 48.01597213745117, 54.633384704589844, 61.250797271728516, 67.86820983886719, 74.4856185913086, 81.10303497314453, 87.72044372558594, 94.33786010742188, 100.95526885986328, 107.57267761230469, 114.19009399414062, 120.80751037597656, 127.42491912841797, 134.04232788085938, 140.6597442626953, 147.27716064453125, 153.89456176757812, 160.51197814941406, 167.12939453125, 173.74681091308594, 180.36422729492188, 186.98162841796875, 193.5990447998047, 200.21646118164062, 206.8338623046875, 213.45127868652344, 220.06869506835938, 226.6861114501953, 233.30352783203125, 239.92092895507812, 246.53834533691406, 253.15576171875, 259.7731628417969, 266.3905944824219, 273.00799560546875, 279.6253967285156, 286.2427978515625, 292.8602294921875, 299.4776306152344, 306.09503173828125, 312.71246337890625, 319.3298645019531, 325.947265625, 332.564697265625, 339.1820983886719, 345.7995300292969, 352.41693115234375, 359.0343322753906, 365.6517639160156, 372.2691650390625, 378.8865966796875, 385.5039978027344]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 2.0, 14.0, 16.0, 19.0, 20.0, 30.0, 27.0, 46.0, 38.0, 48.0, 50.0, 57.0, 59.0, 63.0, 59.0, 51.0, 66.0, 49.0, 45.0, 47.0, 40.0, 28.0, 24.0, 19.0, 17.0, 19.0, 6.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.2113037109375, -70.05340576171875, -67.8955078125, -65.73760986328125, -63.579708099365234, -61.421810150146484, -59.26390838623047, -57.10601043701172, -54.94811248779297, -52.79021453857422, -50.63231658935547, -48.47441482543945, -46.3165168762207, -44.15861892700195, -42.00071716308594, -39.84281921386719, -37.68492126464844, -35.52702331542969, -33.36912536621094, -31.211223602294922, -29.053325653076172, -26.895427703857422, -24.73752784729004, -22.579627990722656, -20.421730041503906, -18.263832092285156, -16.105932235717773, -13.948033332824707, -11.79013442993164, -9.632235527038574, -7.474336624145508, -5.316437721252441, -3.158538818359375, -1.0006399154663086, 1.1572589874267578, 3.315157890319824, 5.473056793212891, 7.630955696105957, 9.788854598999023, 11.94675350189209, 14.104652404785156, 16.262550354003906, 18.42045021057129, 20.578350067138672, 22.736248016357422, 24.894145965576172, 27.052045822143555, 29.209945678710938, 31.367843627929688, 33.52574157714844, 35.68363952636719, 37.8415412902832, 39.99943923950195, 42.1573371887207, 44.31523895263672, 46.47313690185547, 48.63103485107422, 50.78893280029297, 52.94683074951172, 55.104732513427734, 57.262630462646484, 59.420528411865234, 61.57843017578125, 63.736328125, 65.89422607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 13.0, 17.0, 22.0, 35.0, 42.0, 89.0, 102.0, 183.0, 302.0, 449.0, 704.0, 1127.0, 1783.0, 2727.0, 4546.0, 7419.0, 11690.0, 19468.0, 33639.0, 58963.0, 111802.0, 223293.0, 266057.0, 135739.0, 70513.0, 39252.0, 22660.0, 13811.0, 8325.0, 5118.0, 3155.0, 2007.0, 1254.0, 777.0, 550.0, 304.0, 215.0, 133.0, 87.0, 52.0, 37.0, 28.0, 10.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0], "bins": [-0.7763671875, -0.7522125244140625, -0.728057861328125, -0.7039031982421875, -0.67974853515625, -0.6555938720703125, -0.631439208984375, -0.6072845458984375, -0.5831298828125, -0.5589752197265625, -0.534820556640625, -0.5106658935546875, -0.48651123046875, -0.4623565673828125, -0.438201904296875, -0.4140472412109375, -0.389892578125, -0.3657379150390625, -0.341583251953125, -0.3174285888671875, -0.29327392578125, -0.2691192626953125, -0.244964599609375, -0.2208099365234375, -0.1966552734375, -0.1725006103515625, -0.148345947265625, -0.1241912841796875, -0.10003662109375, -0.0758819580078125, -0.051727294921875, -0.0275726318359375, -0.00341796875, 0.0207366943359375, 0.044891357421875, 0.0690460205078125, 0.09320068359375, 0.1173553466796875, 0.141510009765625, 0.1656646728515625, 0.1898193359375, 0.2139739990234375, 0.238128662109375, 0.2622833251953125, 0.28643798828125, 0.3105926513671875, 0.334747314453125, 0.3589019775390625, 0.383056640625, 0.4072113037109375, 0.431365966796875, 0.4555206298828125, 0.47967529296875, 0.5038299560546875, 0.527984619140625, 0.5521392822265625, 0.5762939453125, 0.6004486083984375, 0.624603271484375, 0.6487579345703125, 0.67291259765625, 0.6970672607421875, 0.721221923828125, 0.7453765869140625, 0.76953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 5.0, 11.0, 9.0, 10.0, 16.0, 18.0, 27.0, 23.0, 26.0, 26.0, 26.0, 27.0, 32.0, 36.0, 51.0, 36.0, 42.0, 42.0, 1063.0, 38.0, 38.0, 47.0, 41.0, 31.0, 43.0, 26.0, 35.0, 32.0, 23.0, 20.0, 14.0, 17.0, 12.0, 12.0, 15.0, 9.0, 11.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.446624755859375, -2.36199951171875, -2.277374267578125, -2.1927490234375, -2.108123779296875, -2.02349853515625, -1.938873291015625, -1.854248046875, -1.769622802734375, -1.68499755859375, -1.600372314453125, -1.5157470703125, -1.431121826171875, -1.34649658203125, -1.261871337890625, -1.17724609375, -1.092620849609375, -1.00799560546875, -0.923370361328125, -0.8387451171875, -0.754119873046875, -0.66949462890625, -0.584869384765625, -0.500244140625, -0.415618896484375, -0.33099365234375, -0.246368408203125, -0.1617431640625, -0.077117919921875, 0.00750732421875, 0.092132568359375, 0.1767578125, 0.261383056640625, 0.34600830078125, 0.430633544921875, 0.5152587890625, 0.599884033203125, 0.68450927734375, 0.769134521484375, 0.853759765625, 0.938385009765625, 1.02301025390625, 1.107635498046875, 1.1922607421875, 1.276885986328125, 1.36151123046875, 1.446136474609375, 1.53076171875, 1.615386962890625, 1.70001220703125, 1.784637451171875, 1.8692626953125, 1.953887939453125, 2.03851318359375, 2.123138427734375, 2.207763671875, 2.292388916015625, 2.37701416015625, 2.461639404296875, 2.5462646484375, 2.630889892578125, 2.71551513671875, 2.800140380859375, 2.884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 14.0, 19.0, 26.0, 45.0, 60.0, 67.0, 143.0, 166.0, 315.0, 353.0, 595.0, 886.0, 1324.0, 1876.0, 2637.0, 3929.0, 5793.0, 8424.0, 12820.0, 18899.0, 28910.0, 44685.0, 71852.0, 116453.0, 200355.0, 1249274.0, 119444.0, 73563.0, 45799.0, 29574.0, 19114.0, 12771.0, 8515.0, 5815.0, 3943.0, 2773.0, 1862.0, 1309.0, 882.0, 584.0, 413.0, 287.0, 181.0, 118.0, 74.0, 65.0, 29.0, 32.0, 22.0, 11.0, 13.0, 8.0, 1.0, 4.0, 3.0, 2.0], "bins": [-0.56787109375, -0.5506744384765625, -0.533477783203125, -0.5162811279296875, -0.49908447265625, -0.4818878173828125, -0.464691162109375, -0.4474945068359375, -0.4302978515625, -0.4131011962890625, -0.395904541015625, -0.3787078857421875, -0.36151123046875, -0.3443145751953125, -0.327117919921875, -0.3099212646484375, -0.292724609375, -0.2755279541015625, -0.258331298828125, -0.2411346435546875, -0.22393798828125, -0.2067413330078125, -0.189544677734375, -0.1723480224609375, -0.1551513671875, -0.1379547119140625, -0.120758056640625, -0.1035614013671875, -0.08636474609375, -0.0691680908203125, -0.051971435546875, -0.0347747802734375, -0.017578125, -0.0003814697265625, 0.016815185546875, 0.0340118408203125, 0.05120849609375, 0.0684051513671875, 0.085601806640625, 0.1027984619140625, 0.1199951171875, 0.1371917724609375, 0.154388427734375, 0.1715850830078125, 0.18878173828125, 0.2059783935546875, 0.223175048828125, 0.2403717041015625, 0.257568359375, 0.2747650146484375, 0.291961669921875, 0.3091583251953125, 0.32635498046875, 0.3435516357421875, 0.360748291015625, 0.3779449462890625, 0.3951416015625, 0.4123382568359375, 0.429534912109375, 0.4467315673828125, 0.46392822265625, 0.4811248779296875, 0.498321533203125, 0.5155181884765625, 0.53271484375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 17.0, 16.0, 19.0, 22.0, 30.0, 41.0, 45.0, 47.0, 55.0, 71.0, 59.0, 62.0, 59.0, 76.0, 51.0, 52.0, 43.0, 27.0, 47.0, 26.0, 22.0, 16.0, 11.0, 14.0, 11.0, 6.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002894401550292969, -0.0002780109643936157, -0.00026658177375793457, -0.0002551525831222534, -0.00024372339248657227, -0.0002322942018508911, -0.00022086501121520996, -0.0002094358205795288, -0.00019800662994384766, -0.0001865774393081665, -0.00017514824867248535, -0.0001637190580368042, -0.00015228986740112305, -0.0001408606767654419, -0.00012943148612976074, -0.00011800229549407959, -0.00010657310485839844, -9.514391422271729e-05, -8.371472358703613e-05, -7.228553295135498e-05, -6.085634231567383e-05, -4.9427151679992676e-05, -3.7997961044311523e-05, -2.656877040863037e-05, -1.5139579772949219e-05, -3.7103891372680664e-06, 7.718801498413086e-06, 1.9147992134094238e-05, 3.057718276977539e-05, 4.200637340545654e-05, 5.3435564041137695e-05, 6.486475467681885e-05, 7.62939453125e-05, 8.772313594818115e-05, 9.91523265838623e-05, 0.00011058151721954346, 0.00012201070785522461, 0.00013343989849090576, 0.00014486908912658691, 0.00015629827976226807, 0.00016772747039794922, 0.00017915666103363037, 0.00019058585166931152, 0.00020201504230499268, 0.00021344423294067383, 0.00022487342357635498, 0.00023630261421203613, 0.0002477318048477173, 0.00025916099548339844, 0.0002705901861190796, 0.00028201937675476074, 0.0002934485673904419, 0.00030487775802612305, 0.0003163069486618042, 0.00032773613929748535, 0.0003391653299331665, 0.00035059452056884766, 0.0003620237112045288, 0.00037345290184020996, 0.0003848820924758911, 0.00039631128311157227, 0.0004077404737472534, 0.00041916966438293457, 0.0004305988550186157, 0.0004420280456542969]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 7.0, 6.0, 7.0, 12.0, 11.0, 23.0, 38.0, 45.0, 41.0, 73.0, 98.0, 144.0, 191.0, 244.0, 378.0, 696.0, 3017.0, 1039662.0, 1912.0, 616.0, 389.0, 241.0, 184.0, 125.0, 92.0, 75.0, 43.0, 57.0, 29.0, 18.0, 22.0, 8.0, 5.0, 10.0, 5.0, 10.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.00812530517578125, -0.00788944959640503, -0.007653594017028809, -0.007417738437652588, -0.007181882858276367, -0.0069460272789001465, -0.006710171699523926, -0.006474316120147705, -0.006238460540771484, -0.006002604961395264, -0.005766749382019043, -0.005530893802642822, -0.0052950382232666016, -0.005059182643890381, -0.00482332706451416, -0.0045874714851379395, -0.004351615905761719, -0.004115760326385498, -0.0038799047470092773, -0.0036440491676330566, -0.003408193588256836, -0.0031723380088806152, -0.0029364824295043945, -0.002700626850128174, -0.002464771270751953, -0.0022289156913757324, -0.0019930601119995117, -0.001757204532623291, -0.0015213489532470703, -0.0012854933738708496, -0.001049637794494629, -0.0008137822151184082, -0.0005779266357421875, -0.0003420710563659668, -0.0001062154769897461, 0.0001296401023864746, 0.0003654956817626953, 0.000601351261138916, 0.0008372068405151367, 0.0010730624198913574, 0.0013089179992675781, 0.0015447735786437988, 0.0017806291580200195, 0.0020164847373962402, 0.002252340316772461, 0.0024881958961486816, 0.0027240514755249023, 0.002959907054901123, 0.0031957626342773438, 0.0034316182136535645, 0.003667473793029785, 0.003903329372406006, 0.0041391849517822266, 0.004375040531158447, 0.004610896110534668, 0.004846751689910889, 0.005082607269287109, 0.00531846284866333, 0.005554318428039551, 0.0057901740074157715, 0.006026029586791992, 0.006261885166168213, 0.006497740745544434, 0.006733596324920654, 0.006969451904296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 374.0, 640.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027660042978823185, -0.0027096248231828213, -0.002653245348483324, -0.002596865873783827, -0.002540486166253686, -0.0024841066915541887, -0.0024277272168546915, -0.0023713477421551943, -0.002314968267455697, -0.0022585887927562, -0.0022022093180567026, -0.0021458298433572054, -0.0020894501358270645, -0.0020330706611275673, -0.00197669118642807, -0.0019203117117285728, -0.0018639322370290756, -0.0018075527623295784, -0.0017511731712147593, -0.0016947936965152621, -0.001638414221815765, -0.0015820346307009459, -0.0015256551560014486, -0.0014692756813019514, -0.0014128960901871324, -0.0013565166154876351, -0.001300137024372816, -0.0012437575496733189, -0.0011873780749738216, -0.0011309986002743244, -0.0010746190091595054, -0.0010182395344600081, -0.0009618600597605109, -0.0009054805268533528, -0.0008491010521538556, -0.0007927215192466974, -0.0007363420445472002, -0.0006799625116400421, -0.0006235829787328839, -0.0005672035040333867, -0.0005108240293338895, -0.0004544445255305618, -0.0003980650217272341, -0.000341685488820076, -0.00028530601412057877, -0.00022892648121342063, -0.00017254697741009295, -0.00011616747360676527, -5.9787940699607134e-05, -3.408433258300647e-06, 5.297107418300584e-05, 0.00010935058526229113, 0.0001657300890656188, 0.00022210960742086172, 0.0002784891112241894, 0.0003348686150275171, 0.00039124811883084476, 0.00044762762263417244, 0.0005040071555413306, 0.0005603866302408278, 0.0006167661631479859, 0.0006731456378474832, 0.0007295251707546413, 0.0007859047036617994, 0.0008422841783612967]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 4.0, 8.0, 10.0, 7.0, 10.0, 11.0, 12.0, 10.0, 23.0, 9.0, 33.0, 21.0, 21.0, 39.0, 20.0, 48.0, 28.0, 32.0, 35.0, 42.0, 37.0, 52.0, 41.0, 32.0, 34.0, 35.0, 36.0, 28.0, 31.0, 28.0, 24.0, 30.0, 24.0, 24.0, 13.0, 21.0, 21.0, 13.0, 15.0, 6.0, 9.0, 4.0, 5.0, 5.0, 3.0, 7.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018829107284545898, -0.00018277112394571304, -0.0001772511750459671, -0.00017173122614622116, -0.00016621127724647522, -0.00016069132834672928, -0.00015517137944698334, -0.0001496514305472374, -0.00014413148164749146, -0.00013861153274774551, -0.00013309158384799957, -0.00012757163494825363, -0.00012205168604850769, -0.00011653173714876175, -0.00011101178824901581, -0.00010549183934926987, -9.997189044952393e-05, -9.445194154977798e-05, -8.893199265003204e-05, -8.34120437502861e-05, -7.789209485054016e-05, -7.237214595079422e-05, -6.685219705104828e-05, -6.133224815130234e-05, -5.5812299251556396e-05, -5.0292350351810455e-05, -4.4772401452064514e-05, -3.925245255231857e-05, -3.373250365257263e-05, -2.821255475282669e-05, -2.269260585308075e-05, -1.717265695333481e-05, -1.1652708053588867e-05, -6.132759153842926e-06, -6.128102540969849e-07, 4.907138645648956e-06, 1.0427087545394897e-05, 1.594703644514084e-05, 2.146698534488678e-05, 2.698693424463272e-05, 3.250688314437866e-05, 3.80268320441246e-05, 4.3546780943870544e-05, 4.9066729843616486e-05, 5.458667874336243e-05, 6.010662764310837e-05, 6.562657654285431e-05, 7.114652544260025e-05, 7.666647434234619e-05, 8.218642324209213e-05, 8.770637214183807e-05, 9.322632104158401e-05, 9.874626994132996e-05, 0.0001042662188410759, 0.00010978616774082184, 0.00011530611664056778, 0.00012082606554031372, 0.00012634601444005966, 0.0001318659633398056, 0.00013738591223955154, 0.00014290586113929749, 0.00014842581003904343, 0.00015394575893878937, 0.0001594657078385353, 0.00016498565673828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 10.0, 11.0, 16.0, 18.0, 17.0, 15.0, 31.0, 17.0, 24.0, 36.0, 34.0, 33.0, 48.0, 50.0, 50.0, 55.0, 52.0, 62.0, 58.0, 47.0, 54.0, 30.0, 44.0, 33.0, 31.0, 20.0, 15.0, 13.0, 17.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.29296875, -6.13153076171875, -5.9700927734375, -5.80865478515625, -5.647216796875, -5.48577880859375, -5.3243408203125, -5.16290283203125, -5.00146484375, -4.84002685546875, -4.6785888671875, -4.51715087890625, -4.355712890625, -4.19427490234375, -4.0328369140625, -3.87139892578125, -3.7099609375, -3.54852294921875, -3.3870849609375, -3.22564697265625, -3.064208984375, -2.90277099609375, -2.7413330078125, -2.57989501953125, -2.41845703125, -2.25701904296875, -2.0955810546875, -1.93414306640625, -1.772705078125, -1.61126708984375, -1.4498291015625, -1.28839111328125, -1.126953125, -0.96551513671875, -0.8040771484375, -0.64263916015625, -0.481201171875, -0.31976318359375, -0.1583251953125, 0.00311279296875, 0.16455078125, 0.32598876953125, 0.4874267578125, 0.64886474609375, 0.810302734375, 0.97174072265625, 1.1331787109375, 1.29461669921875, 1.4560546875, 1.61749267578125, 1.7789306640625, 1.94036865234375, 2.101806640625, 2.26324462890625, 2.4246826171875, 2.58612060546875, 2.74755859375, 2.90899658203125, 3.0704345703125, 3.23187255859375, 3.393310546875, 3.55474853515625, 3.7161865234375, 3.87762451171875, 4.0390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 9.0, 9.0, 19.0, 23.0, 20.0, 42.0, 44.0, 69.0, 103.0, 126.0, 182.0, 231.0, 321.0, 491.0, 635.0, 933.0, 1326.0, 1971.0, 3080.0, 5351.0, 10535.0, 30146.0, 756300.0, 195459.0, 19870.0, 8296.0, 4420.0, 2745.0, 1694.0, 1169.0, 828.0, 574.0, 425.0, 297.0, 223.0, 169.0, 111.0, 79.0, 67.0, 40.0, 35.0, 24.0, 19.0, 18.0, 11.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.515625, -29.58642578125, -28.6572265625, -27.72802734375, -26.798828125, -25.86962890625, -24.9404296875, -24.01123046875, -23.08203125, -22.15283203125, -21.2236328125, -20.29443359375, -19.365234375, -18.43603515625, -17.5068359375, -16.57763671875, -15.6484375, -14.71923828125, -13.7900390625, -12.86083984375, -11.931640625, -11.00244140625, -10.0732421875, -9.14404296875, -8.21484375, -7.28564453125, -6.3564453125, -5.42724609375, -4.498046875, -3.56884765625, -2.6396484375, -1.71044921875, -0.78125, 0.14794921875, 1.0771484375, 2.00634765625, 2.935546875, 3.86474609375, 4.7939453125, 5.72314453125, 6.65234375, 7.58154296875, 8.5107421875, 9.43994140625, 10.369140625, 11.29833984375, 12.2275390625, 13.15673828125, 14.0859375, 15.01513671875, 15.9443359375, 16.87353515625, 17.802734375, 18.73193359375, 19.6611328125, 20.59033203125, 21.51953125, 22.44873046875, 23.3779296875, 24.30712890625, 25.236328125, 26.16552734375, 27.0947265625, 28.02392578125, 28.953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 7.0, 8.0, 11.0, 12.0, 11.0, 14.0, 10.0, 19.0, 15.0, 22.0, 27.0, 22.0, 39.0, 30.0, 32.0, 43.0, 40.0, 55.0, 79.0, 204.0, 1642.0, 216.0, 84.0, 52.0, 37.0, 36.0, 35.0, 37.0, 29.0, 33.0, 25.0, 20.0, 19.0, 18.0, 14.0, 7.0, 10.0, 9.0, 1.0, 10.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.4609375, -12.0777587890625, -11.694580078125, -11.3114013671875, -10.92822265625, -10.5450439453125, -10.161865234375, -9.7786865234375, -9.3955078125, -9.0123291015625, -8.629150390625, -8.2459716796875, -7.86279296875, -7.4796142578125, -7.096435546875, -6.7132568359375, -6.330078125, -5.9468994140625, -5.563720703125, -5.1805419921875, -4.79736328125, -4.4141845703125, -4.031005859375, -3.6478271484375, -3.2646484375, -2.8814697265625, -2.498291015625, -2.1151123046875, -1.73193359375, -1.3487548828125, -0.965576171875, -0.5823974609375, -0.19921875, 0.1839599609375, 0.567138671875, 0.9503173828125, 1.33349609375, 1.7166748046875, 2.099853515625, 2.4830322265625, 2.8662109375, 3.2493896484375, 3.632568359375, 4.0157470703125, 4.39892578125, 4.7821044921875, 5.165283203125, 5.5484619140625, 5.931640625, 6.3148193359375, 6.697998046875, 7.0811767578125, 7.46435546875, 7.8475341796875, 8.230712890625, 8.6138916015625, 8.9970703125, 9.3802490234375, 9.763427734375, 10.1466064453125, 10.52978515625, 10.9129638671875, 11.296142578125, 11.6793212890625, 12.0625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 7.0, 8.0, 13.0, 17.0, 15.0, 24.0, 21.0, 28.0, 37.0, 37.0, 38.0, 56.0, 69.0, 172.0, 551.0, 3187.0, 3109555.0, 30118.0, 925.0, 302.0, 127.0, 72.0, 35.0, 39.0, 31.0, 29.0, 22.0, 20.0, 30.0, 19.0, 7.0, 15.0, 10.0, 12.0, 11.0, 4.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-55.0625, -53.32568359375, -51.5888671875, -49.85205078125, -48.115234375, -46.37841796875, -44.6416015625, -42.90478515625, -41.16796875, -39.43115234375, -37.6943359375, -35.95751953125, -34.220703125, -32.48388671875, -30.7470703125, -29.01025390625, -27.2734375, -25.53662109375, -23.7998046875, -22.06298828125, -20.326171875, -18.58935546875, -16.8525390625, -15.11572265625, -13.37890625, -11.64208984375, -9.9052734375, -8.16845703125, -6.431640625, -4.69482421875, -2.9580078125, -1.22119140625, 0.515625, 2.25244140625, 3.9892578125, 5.72607421875, 7.462890625, 9.19970703125, 10.9365234375, 12.67333984375, 14.41015625, 16.14697265625, 17.8837890625, 19.62060546875, 21.357421875, 23.09423828125, 24.8310546875, 26.56787109375, 28.3046875, 30.04150390625, 31.7783203125, 33.51513671875, 35.251953125, 36.98876953125, 38.7255859375, 40.46240234375, 42.19921875, 43.93603515625, 45.6728515625, 47.40966796875, 49.146484375, 50.88330078125, 52.6201171875, 54.35693359375, 56.09375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 755.0, 243.0, 11.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.55690002441406, -167.24212646484375, -162.92735290527344, -158.61257934570312, -154.2978057861328, -149.9830322265625, -145.6682586669922, -141.35348510742188, -137.0386962890625, -132.7239227294922, -128.40914916992188, -124.09437561035156, -119.77960205078125, -115.46482849121094, -111.1500473022461, -106.83527374267578, -102.5205078125, -98.20573425292969, -93.89096069335938, -89.57618713378906, -85.26141357421875, -80.94664001464844, -76.6318588256836, -72.31708526611328, -68.00231170654297, -63.687538146972656, -59.372764587402344, -55.057987213134766, -50.74321365356445, -46.42844009399414, -42.11366271972656, -37.79888916015625, -33.48411560058594, -29.169342041015625, -24.85456657409668, -20.539791107177734, -16.225017547607422, -11.91024398803711, -7.595468521118164, -3.2806930541992188, 1.0340805053710938, 5.348855018615723, 9.663629531860352, 13.97840404510498, 18.29317855834961, 22.607952117919922, 26.922727584838867, 31.237503051757812, 35.552276611328125, 39.86705017089844, 44.18182373046875, 48.49660110473633, 52.81137466430664, 57.12614822387695, 61.44092559814453, 65.75569915771484, 70.07047271728516, 74.38524627685547, 78.70001983642578, 83.0147933959961, 87.32957458496094, 91.64434814453125, 95.95912170410156, 100.27389526367188, 104.58866882324219]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 0.0, 3.0, 9.0, 5.0, 6.0, 19.0, 8.0, 7.0, 14.0, 20.0, 23.0, 27.0, 26.0, 23.0, 30.0, 32.0, 42.0, 28.0, 48.0, 43.0, 48.0, 45.0, 47.0, 38.0, 45.0, 46.0, 39.0, 35.0, 25.0, 42.0, 25.0, 28.0, 20.0, 21.0, 17.0, 11.0, 8.0, 16.0, 5.0, 9.0, 7.0, 5.0, 1.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.96411895751953, -35.4940071105957, -34.02389907836914, -32.55378723144531, -31.083677291870117, -29.613567352294922, -28.143457412719727, -26.67334747314453, -25.203235626220703, -23.733125686645508, -22.263015747070312, -20.792903900146484, -19.32279396057129, -17.852684020996094, -16.3825740814209, -14.912463188171387, -13.442354202270508, -11.972244262695312, -10.5021333694458, -9.032023429870605, -7.561913013458252, -6.091802597045898, -4.621692657470703, -3.1515817642211914, -1.681471824645996, -0.21136152744293213, 1.2587487697601318, 2.7288589477539062, 4.19896936416626, 5.669079780578613, 7.139189720153809, 8.60930061340332, 10.079410552978516, 11.549520492553711, 13.019631385803223, 14.489741325378418, 15.95985221862793, 17.429962158203125, 18.90007209777832, 20.370182037353516, 21.840293884277344, 23.31040382385254, 24.780513763427734, 26.250625610351562, 27.720735549926758, 29.190845489501953, 30.66095542907715, 32.131065368652344, 33.601173400878906, 35.071285247802734, 36.5413932800293, 38.011505126953125, 39.48161315917969, 40.951725006103516, 42.421836853027344, 43.891944885253906, 45.362056732177734, 46.83216857910156, 48.302276611328125, 49.77238845825195, 51.242496490478516, 52.712608337402344, 54.182716369628906, 55.652828216552734, 57.12294006347656]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 11.0, 10.0, 14.0, 19.0, 20.0, 17.0, 25.0, 22.0, 28.0, 25.0, 39.0, 30.0, 45.0, 51.0, 54.0, 47.0, 58.0, 54.0, 61.0, 55.0, 38.0, 35.0, 39.0, 34.0, 29.0, 19.0, 23.0, 19.0, 15.0, 11.0, 7.0, 14.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -6.020263671875, -5.85302734375, -5.685791015625, -5.5185546875, -5.351318359375, -5.18408203125, -5.016845703125, -4.849609375, -4.682373046875, -4.51513671875, -4.347900390625, -4.1806640625, -4.013427734375, -3.84619140625, -3.678955078125, -3.51171875, -3.344482421875, -3.17724609375, -3.010009765625, -2.8427734375, -2.675537109375, -2.50830078125, -2.341064453125, -2.173828125, -2.006591796875, -1.83935546875, -1.672119140625, -1.5048828125, -1.337646484375, -1.17041015625, -1.003173828125, -0.8359375, -0.668701171875, -0.50146484375, -0.334228515625, -0.1669921875, 0.000244140625, 0.16748046875, 0.334716796875, 0.501953125, 0.669189453125, 0.83642578125, 1.003662109375, 1.1708984375, 1.338134765625, 1.50537109375, 1.672607421875, 1.83984375, 2.007080078125, 2.17431640625, 2.341552734375, 2.5087890625, 2.676025390625, 2.84326171875, 3.010498046875, 3.177734375, 3.344970703125, 3.51220703125, 3.679443359375, 3.8466796875, 4.013916015625, 4.18115234375, 4.348388671875, 4.515625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 5.0, 7.0, 11.0, 21.0, 18.0, 26.0, 32.0, 53.0, 77.0, 111.0, 200.0, 319.0, 551.0, 1045.0, 2162.0, 4484.0, 10499.0, 30649.0, 201788.0, 3619767.0, 268429.0, 33329.0, 10871.0, 4800.0, 2275.0, 1155.0, 622.0, 325.0, 209.0, 129.0, 95.0, 58.0, 43.0, 24.0, 16.0, 16.0, 15.0, 7.0, 9.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.5087890625, -25.611328125, -24.7138671875, -23.81640625, -22.9189453125, -22.021484375, -21.1240234375, -20.2265625, -19.3291015625, -18.431640625, -17.5341796875, -16.63671875, -15.7392578125, -14.841796875, -13.9443359375, -13.046875, -12.1494140625, -11.251953125, -10.3544921875, -9.45703125, -8.5595703125, -7.662109375, -6.7646484375, -5.8671875, -4.9697265625, -4.072265625, -3.1748046875, -2.27734375, -1.3798828125, -0.482421875, 0.4150390625, 1.3125, 2.2099609375, 3.107421875, 4.0048828125, 4.90234375, 5.7998046875, 6.697265625, 7.5947265625, 8.4921875, 9.3896484375, 10.287109375, 11.1845703125, 12.08203125, 12.9794921875, 13.876953125, 14.7744140625, 15.671875, 16.5693359375, 17.466796875, 18.3642578125, 19.26171875, 20.1591796875, 21.056640625, 21.9541015625, 22.8515625, 23.7490234375, 24.646484375, 25.5439453125, 26.44140625, 27.3388671875, 28.236328125, 29.1337890625, 30.03125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 9.0, 16.0, 25.0, 40.0, 48.0, 56.0, 99.0, 129.0, 214.0, 346.0, 618.0, 771.0, 606.0, 346.0, 242.0, 148.0, 92.0, 73.0, 49.0, 29.0, 25.0, 33.0, 14.0, 11.0, 7.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.390625, -27.5703125, -26.75, -25.9296875, -25.109375, -24.2890625, -23.46875, -22.6484375, -21.828125, -21.0078125, -20.1875, -19.3671875, -18.546875, -17.7265625, -16.90625, -16.0859375, -15.265625, -14.4453125, -13.625, -12.8046875, -11.984375, -11.1640625, -10.34375, -9.5234375, -8.703125, -7.8828125, -7.0625, -6.2421875, -5.421875, -4.6015625, -3.78125, -2.9609375, -2.140625, -1.3203125, -0.5, 0.3203125, 1.140625, 1.9609375, 2.78125, 3.6015625, 4.421875, 5.2421875, 6.0625, 6.8828125, 7.703125, 8.5234375, 9.34375, 10.1640625, 10.984375, 11.8046875, 12.625, 13.4453125, 14.265625, 15.0859375, 15.90625, 16.7265625, 17.546875, 18.3671875, 19.1875, 20.0078125, 20.828125, 21.6484375, 22.46875, 23.2890625, 24.109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 7.0, 6.0, 11.0, 7.0, 21.0, 27.0, 36.0, 38.0, 54.0, 87.0, 123.0, 168.0, 334.0, 838.0, 13162.0, 4170489.0, 7280.0, 710.0, 339.0, 173.0, 118.0, 84.0, 49.0, 32.0, 30.0, 21.0, 16.0, 6.0, 2.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25, -80.49609375, -76.7421875, -72.98828125, -69.234375, -65.48046875, -61.7265625, -57.97265625, -54.21875, -50.46484375, -46.7109375, -42.95703125, -39.203125, -35.44921875, -31.6953125, -27.94140625, -24.1875, -20.43359375, -16.6796875, -12.92578125, -9.171875, -5.41796875, -1.6640625, 2.08984375, 5.84375, 9.59765625, 13.3515625, 17.10546875, 20.859375, 24.61328125, 28.3671875, 32.12109375, 35.875, 39.62890625, 43.3828125, 47.13671875, 50.890625, 54.64453125, 58.3984375, 62.15234375, 65.90625, 69.66015625, 73.4140625, 77.16796875, 80.921875, 84.67578125, 88.4296875, 92.18359375, 95.9375, 99.69140625, 103.4453125, 107.19921875, 110.953125, 114.70703125, 118.4609375, 122.21484375, 125.96875, 129.72265625, 133.4765625, 137.23046875, 140.984375, 144.73828125, 148.4921875, 152.24609375, 156.0]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [4.0, 2.0, 134.0, 771.0, 107.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.26115798950195, -23.710105895996094, -14.159051895141602, -4.607997894287109, 4.94305419921875, 14.49410629272461, 24.045162200927734, 33.59621047973633, 43.14726638793945, 52.69831848144531, 62.24937438964844, 71.80043029785156, 81.35147857666016, 90.90252685546875, 100.45358276367188, 110.004638671875, 119.55569458007812, 129.10675048828125, 138.65780639648438, 148.2088623046875, 157.75990295410156, 167.3109588623047, 176.8620147705078, 186.41305541992188, 195.964111328125, 205.51516723632812, 215.06622314453125, 224.61727905273438, 234.16831970214844, 243.71937561035156, 253.2704315185547, 262.82147216796875, 272.3725280761719, 281.923583984375, 291.4746398925781, 301.02569580078125, 310.5767517089844, 320.1278076171875, 329.6788330078125, 339.2298889160156, 348.78094482421875, 358.3320007324219, 367.883056640625, 377.4341125488281, 386.98516845703125, 396.53619384765625, 406.0872802734375, 415.6383056640625, 425.18939208984375, 434.7404479980469, 444.29150390625, 453.8425598144531, 463.39361572265625, 472.94464111328125, 482.4957275390625, 492.0467529296875, 501.5978088378906, 511.14886474609375, 520.6998901367188, 530.2509765625, 539.802001953125, 549.3530883789062, 558.9041137695312, 568.4552001953125, 578.0062255859375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 9.0, 12.0, 9.0, 16.0, 16.0, 19.0, 17.0, 31.0, 25.0, 26.0, 40.0, 43.0, 33.0, 34.0, 38.0, 38.0, 52.0, 44.0, 50.0, 47.0, 35.0, 47.0, 26.0, 38.0, 34.0, 19.0, 27.0, 24.0, 23.0, 21.0, 20.0, 16.0, 15.0, 8.0, 10.0, 8.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-69.60829162597656, -67.6014404296875, -65.59459686279297, -63.587745666503906, -61.580894470214844, -59.57404708862305, -57.56719970703125, -55.56034851074219, -53.553497314453125, -51.54664993286133, -49.539798736572266, -47.53295135498047, -45.526100158691406, -43.51925277709961, -41.51240539550781, -39.50555419921875, -37.49870681762695, -35.491859436035156, -33.485008239746094, -31.478160858154297, -29.471309661865234, -27.464462280273438, -25.457612991333008, -23.450763702392578, -21.44391441345215, -19.43706512451172, -17.43021583557129, -15.423367500305176, -13.416518211364746, -11.409668922424316, -9.402820587158203, -7.395971298217773, -5.389122009277344, -3.382272958755493, -1.3754239082336426, 0.6314249038696289, 2.6382741928100586, 4.645123481750488, 6.651971817016602, 8.658821105957031, 10.665670394897461, 12.67251968383789, 14.67936897277832, 16.68621826171875, 18.693065643310547, 20.69991683959961, 22.706764221191406, 24.713613510131836, 26.720462799072266, 28.727312088012695, 30.734161376953125, 32.74100875854492, 34.747859954833984, 36.75470733642578, 38.761558532714844, 40.76840591430664, 42.77525329589844, 44.782100677490234, 46.7889518737793, 48.795799255371094, 50.802650451660156, 52.80949783325195, 54.81634521484375, 56.82319641113281, 58.830047607421875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 37.0, 54.0, 79.0, 118.0, 192.0, 310.0, 453.0, 686.0, 1059.0, 1833.0, 2942.0, 4715.0, 7616.0, 12326.0, 20740.0, 34448.0, 58052.0, 101939.0, 192597.0, 265304.0, 145790.0, 79400.0, 46776.0, 27820.0, 16736.0, 9980.0, 6300.0, 3768.0, 2378.0, 1466.0, 940.0, 607.0, 356.0, 216.0, 162.0, 100.0, 80.0, 54.0, 31.0, 17.0, 11.0, 7.0, 4.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.87060546875, -0.844451904296875, -0.81829833984375, -0.792144775390625, -0.7659912109375, -0.739837646484375, -0.71368408203125, -0.687530517578125, -0.661376953125, -0.635223388671875, -0.60906982421875, -0.582916259765625, -0.5567626953125, -0.530609130859375, -0.50445556640625, -0.478302001953125, -0.4521484375, -0.425994873046875, -0.39984130859375, -0.373687744140625, -0.3475341796875, -0.321380615234375, -0.29522705078125, -0.269073486328125, -0.242919921875, -0.216766357421875, -0.19061279296875, -0.164459228515625, -0.1383056640625, -0.112152099609375, -0.08599853515625, -0.059844970703125, -0.03369140625, -0.007537841796875, 0.01861572265625, 0.044769287109375, 0.0709228515625, 0.097076416015625, 0.12322998046875, 0.149383544921875, 0.175537109375, 0.201690673828125, 0.22784423828125, 0.253997802734375, 0.2801513671875, 0.306304931640625, 0.33245849609375, 0.358612060546875, 0.384765625, 0.410919189453125, 0.43707275390625, 0.463226318359375, 0.4893798828125, 0.515533447265625, 0.54168701171875, 0.567840576171875, 0.593994140625, 0.620147705078125, 0.64630126953125, 0.672454833984375, 0.6986083984375, 0.724761962890625, 0.75091552734375, 0.777069091796875, 0.80322265625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 7.0, 4.0, 2.0, 11.0, 14.0, 9.0, 12.0, 17.0, 11.0, 26.0, 29.0, 24.0, 22.0, 20.0, 30.0, 43.0, 33.0, 32.0, 41.0, 35.0, 45.0, 1059.0, 40.0, 44.0, 39.0, 34.0, 45.0, 34.0, 31.0, 29.0, 34.0, 30.0, 20.0, 26.0, 17.0, 9.0, 14.0, 11.0, 7.0, 12.0, 5.0, 5.0, 7.0, 0.0, 9.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.734375, -2.64202880859375, -2.5496826171875, -2.45733642578125, -2.364990234375, -2.27264404296875, -2.1802978515625, -2.08795166015625, -1.99560546875, -1.90325927734375, -1.8109130859375, -1.71856689453125, -1.626220703125, -1.53387451171875, -1.4415283203125, -1.34918212890625, -1.2568359375, -1.16448974609375, -1.0721435546875, -0.97979736328125, -0.887451171875, -0.79510498046875, -0.7027587890625, -0.61041259765625, -0.51806640625, -0.42572021484375, -0.3333740234375, -0.24102783203125, -0.148681640625, -0.05633544921875, 0.0360107421875, 0.12835693359375, 0.220703125, 0.31304931640625, 0.4053955078125, 0.49774169921875, 0.590087890625, 0.68243408203125, 0.7747802734375, 0.86712646484375, 0.95947265625, 1.05181884765625, 1.1441650390625, 1.23651123046875, 1.328857421875, 1.42120361328125, 1.5135498046875, 1.60589599609375, 1.6982421875, 1.79058837890625, 1.8829345703125, 1.97528076171875, 2.067626953125, 2.15997314453125, 2.2523193359375, 2.34466552734375, 2.43701171875, 2.52935791015625, 2.6217041015625, 2.71405029296875, 2.806396484375, 2.89874267578125, 2.9910888671875, 3.08343505859375, 3.17578125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 10.0, 7.0, 15.0, 18.0, 30.0, 45.0, 61.0, 101.0, 140.0, 202.0, 320.0, 486.0, 761.0, 1079.0, 1647.0, 2387.0, 3792.0, 5561.0, 8600.0, 13120.0, 20200.0, 31747.0, 52094.0, 85638.0, 150482.0, 1299043.0, 168678.0, 95309.0, 56819.0, 35211.0, 22080.0, 14080.0, 9200.0, 6152.0, 4050.0, 2662.0, 1785.0, 1138.0, 794.0, 530.0, 349.0, 258.0, 144.0, 98.0, 78.0, 45.0, 36.0, 21.0, 10.0, 10.0, 7.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.69873046875, -0.6779327392578125, -0.657135009765625, -0.6363372802734375, -0.61553955078125, -0.5947418212890625, -0.573944091796875, -0.5531463623046875, -0.5323486328125, -0.5115509033203125, -0.490753173828125, -0.4699554443359375, -0.44915771484375, -0.4283599853515625, -0.407562255859375, -0.3867645263671875, -0.365966796875, -0.3451690673828125, -0.324371337890625, -0.3035736083984375, -0.28277587890625, -0.2619781494140625, -0.241180419921875, -0.2203826904296875, -0.1995849609375, -0.1787872314453125, -0.157989501953125, -0.1371917724609375, -0.11639404296875, -0.0955963134765625, -0.074798583984375, -0.0540008544921875, -0.033203125, -0.0124053955078125, 0.008392333984375, 0.0291900634765625, 0.04998779296875, 0.0707855224609375, 0.091583251953125, 0.1123809814453125, 0.1331787109375, 0.1539764404296875, 0.174774169921875, 0.1955718994140625, 0.21636962890625, 0.2371673583984375, 0.257965087890625, 0.2787628173828125, 0.299560546875, 0.3203582763671875, 0.341156005859375, 0.3619537353515625, 0.38275146484375, 0.4035491943359375, 0.424346923828125, 0.4451446533203125, 0.4659423828125, 0.4867401123046875, 0.507537841796875, 0.5283355712890625, 0.54913330078125, 0.5699310302734375, 0.590728759765625, 0.6115264892578125, 0.63232421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 12.0, 9.0, 16.0, 8.0, 14.0, 21.0, 24.0, 35.0, 31.0, 32.0, 28.0, 41.0, 50.0, 54.0, 55.0, 66.0, 75.0, 42.0, 45.0, 49.0, 51.0, 38.0, 46.0, 18.0, 17.0, 18.0, 14.0, 15.0, 19.0, 12.0, 5.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0005235671997070312, -0.00051068514585495, -0.0004978030920028687, -0.00048492103815078735, -0.00047203898429870605, -0.00045915693044662476, -0.00044627487659454346, -0.00043339282274246216, -0.00042051076889038086, -0.00040762871503829956, -0.00039474666118621826, -0.00038186460733413696, -0.00036898255348205566, -0.00035610049962997437, -0.00034321844577789307, -0.00033033639192581177, -0.00031745433807373047, -0.00030457228422164917, -0.00029169023036956787, -0.00027880817651748657, -0.0002659261226654053, -0.000253044068813324, -0.00024016201496124268, -0.00022727996110916138, -0.00021439790725708008, -0.00020151585340499878, -0.00018863379955291748, -0.00017575174570083618, -0.00016286969184875488, -0.00014998763799667358, -0.00013710558414459229, -0.00012422353029251099, -0.00011134147644042969, -9.845942258834839e-05, -8.557736873626709e-05, -7.269531488418579e-05, -5.981326103210449e-05, -4.693120718002319e-05, -3.4049153327941895e-05, -2.1167099475860596e-05, -8.285045623779297e-06, 4.597008228302002e-06, 1.74790620803833e-05, 3.03611159324646e-05, 4.32431697845459e-05, 5.61252236366272e-05, 6.90072774887085e-05, 8.18893313407898e-05, 9.47713851928711e-05, 0.00010765343904495239, 0.00012053549289703369, 0.000133417546749115, 0.0001462996006011963, 0.0001591816544532776, 0.0001720637083053589, 0.00018494576215744019, 0.00019782781600952148, 0.00021070986986160278, 0.00022359192371368408, 0.00023647397756576538, 0.0002493560314178467, 0.000262238085269928, 0.0002751201391220093, 0.0002880021929740906, 0.0003008842468261719]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 16.0, 11.0, 22.0, 21.0, 30.0, 39.0, 66.0, 66.0, 101.0, 144.0, 317.0, 602.0, 4301.0, 1040318.0, 1268.0, 426.0, 242.0, 148.0, 102.0, 70.0, 53.0, 32.0, 32.0, 18.0, 14.0, 20.0, 13.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00841522216796875, -0.008054494857788086, -0.007693767547607422, -0.007333040237426758, -0.006972312927246094, -0.00661158561706543, -0.006250858306884766, -0.0058901309967041016, -0.0055294036865234375, -0.0051686763763427734, -0.004807949066162109, -0.004447221755981445, -0.004086494445800781, -0.003725767135620117, -0.003365039825439453, -0.003004312515258789, -0.002643585205078125, -0.002282857894897461, -0.0019221305847167969, -0.0015614032745361328, -0.0012006759643554688, -0.0008399486541748047, -0.0004792213439941406, -0.00011849403381347656, 0.0002422332763671875, 0.0006029605865478516, 0.0009636878967285156, 0.0013244152069091797, 0.0016851425170898438, 0.002045869827270508, 0.002406597137451172, 0.002767324447631836, 0.0031280517578125, 0.003488779067993164, 0.003849506378173828, 0.004210233688354492, 0.004570960998535156, 0.00493168830871582, 0.005292415618896484, 0.0056531429290771484, 0.0060138702392578125, 0.0063745975494384766, 0.006735324859619141, 0.007096052169799805, 0.007456779479980469, 0.007817506790161133, 0.008178234100341797, 0.008538961410522461, 0.008899688720703125, 0.009260416030883789, 0.009621143341064453, 0.009981870651245117, 0.010342597961425781, 0.010703325271606445, 0.01106405258178711, 0.011424779891967773, 0.011785507202148438, 0.012146234512329102, 0.012506961822509766, 0.01286768913269043, 0.013228416442871094, 0.013589143753051758, 0.013949871063232422, 0.014310598373413086, 0.01467132568359375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 14.0, 57.0, 248.0, 461.0, 195.0, 31.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003618910850491375, -0.00034320427221246064, -0.00032451743027195334, -0.0003058306174352765, -0.0002871437754947692, -0.0002684569626580924, -0.0002497701207175851, -0.00023108330788090825, -0.00021239648049231619, -0.00019370965310372412, -0.00017502282571513206, -0.00015633599832654, -0.00013764918548986316, -0.00011896235082531348, -0.00010027553071267903, -8.158870332408696e-05, -6.29018759354949e-05, -4.4215048546902835e-05, -2.5528224796289578e-05, -6.841401045676321e-06, 1.1845426342915744e-05, 3.053225373150781e-05, 4.921907384414226e-05, 6.790590123273432e-05, 8.659272862132639e-05, 0.00010527955600991845, 0.00012396638339851052, 0.00014265321078710258, 0.00016134002362377942, 0.0001800268655642867, 0.00019871367840096354, 0.0002174005057895556, 0.00023608730407431722, 0.00025477411691099405, 0.00027346095885150135, 0.0002921477716881782, 0.0003108346136286855, 0.0003295214264653623, 0.00034820823930203915, 0.00036689508124254644, 0.00038558192318305373, 0.00040426873601973057, 0.00042295557796023786, 0.0004416423907969147, 0.000460329232737422, 0.0004790160455740988, 0.0004977028584107757, 0.0005163897294551134, 0.0005350764840841293, 0.0005537632969208062, 0.000572450109757483, 0.0005911369808018208, 0.0006098237936384976, 0.0006285106064751744, 0.0006471974193118513, 0.0006658842321485281, 0.0006845711031928658, 0.0007032579160295427, 0.0007219447288662195, 0.0007406315999105573, 0.0007593184127472341, 0.0007780052255839109, 0.0007966920384205878, 0.0008153788512572646, 0.0008340657223016024]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 9.0, 8.0, 8.0, 12.0, 21.0, 16.0, 25.0, 19.0, 28.0, 16.0, 24.0, 37.0, 27.0, 36.0, 27.0, 29.0, 37.0, 49.0, 42.0, 39.0, 49.0, 37.0, 37.0, 35.0, 36.0, 30.0, 33.0, 31.0, 26.0, 20.0, 19.0, 25.0, 19.0, 15.0, 9.0, 17.0, 7.0, 5.0, 7.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002194046974182129, -0.00021274667233228683, -0.00020608864724636078, -0.00019943062216043472, -0.00019277259707450867, -0.0001861145719885826, -0.00017945654690265656, -0.0001727985218167305, -0.00016614049673080444, -0.0001594824716448784, -0.00015282444655895233, -0.00014616642147302628, -0.00013950839638710022, -0.00013285037130117416, -0.0001261923462152481, -0.00011953432112932205, -0.000112876296043396, -0.00010621827095746994, -9.956024587154388e-05, -9.290222078561783e-05, -8.624419569969177e-05, -7.958617061376572e-05, -7.292814552783966e-05, -6.62701204419136e-05, -5.961209535598755e-05, -5.295407027006149e-05, -4.629604518413544e-05, -3.963802009820938e-05, -3.2979995012283325e-05, -2.632196992635727e-05, -1.9663944840431213e-05, -1.3005919754505157e-05, -6.3478946685791016e-06, 3.1013041734695435e-07, 6.96815550327301e-06, 1.3626180589199066e-05, 2.0284205675125122e-05, 2.6942230761051178e-05, 3.3600255846977234e-05, 4.025828093290329e-05, 4.6916306018829346e-05, 5.35743311047554e-05, 6.023235619068146e-05, 6.689038127660751e-05, 7.354840636253357e-05, 8.020643144845963e-05, 8.686445653438568e-05, 9.352248162031174e-05, 0.00010018050670623779, 0.00010683853179216385, 0.0001134965568780899, 0.00012015458196401596, 0.00012681260704994202, 0.00013347063213586807, 0.00014012865722179413, 0.00014678668230772018, 0.00015344470739364624, 0.0001601027324795723, 0.00016676075756549835, 0.0001734187826514244, 0.00018007680773735046, 0.00018673483282327652, 0.00019339285790920258, 0.00020005088299512863, 0.0002067089080810547]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 7.0, 14.0, 17.0, 22.0, 23.0, 35.0, 23.0, 35.0, 29.0, 33.0, 43.0, 40.0, 42.0, 50.0, 45.0, 59.0, 53.0, 40.0, 45.0, 43.0, 32.0, 40.0, 29.0, 27.0, 23.0, 19.0, 17.0, 14.0, 12.0, 7.0, 10.0, 9.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.7109375, -5.55352783203125, -5.3961181640625, -5.23870849609375, -5.081298828125, -4.92388916015625, -4.7664794921875, -4.60906982421875, -4.45166015625, -4.29425048828125, -4.1368408203125, -3.97943115234375, -3.822021484375, -3.66461181640625, -3.5072021484375, -3.34979248046875, -3.1923828125, -3.03497314453125, -2.8775634765625, -2.72015380859375, -2.562744140625, -2.40533447265625, -2.2479248046875, -2.09051513671875, -1.93310546875, -1.77569580078125, -1.6182861328125, -1.46087646484375, -1.303466796875, -1.14605712890625, -0.9886474609375, -0.83123779296875, -0.673828125, -0.51641845703125, -0.3590087890625, -0.20159912109375, -0.044189453125, 0.11322021484375, 0.2706298828125, 0.42803955078125, 0.58544921875, 0.74285888671875, 0.9002685546875, 1.05767822265625, 1.215087890625, 1.37249755859375, 1.5299072265625, 1.68731689453125, 1.8447265625, 2.00213623046875, 2.1595458984375, 2.31695556640625, 2.474365234375, 2.63177490234375, 2.7891845703125, 2.94659423828125, 3.10400390625, 3.26141357421875, 3.4188232421875, 3.57623291015625, 3.733642578125, 3.89105224609375, 4.0484619140625, 4.20587158203125, 4.36328125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 9.0, 13.0, 21.0, 23.0, 46.0, 48.0, 78.0, 91.0, 131.0, 225.0, 299.0, 563.0, 958.0, 1930.0, 4603.0, 13680.0, 46226.0, 193152.0, 543248.0, 178341.0, 43035.0, 12883.0, 4531.0, 1970.0, 919.0, 539.0, 304.0, 225.0, 130.0, 81.0, 70.0, 59.0, 31.0, 27.0, 15.0, 14.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.796875, -5.62872314453125, -5.4605712890625, -5.29241943359375, -5.124267578125, -4.95611572265625, -4.7879638671875, -4.61981201171875, -4.45166015625, -4.28350830078125, -4.1153564453125, -3.94720458984375, -3.779052734375, -3.61090087890625, -3.4427490234375, -3.27459716796875, -3.1064453125, -2.93829345703125, -2.7701416015625, -2.60198974609375, -2.433837890625, -2.26568603515625, -2.0975341796875, -1.92938232421875, -1.76123046875, -1.59307861328125, -1.4249267578125, -1.25677490234375, -1.088623046875, -0.92047119140625, -0.7523193359375, -0.58416748046875, -0.416015625, -0.24786376953125, -0.0797119140625, 0.08843994140625, 0.256591796875, 0.42474365234375, 0.5928955078125, 0.76104736328125, 0.92919921875, 1.09735107421875, 1.2655029296875, 1.43365478515625, 1.601806640625, 1.76995849609375, 1.9381103515625, 2.10626220703125, 2.2744140625, 2.44256591796875, 2.6107177734375, 2.77886962890625, 2.947021484375, 3.11517333984375, 3.2833251953125, 3.45147705078125, 3.61962890625, 3.78778076171875, 3.9559326171875, 4.12408447265625, 4.292236328125, 4.46038818359375, 4.6285400390625, 4.79669189453125, 4.96484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 16.0, 15.0, 17.0, 23.0, 26.0, 30.0, 25.0, 25.0, 30.0, 30.0, 40.0, 54.0, 40.0, 83.0, 437.0, 1607.0, 81.0, 38.0, 53.0, 42.0, 43.0, 42.0, 24.0, 28.0, 27.0, 17.0, 23.0, 21.0, 15.0, 19.0, 11.0, 7.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.53125, -16.0313720703125, -15.531494140625, -15.0316162109375, -14.53173828125, -14.0318603515625, -13.531982421875, -13.0321044921875, -12.5322265625, -12.0323486328125, -11.532470703125, -11.0325927734375, -10.53271484375, -10.0328369140625, -9.532958984375, -9.0330810546875, -8.533203125, -8.0333251953125, -7.533447265625, -7.0335693359375, -6.53369140625, -6.0338134765625, -5.533935546875, -5.0340576171875, -4.5341796875, -4.0343017578125, -3.534423828125, -3.0345458984375, -2.53466796875, -2.0347900390625, -1.534912109375, -1.0350341796875, -0.53515625, -0.0352783203125, 0.464599609375, 0.9644775390625, 1.46435546875, 1.9642333984375, 2.464111328125, 2.9639892578125, 3.4638671875, 3.9637451171875, 4.463623046875, 4.9635009765625, 5.46337890625, 5.9632568359375, 6.463134765625, 6.9630126953125, 7.462890625, 7.9627685546875, 8.462646484375, 8.9625244140625, 9.46240234375, 9.9622802734375, 10.462158203125, 10.9620361328125, 11.4619140625, 11.9617919921875, 12.461669921875, 12.9615478515625, 13.46142578125, 13.9613037109375, 14.461181640625, 14.9610595703125, 15.4609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 8.0, 9.0, 7.0, 9.0, 15.0, 17.0, 28.0, 22.0, 18.0, 23.0, 38.0, 31.0, 61.0, 77.0, 139.0, 191.0, 545.0, 2388.0, 2961827.0, 178001.0, 1239.0, 395.0, 174.0, 97.0, 75.0, 42.0, 37.0, 30.0, 30.0, 29.0, 21.0, 16.0, 20.0, 10.0, 6.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-36.21875, -35.044921875, -33.87109375, -32.697265625, -31.5234375, -30.349609375, -29.17578125, -28.001953125, -26.828125, -25.654296875, -24.48046875, -23.306640625, -22.1328125, -20.958984375, -19.78515625, -18.611328125, -17.4375, -16.263671875, -15.08984375, -13.916015625, -12.7421875, -11.568359375, -10.39453125, -9.220703125, -8.046875, -6.873046875, -5.69921875, -4.525390625, -3.3515625, -2.177734375, -1.00390625, 0.169921875, 1.34375, 2.517578125, 3.69140625, 4.865234375, 6.0390625, 7.212890625, 8.38671875, 9.560546875, 10.734375, 11.908203125, 13.08203125, 14.255859375, 15.4296875, 16.603515625, 17.77734375, 18.951171875, 20.125, 21.298828125, 22.47265625, 23.646484375, 24.8203125, 25.994140625, 27.16796875, 28.341796875, 29.515625, 30.689453125, 31.86328125, 33.037109375, 34.2109375, 35.384765625, 36.55859375, 37.732421875, 38.90625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 8.0, 19.0, 75.0, 173.0, 236.0, 254.0, 154.0, 59.0, 29.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962770938873291, -5.297201633453369, -4.631632328033447, -3.9660627841949463, -3.3004934787750244, -2.6349241733551025, -1.9693546295166016, -1.3037853240966797, -0.6382160186767578, 0.027353346347808838, 0.6929227113723755, 1.358492136001587, 2.024061441421509, 2.6896307468414307, 3.3552002906799316, 4.0207695960998535, 4.686338901519775, 5.351908206939697, 6.017477512359619, 6.683047294616699, 7.348616600036621, 8.014185905456543, 8.679755210876465, 9.345324516296387, 10.010893821716309, 10.67646312713623, 11.342032432556152, 12.007601737976074, 12.673171043395996, 13.338740348815918, 14.004310607910156, 14.669879913330078, 15.335447311401367, 16.00101661682129, 16.66658592224121, 17.332155227661133, 17.997724533081055, 18.663293838500977, 19.3288631439209, 19.99443244934082, 20.660001754760742, 21.325571060180664, 21.991140365600586, 22.656709671020508, 23.32227897644043, 23.98784828186035, 24.653417587280273, 25.318986892700195, 25.98455810546875, 26.650127410888672, 27.315696716308594, 27.981266021728516, 28.646835327148438, 29.31240463256836, 29.97797393798828, 30.643543243408203, 31.309112548828125, 31.974681854248047, 32.64025115966797, 33.30582046508789, 33.97138977050781, 34.636959075927734, 35.302528381347656, 35.96809768676758, 36.6336669921875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 12.0, 16.0, 10.0, 16.0, 11.0, 22.0, 22.0, 36.0, 37.0, 31.0, 47.0, 29.0, 32.0, 39.0, 44.0, 44.0, 43.0, 44.0, 56.0, 49.0, 50.0, 38.0, 27.0, 36.0, 26.0, 25.0, 22.0, 15.0, 29.0, 17.0, 8.0, 13.0, 6.0, 14.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.35805130004883, -52.647804260253906, -50.937557220458984, -49.22731018066406, -47.517066955566406, -45.806819915771484, -44.09657287597656, -42.38632583618164, -40.67607879638672, -38.9658317565918, -37.255584716796875, -35.54534149169922, -33.8350944519043, -32.124847412109375, -30.414600372314453, -28.70435333251953, -26.994110107421875, -25.283863067626953, -23.573617935180664, -21.863370895385742, -20.153125762939453, -18.44287872314453, -16.73263168334961, -15.022385597229004, -13.312139511108398, -11.601893424987793, -9.891647338867188, -8.181400299072266, -6.47115421295166, -4.760908126831055, -3.050661087036133, -1.3404150009155273, 0.36983489990234375, 2.0800812244415283, 3.790327548980713, 5.500574111938477, 7.210820198059082, 8.921066284179688, 10.63131332397461, 12.341559410095215, 14.05180549621582, 15.762051582336426, 17.47229766845703, 19.182544708251953, 20.892791748046875, 22.603036880493164, 24.313283920288086, 26.023529052734375, 27.733776092529297, 29.44402313232422, 31.154268264770508, 32.86451721191406, 34.57476043701172, 36.28500747680664, 37.99525451660156, 39.705501556396484, 41.415748596191406, 43.12599563598633, 44.83624267578125, 46.546485900878906, 48.25673294067383, 49.96697998046875, 51.67722702026367, 53.387474060058594, 55.09771728515625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 7.0, 3.0, 7.0, 9.0, 11.0, 11.0, 10.0, 18.0, 9.0, 23.0, 22.0, 28.0, 27.0, 26.0, 35.0, 36.0, 44.0, 35.0, 37.0, 46.0, 50.0, 50.0, 57.0, 55.0, 35.0, 50.0, 37.0, 38.0, 28.0, 25.0, 27.0, 21.0, 10.0, 20.0, 11.0, 12.0, 6.0, 9.0, 12.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.73046875, -5.56939697265625, -5.4083251953125, -5.24725341796875, -5.086181640625, -4.92510986328125, -4.7640380859375, -4.60296630859375, -4.44189453125, -4.28082275390625, -4.1197509765625, -3.95867919921875, -3.797607421875, -3.63653564453125, -3.4754638671875, -3.31439208984375, -3.1533203125, -2.99224853515625, -2.8311767578125, -2.67010498046875, -2.509033203125, -2.34796142578125, -2.1868896484375, -2.02581787109375, -1.86474609375, -1.70367431640625, -1.5426025390625, -1.38153076171875, -1.220458984375, -1.05938720703125, -0.8983154296875, -0.73724365234375, -0.576171875, -0.41510009765625, -0.2540283203125, -0.09295654296875, 0.068115234375, 0.22918701171875, 0.3902587890625, 0.55133056640625, 0.71240234375, 0.87347412109375, 1.0345458984375, 1.19561767578125, 1.356689453125, 1.51776123046875, 1.6788330078125, 1.83990478515625, 2.0009765625, 2.16204833984375, 2.3231201171875, 2.48419189453125, 2.645263671875, 2.80633544921875, 2.9674072265625, 3.12847900390625, 3.28955078125, 3.45062255859375, 3.6116943359375, 3.77276611328125, 3.933837890625, 4.09490966796875, 4.2559814453125, 4.41705322265625, 4.578125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 10.0, 6.0, 18.0, 14.0, 15.0, 33.0, 35.0, 56.0, 74.0, 119.0, 176.0, 343.0, 772.0, 3004.0, 24010.0, 597422.0, 3239332.0, 310238.0, 14954.0, 2170.0, 671.0, 300.0, 162.0, 97.0, 61.0, 49.0, 32.0, 28.0, 14.0, 17.0, 12.0, 5.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.46875, -19.9215087890625, -19.374267578125, -18.8270263671875, -18.27978515625, -17.7325439453125, -17.185302734375, -16.6380615234375, -16.0908203125, -15.5435791015625, -14.996337890625, -14.4490966796875, -13.90185546875, -13.3546142578125, -12.807373046875, -12.2601318359375, -11.712890625, -11.1656494140625, -10.618408203125, -10.0711669921875, -9.52392578125, -8.9766845703125, -8.429443359375, -7.8822021484375, -7.3349609375, -6.7877197265625, -6.240478515625, -5.6932373046875, -5.14599609375, -4.5987548828125, -4.051513671875, -3.5042724609375, -2.95703125, -2.4097900390625, -1.862548828125, -1.3153076171875, -0.76806640625, -0.2208251953125, 0.326416015625, 0.8736572265625, 1.4208984375, 1.9681396484375, 2.515380859375, 3.0626220703125, 3.60986328125, 4.1571044921875, 4.704345703125, 5.2515869140625, 5.798828125, 6.3460693359375, 6.893310546875, 7.4405517578125, 7.98779296875, 8.5350341796875, 9.082275390625, 9.6295166015625, 10.1767578125, 10.7239990234375, 11.271240234375, 11.8184814453125, 12.36572265625, 12.9129638671875, 13.460205078125, 14.0074462890625, 14.5546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 7.0, 16.0, 10.0, 29.0, 40.0, 58.0, 79.0, 116.0, 171.0, 280.0, 432.0, 653.0, 719.0, 492.0, 316.0, 200.0, 151.0, 94.0, 64.0, 47.0, 38.0, 17.0, 13.0, 14.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.078125, -28.335693359375, -27.59326171875, -26.850830078125, -26.1083984375, -25.365966796875, -24.62353515625, -23.881103515625, -23.138671875, -22.396240234375, -21.65380859375, -20.911376953125, -20.1689453125, -19.426513671875, -18.68408203125, -17.941650390625, -17.19921875, -16.456787109375, -15.71435546875, -14.971923828125, -14.2294921875, -13.487060546875, -12.74462890625, -12.002197265625, -11.259765625, -10.517333984375, -9.77490234375, -9.032470703125, -8.2900390625, -7.547607421875, -6.80517578125, -6.062744140625, -5.3203125, -4.577880859375, -3.83544921875, -3.093017578125, -2.3505859375, -1.608154296875, -0.86572265625, -0.123291015625, 0.619140625, 1.361572265625, 2.10400390625, 2.846435546875, 3.5888671875, 4.331298828125, 5.07373046875, 5.816162109375, 6.55859375, 7.301025390625, 8.04345703125, 8.785888671875, 9.5283203125, 10.270751953125, 11.01318359375, 11.755615234375, 12.498046875, 13.240478515625, 13.98291015625, 14.725341796875, 15.4677734375, 16.210205078125, 16.95263671875, 17.695068359375, 18.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 9.0, 18.0, 29.0, 28.0, 60.0, 76.0, 113.0, 180.0, 260.0, 464.0, 1192.0, 26659.0, 4112762.0, 49792.0, 1364.0, 474.0, 257.0, 162.0, 101.0, 82.0, 48.0, 43.0, 25.0, 22.0, 10.0, 8.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.0625, -50.8095703125, -48.556640625, -46.3037109375, -44.05078125, -41.7978515625, -39.544921875, -37.2919921875, -35.0390625, -32.7861328125, -30.533203125, -28.2802734375, -26.02734375, -23.7744140625, -21.521484375, -19.2685546875, -17.015625, -14.7626953125, -12.509765625, -10.2568359375, -8.00390625, -5.7509765625, -3.498046875, -1.2451171875, 1.0078125, 3.2607421875, 5.513671875, 7.7666015625, 10.01953125, 12.2724609375, 14.525390625, 16.7783203125, 19.03125, 21.2841796875, 23.537109375, 25.7900390625, 28.04296875, 30.2958984375, 32.548828125, 34.8017578125, 37.0546875, 39.3076171875, 41.560546875, 43.8134765625, 46.06640625, 48.3193359375, 50.572265625, 52.8251953125, 55.078125, 57.3310546875, 59.583984375, 61.8369140625, 64.08984375, 66.3427734375, 68.595703125, 70.8486328125, 73.1015625, 75.3544921875, 77.607421875, 79.8603515625, 82.11328125, 84.3662109375, 86.619140625, 88.8720703125, 91.125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 92.0, 707.0, 211.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-588.1069946289062, -577.901123046875, -567.6953125, -557.4894409179688, -547.2836303710938, -537.0777587890625, -526.8719482421875, -516.6660766601562, -506.46026611328125, -496.2544250488281, -486.048583984375, -475.8427429199219, -465.63690185546875, -455.4310607910156, -445.2252197265625, -435.01934814453125, -424.8135070800781, -414.607666015625, -404.4018249511719, -394.19598388671875, -383.9901428222656, -373.7843017578125, -363.5784606933594, -353.37261962890625, -343.166748046875, -332.9609069824219, -322.75506591796875, -312.5492248535156, -302.3433837890625, -292.1375427246094, -281.93170166015625, -271.725830078125, -261.52001953125, -251.31417846679688, -241.10833740234375, -230.90249633789062, -220.6966552734375, -210.49081420898438, -200.2849578857422, -190.07911682128906, -179.873291015625, -169.66744995117188, -159.46160888671875, -149.25576782226562, -139.0499267578125, -128.84408569335938, -118.63822937011719, -108.43238830566406, -98.2265396118164, -88.02069854736328, -77.81484985351562, -67.6090087890625, -57.403167724609375, -47.19732666015625, -36.99148178100586, -26.78563690185547, -16.579795837402344, -6.373952865600586, 3.831890106201172, 14.03773307800293, 24.243576049804688, 34.44941711425781, 44.6552619934082, 54.861106872558594, 65.06694793701172]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 3.0, 11.0, 8.0, 18.0, 12.0, 17.0, 26.0, 25.0, 21.0, 21.0, 30.0, 23.0, 40.0, 31.0, 27.0, 39.0, 46.0, 38.0, 45.0, 23.0, 46.0, 40.0, 34.0, 38.0, 27.0, 29.0, 35.0, 29.0, 24.0, 30.0, 26.0, 24.0, 23.0, 16.0, 8.0, 9.0, 14.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-54.29388427734375, -52.568817138671875, -50.84375, -49.118682861328125, -47.39361572265625, -45.668548583984375, -43.9434814453125, -42.218414306640625, -40.49334716796875, -38.768280029296875, -37.043212890625, -35.318145751953125, -33.59307861328125, -31.868011474609375, -30.1429443359375, -28.417877197265625, -26.692811965942383, -24.967744827270508, -23.242677688598633, -21.517610549926758, -19.792543411254883, -18.06747817993164, -16.342411041259766, -14.617342948913574, -12.8922758102417, -11.167208671569824, -9.44214153289795, -7.717074871063232, -5.992007732391357, -4.266941070556641, -2.5418739318847656, -0.8168067932128906, 0.9082603454589844, 2.6333274841308594, 4.358394622802734, 6.083461284637451, 7.808528423309326, 9.533595085144043, 11.258662223815918, 12.983729362487793, 14.708796501159668, 16.433862686157227, 18.1589298248291, 19.883996963500977, 21.60906410217285, 23.334131240844727, 25.0591983795166, 26.784265518188477, 28.50933265686035, 30.234399795532227, 31.9594669342041, 33.684532165527344, 35.40959930419922, 37.134666442871094, 38.85973358154297, 40.584800720214844, 42.30986785888672, 44.034934997558594, 45.76000213623047, 47.485069274902344, 49.21013641357422, 50.935203552246094, 52.66027069091797, 54.385337829589844, 56.11040496826172]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 6.0, 10.0, 9.0, 18.0, 23.0, 32.0, 37.0, 52.0, 71.0, 101.0, 157.0, 256.0, 374.0, 472.0, 721.0, 1083.0, 1570.0, 2366.0, 3531.0, 5383.0, 8465.0, 13279.0, 21158.0, 33813.0, 57093.0, 98510.0, 172252.0, 244687.0, 156638.0, 88838.0, 51828.0, 31164.0, 19382.0, 12223.0, 7711.0, 4995.0, 3338.0, 2260.0, 1439.0, 1019.0, 713.0, 431.0, 324.0, 216.0, 150.0, 118.0, 73.0, 57.0, 40.0, 23.0, 15.0, 15.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.76806640625, -0.7436141967773438, -0.7191619873046875, -0.6947097778320312, -0.670257568359375, -0.6458053588867188, -0.6213531494140625, -0.5969009399414062, -0.57244873046875, -0.5479965209960938, -0.5235443115234375, -0.49909210205078125, -0.474639892578125, -0.45018768310546875, -0.4257354736328125, -0.40128326416015625, -0.3768310546875, -0.35237884521484375, -0.3279266357421875, -0.30347442626953125, -0.279022216796875, -0.25457000732421875, -0.2301177978515625, -0.20566558837890625, -0.18121337890625, -0.15676116943359375, -0.1323089599609375, -0.10785675048828125, -0.083404541015625, -0.05895233154296875, -0.0345001220703125, -0.01004791259765625, 0.014404296875, 0.03885650634765625, 0.0633087158203125, 0.08776092529296875, 0.112213134765625, 0.13666534423828125, 0.1611175537109375, 0.18556976318359375, 0.21002197265625, 0.23447418212890625, 0.2589263916015625, 0.28337860107421875, 0.307830810546875, 0.33228302001953125, 0.3567352294921875, 0.38118743896484375, 0.4056396484375, 0.43009185791015625, 0.4545440673828125, 0.47899627685546875, 0.503448486328125, 0.5279006958007812, 0.5523529052734375, 0.5768051147460938, 0.60125732421875, 0.6257095336914062, 0.6501617431640625, 0.6746139526367188, 0.699066162109375, 0.7235183715820312, 0.7479705810546875, 0.7724227905273438, 0.796875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 4.0, 5.0, 7.0, 11.0, 8.0, 12.0, 9.0, 16.0, 14.0, 23.0, 16.0, 21.0, 19.0, 28.0, 39.0, 21.0, 43.0, 45.0, 35.0, 42.0, 45.0, 1061.0, 42.0, 40.0, 37.0, 43.0, 37.0, 26.0, 32.0, 37.0, 23.0, 25.0, 22.0, 18.0, 15.0, 15.0, 13.0, 12.0, 13.0, 8.0, 9.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.84765625, -2.75567626953125, -2.6636962890625, -2.57171630859375, -2.479736328125, -2.38775634765625, -2.2957763671875, -2.20379638671875, -2.11181640625, -2.01983642578125, -1.9278564453125, -1.83587646484375, -1.743896484375, -1.65191650390625, -1.5599365234375, -1.46795654296875, -1.3759765625, -1.28399658203125, -1.1920166015625, -1.10003662109375, -1.008056640625, -0.91607666015625, -0.8240966796875, -0.73211669921875, -0.64013671875, -0.54815673828125, -0.4561767578125, -0.36419677734375, -0.272216796875, -0.18023681640625, -0.0882568359375, 0.00372314453125, 0.095703125, 0.18768310546875, 0.2796630859375, 0.37164306640625, 0.463623046875, 0.55560302734375, 0.6475830078125, 0.73956298828125, 0.83154296875, 0.92352294921875, 1.0155029296875, 1.10748291015625, 1.199462890625, 1.29144287109375, 1.3834228515625, 1.47540283203125, 1.5673828125, 1.65936279296875, 1.7513427734375, 1.84332275390625, 1.935302734375, 2.02728271484375, 2.1192626953125, 2.21124267578125, 2.30322265625, 2.39520263671875, 2.4871826171875, 2.57916259765625, 2.671142578125, 2.76312255859375, 2.8551025390625, 2.94708251953125, 3.0390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 14.0, 15.0, 27.0, 47.0, 51.0, 112.0, 159.0, 238.0, 316.0, 522.0, 685.0, 997.0, 1476.0, 2131.0, 3245.0, 4675.0, 6797.0, 10387.0, 15530.0, 24333.0, 38678.0, 63029.0, 107734.0, 196292.0, 1284523.0, 131346.0, 75151.0, 45761.0, 28333.0, 18164.0, 11986.0, 7670.0, 5207.0, 3625.0, 2516.0, 1689.0, 1136.0, 815.0, 550.0, 364.0, 267.0, 161.0, 123.0, 84.0, 53.0, 38.0, 25.0, 18.0, 11.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6675491333007812, -0.6461334228515625, -0.6247177124023438, -0.603302001953125, -0.5818862915039062, -0.5604705810546875, -0.5390548706054688, -0.51763916015625, -0.49622344970703125, -0.4748077392578125, -0.45339202880859375, -0.431976318359375, -0.41056060791015625, -0.3891448974609375, -0.36772918701171875, -0.3463134765625, -0.32489776611328125, -0.3034820556640625, -0.28206634521484375, -0.260650634765625, -0.23923492431640625, -0.2178192138671875, -0.19640350341796875, -0.17498779296875, -0.15357208251953125, -0.1321563720703125, -0.11074066162109375, -0.089324951171875, -0.06790924072265625, -0.0464935302734375, -0.02507781982421875, -0.003662109375, 0.01775360107421875, 0.0391693115234375, 0.06058502197265625, 0.082000732421875, 0.10341644287109375, 0.1248321533203125, 0.14624786376953125, 0.16766357421875, 0.18907928466796875, 0.2104949951171875, 0.23191070556640625, 0.253326416015625, 0.27474212646484375, 0.2961578369140625, 0.31757354736328125, 0.3389892578125, 0.36040496826171875, 0.3818206787109375, 0.40323638916015625, 0.424652099609375, 0.44606781005859375, 0.4674835205078125, 0.48889923095703125, 0.51031494140625, 0.5317306518554688, 0.5531463623046875, 0.5745620727539062, 0.595977783203125, 0.6173934936523438, 0.6388092041015625, 0.6602249145507812, 0.681640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 14.0, 19.0, 16.0, 15.0, 20.0, 19.0, 31.0, 36.0, 54.0, 44.0, 66.0, 67.0, 69.0, 74.0, 60.0, 64.0, 60.0, 45.0, 40.0, 39.0, 21.0, 22.0, 20.0, 15.0, 8.0, 9.0, 10.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005450248718261719, -0.0005289986729621887, -0.0005129724740982056, -0.0004969462752342224, -0.00048092007637023926, -0.0004648938775062561, -0.00044886767864227295, -0.0004328414797782898, -0.00041681528091430664, -0.0004007890820503235, -0.00038476288318634033, -0.0003687366843223572, -0.000352710485458374, -0.00033668428659439087, -0.0003206580877304077, -0.00030463188886642456, -0.0002886056900024414, -0.00027257949113845825, -0.0002565532922744751, -0.00024052709341049194, -0.0002245008945465088, -0.00020847469568252563, -0.00019244849681854248, -0.00017642229795455933, -0.00016039609909057617, -0.00014436990022659302, -0.00012834370136260986, -0.00011231750249862671, -9.629130363464355e-05, -8.02651047706604e-05, -6.423890590667725e-05, -4.821270704269409e-05, -3.218650817871094e-05, -1.6160309314727783e-05, -1.341104507446289e-07, 1.5892088413238525e-05, 3.191828727722168e-05, 4.7944486141204834e-05, 6.397068500518799e-05, 7.999688386917114e-05, 9.60230827331543e-05, 0.00011204928159713745, 0.0001280754804611206, 0.00014410167932510376, 0.00016012787818908691, 0.00017615407705307007, 0.00019218027591705322, 0.00020820647478103638, 0.00022423267364501953, 0.00024025887250900269, 0.00025628507137298584, 0.000272311270236969, 0.00028833746910095215, 0.0003043636679649353, 0.00032038986682891846, 0.0003364160656929016, 0.00035244226455688477, 0.0003684684634208679, 0.0003844946622848511, 0.00040052086114883423, 0.0004165470600128174, 0.00043257325887680054, 0.0004485994577407837, 0.00046462565660476685, 0.00048065185546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 8.0, 4.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 17.0, 21.0, 27.0, 30.0, 65.0, 88.0, 146.0, 205.0, 363.0, 1037.0, 1037134.0, 8085.0, 515.0, 269.0, 138.0, 94.0, 69.0, 45.0, 31.0, 20.0, 21.0, 11.0, 18.0, 9.0, 12.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0130615234375, -0.012662410736083984, -0.012263298034667969, -0.011864185333251953, -0.011465072631835938, -0.011065959930419922, -0.010666847229003906, -0.01026773452758789, -0.009868621826171875, -0.00946950912475586, -0.009070396423339844, -0.008671283721923828, -0.008272171020507812, -0.007873058319091797, -0.007473945617675781, -0.007074832916259766, -0.00667572021484375, -0.006276607513427734, -0.005877494812011719, -0.005478382110595703, -0.0050792694091796875, -0.004680156707763672, -0.004281044006347656, -0.0038819313049316406, -0.003482818603515625, -0.0030837059020996094, -0.0026845932006835938, -0.002285480499267578, -0.0018863677978515625, -0.0014872550964355469, -0.0010881423950195312, -0.0006890296936035156, -0.0002899169921875, 0.00010919570922851562, 0.0005083084106445312, 0.0009074211120605469, 0.0013065338134765625, 0.0017056465148925781, 0.0021047592163085938, 0.0025038719177246094, 0.002902984619140625, 0.0033020973205566406, 0.0037012100219726562, 0.004100322723388672, 0.0044994354248046875, 0.004898548126220703, 0.005297660827636719, 0.005696773529052734, 0.00609588623046875, 0.006494998931884766, 0.006894111633300781, 0.007293224334716797, 0.0076923370361328125, 0.008091449737548828, 0.008490562438964844, 0.00888967514038086, 0.009288787841796875, 0.00968790054321289, 0.010087013244628906, 0.010486125946044922, 0.010885238647460938, 0.011284351348876953, 0.011683464050292969, 0.012082576751708984, 0.012481689453125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 116.0, 707.0, 182.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023232121020555496, -0.002281415509060025, -0.0022396191488951445, -0.00219782255589962, -0.0021560261957347393, -0.002114229602739215, -0.0020724330097436905, -0.0020306366495788097, -0.0019888400565832853, -0.0019470435800030828, -0.0019052471034228802, -0.0018634505104273558, -0.0018216540338471532, -0.0017798575572669506, -0.0017380609642714262, -0.0016962644876912236, -0.001654468011111021, -0.0016126715345308185, -0.0015708750579506159, -0.0015290784649550915, -0.001487281988374889, -0.0014454855117946863, -0.001403688918799162, -0.0013618924422189593, -0.0013200959656387568, -0.0012782994890585542, -0.0012365030124783516, -0.0011947064194828272, -0.0011529099429026246, -0.001111113466322422, -0.0010693168733268976, -0.001027520396746695, -0.0009857239201664925, -0.0009439274435862899, -0.0009021309087984264, -0.0008603343740105629, -0.0008185378974303603, -0.0007767414208501577, -0.0007349448860622942, -0.0006931483512744308, -0.0006513518746942282, -0.0006095553981140256, -0.0005677588633261621, -0.0005259623285382986, -0.00048416585195809603, -0.000442369346274063, -0.00040057284059002995, -0.0003587763349059969, -0.0003169798292219639, -0.00027518332353793085, -0.0002333868178538978, -0.00019159031216986477, -0.00014979380648583174, -0.0001079973008017987, -6.620079511776567e-05, -2.440428943373263e-05, 1.7392216250300407e-05, 5.9188721934333444e-05, 0.00010098522761836648, 0.00014278173330239952, 0.00018457823898643255, 0.0002263747446704656, 0.0002681712503544986, 0.00030996775603853166, 0.0003517642617225647]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 8.0, 3.0, 6.0, 13.0, 12.0, 19.0, 19.0, 23.0, 19.0, 25.0, 34.0, 32.0, 33.0, 34.0, 31.0, 47.0, 50.0, 40.0, 36.0, 47.0, 47.0, 46.0, 28.0, 35.0, 34.0, 29.0, 32.0, 40.0, 23.0, 18.0, 16.0, 23.0, 17.0, 14.0, 11.0, 16.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00025641918182373047, -0.00024845823645591736, -0.00024049729108810425, -0.00023253634572029114, -0.00022457540035247803, -0.00021661445498466492, -0.0002086535096168518, -0.0002006925642490387, -0.00019273161888122559, -0.00018477067351341248, -0.00017680972814559937, -0.00016884878277778625, -0.00016088783740997314, -0.00015292689204216003, -0.00014496594667434692, -0.0001370050013065338, -0.0001290440559387207, -0.00012108311057090759, -0.00011312216520309448, -0.00010516121983528137, -9.720027446746826e-05, -8.923932909965515e-05, -8.127838373184204e-05, -7.331743836402893e-05, -6.535649299621582e-05, -5.739554762840271e-05, -4.94346022605896e-05, -4.147365689277649e-05, -3.351271152496338e-05, -2.555176615715027e-05, -1.7590820789337158e-05, -9.629875421524048e-06, -1.6689300537109375e-06, 6.292015314102173e-06, 1.4252960681915283e-05, 2.2213906049728394e-05, 3.0174851417541504e-05, 3.8135796785354614e-05, 4.6096742153167725e-05, 5.4057687520980835e-05, 6.201863288879395e-05, 6.997957825660706e-05, 7.794052362442017e-05, 8.590146899223328e-05, 9.386241436004639e-05, 0.0001018233597278595, 0.00010978430509567261, 0.00011774525046348572, 0.00012570619583129883, 0.00013366714119911194, 0.00014162808656692505, 0.00014958903193473816, 0.00015754997730255127, 0.00016551092267036438, 0.0001734718680381775, 0.0001814328134059906, 0.0001893937587738037, 0.00019735470414161682, 0.00020531564950942993, 0.00021327659487724304, 0.00022123754024505615, 0.00022919848561286926, 0.00023715943098068237, 0.0002451203763484955, 0.0002530813217163086]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 14.0, 10.0, 18.0, 21.0, 32.0, 27.0, 32.0, 32.0, 24.0, 36.0, 51.0, 29.0, 48.0, 37.0, 51.0, 43.0, 51.0, 49.0, 44.0, 49.0, 36.0, 34.0, 21.0, 31.0, 31.0, 20.0, 15.0, 11.0, 9.0, 8.0, 9.0, 8.0, 11.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.2265625, -5.06439208984375, -4.9022216796875, -4.74005126953125, -4.577880859375, -4.41571044921875, -4.2535400390625, -4.09136962890625, -3.92919921875, -3.76702880859375, -3.6048583984375, -3.44268798828125, -3.280517578125, -3.11834716796875, -2.9561767578125, -2.79400634765625, -2.6318359375, -2.46966552734375, -2.3074951171875, -2.14532470703125, -1.983154296875, -1.82098388671875, -1.6588134765625, -1.49664306640625, -1.33447265625, -1.17230224609375, -1.0101318359375, -0.84796142578125, -0.685791015625, -0.52362060546875, -0.3614501953125, -0.19927978515625, -0.037109375, 0.12506103515625, 0.2872314453125, 0.44940185546875, 0.611572265625, 0.77374267578125, 0.9359130859375, 1.09808349609375, 1.26025390625, 1.42242431640625, 1.5845947265625, 1.74676513671875, 1.908935546875, 2.07110595703125, 2.2332763671875, 2.39544677734375, 2.5576171875, 2.71978759765625, 2.8819580078125, 3.04412841796875, 3.206298828125, 3.36846923828125, 3.5306396484375, 3.69281005859375, 3.85498046875, 4.01715087890625, 4.1793212890625, 4.34149169921875, 4.503662109375, 4.66583251953125, 4.8280029296875, 4.99017333984375, 5.15234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 11.0, 14.0, 11.0, 10.0, 17.0, 28.0, 36.0, 59.0, 78.0, 91.0, 143.0, 215.0, 318.0, 503.0, 735.0, 1192.0, 2123.0, 3845.0, 7421.0, 15796.0, 37459.0, 99707.0, 328021.0, 364664.0, 110647.0, 40395.0, 17154.0, 8054.0, 4065.0, 2126.0, 1272.0, 815.0, 472.0, 328.0, 219.0, 161.0, 112.0, 64.0, 40.0, 37.0, 26.0, 21.0, 16.0, 11.0, 9.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.379425048828125, -3.27056884765625, -3.161712646484375, -3.0528564453125, -2.944000244140625, -2.83514404296875, -2.726287841796875, -2.617431640625, -2.508575439453125, -2.39971923828125, -2.290863037109375, -2.1820068359375, -2.073150634765625, -1.96429443359375, -1.855438232421875, -1.74658203125, -1.637725830078125, -1.52886962890625, -1.420013427734375, -1.3111572265625, -1.202301025390625, -1.09344482421875, -0.984588623046875, -0.875732421875, -0.766876220703125, -0.65802001953125, -0.549163818359375, -0.4403076171875, -0.331451416015625, -0.22259521484375, -0.113739013671875, -0.0048828125, 0.103973388671875, 0.21282958984375, 0.321685791015625, 0.4305419921875, 0.539398193359375, 0.64825439453125, 0.757110595703125, 0.865966796875, 0.974822998046875, 1.08367919921875, 1.192535400390625, 1.3013916015625, 1.410247802734375, 1.51910400390625, 1.627960205078125, 1.73681640625, 1.845672607421875, 1.95452880859375, 2.063385009765625, 2.1722412109375, 2.281097412109375, 2.38995361328125, 2.498809814453125, 2.607666015625, 2.716522216796875, 2.82537841796875, 2.934234619140625, 3.0430908203125, 3.151947021484375, 3.26080322265625, 3.369659423828125, 3.478515625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 4.0, 12.0, 11.0, 10.0, 17.0, 19.0, 16.0, 31.0, 36.0, 32.0, 32.0, 39.0, 42.0, 46.0, 57.0, 61.0, 223.0, 1786.0, 103.0, 57.0, 64.0, 44.0, 41.0, 47.0, 35.0, 30.0, 16.0, 28.0, 15.0, 16.0, 16.0, 9.0, 13.0, 9.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -16.998291015625, -16.41845703125, -15.838623046875, -15.2587890625, -14.678955078125, -14.09912109375, -13.519287109375, -12.939453125, -12.359619140625, -11.77978515625, -11.199951171875, -10.6201171875, -10.040283203125, -9.46044921875, -8.880615234375, -8.30078125, -7.720947265625, -7.14111328125, -6.561279296875, -5.9814453125, -5.401611328125, -4.82177734375, -4.241943359375, -3.662109375, -3.082275390625, -2.50244140625, -1.922607421875, -1.3427734375, -0.762939453125, -0.18310546875, 0.396728515625, 0.9765625, 1.556396484375, 2.13623046875, 2.716064453125, 3.2958984375, 3.875732421875, 4.45556640625, 5.035400390625, 5.615234375, 6.195068359375, 6.77490234375, 7.354736328125, 7.9345703125, 8.514404296875, 9.09423828125, 9.674072265625, 10.25390625, 10.833740234375, 11.41357421875, 11.993408203125, 12.5732421875, 13.153076171875, 13.73291015625, 14.312744140625, 14.892578125, 15.472412109375, 16.05224609375, 16.632080078125, 17.2119140625, 17.791748046875, 18.37158203125, 18.951416015625, 19.53125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 5.0, 15.0, 11.0, 11.0, 21.0, 21.0, 32.0, 30.0, 31.0, 64.0, 77.0, 109.0, 202.0, 386.0, 1099.0, 12272.0, 3060969.0, 67103.0, 1903.0, 560.0, 223.0, 145.0, 97.0, 61.0, 57.0, 39.0, 28.0, 24.0, 21.0, 18.0, 11.0, 10.0, 9.0, 5.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.4375, -32.444580078125, -31.45166015625, -30.458740234375, -29.4658203125, -28.472900390625, -27.47998046875, -26.487060546875, -25.494140625, -24.501220703125, -23.50830078125, -22.515380859375, -21.5224609375, -20.529541015625, -19.53662109375, -18.543701171875, -17.55078125, -16.557861328125, -15.56494140625, -14.572021484375, -13.5791015625, -12.586181640625, -11.59326171875, -10.600341796875, -9.607421875, -8.614501953125, -7.62158203125, -6.628662109375, -5.6357421875, -4.642822265625, -3.64990234375, -2.656982421875, -1.6640625, -0.671142578125, 0.32177734375, 1.314697265625, 2.3076171875, 3.300537109375, 4.29345703125, 5.286376953125, 6.279296875, 7.272216796875, 8.26513671875, 9.258056640625, 10.2509765625, 11.243896484375, 12.23681640625, 13.229736328125, 14.22265625, 15.215576171875, 16.20849609375, 17.201416015625, 18.1943359375, 19.187255859375, 20.18017578125, 21.173095703125, 22.166015625, 23.158935546875, 24.15185546875, 25.144775390625, 26.1376953125, 27.130615234375, 28.12353515625, 29.116455078125, 30.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 14.0, 45.0, 127.0, 252.0, 296.0, 175.0, 63.0, 25.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61174201965332, -8.57434368133545, -7.536944389343262, -6.499546051025391, -5.462147235870361, -4.424748420715332, -3.387350082397461, -2.3499512672424316, -1.3125524520874023, -0.2751537561416626, 0.7622449398040771, 1.7996435165405273, 2.8370423316955566, 3.874441146850586, 4.911839485168457, 5.949238300323486, 6.986637115478516, 8.024035453796387, 9.061434745788574, 10.098833084106445, 11.136232376098633, 12.173630714416504, 13.211029052734375, 14.248428344726562, 15.285826683044434, 16.323225021362305, 17.360624313354492, 18.398021697998047, 19.435420989990234, 20.472820281982422, 21.51021957397461, 22.547616958618164, 23.58501434326172, 24.622413635253906, 25.65981101989746, 26.69721031188965, 27.734609603881836, 28.77200698852539, 29.809406280517578, 30.846805572509766, 31.884204864501953, 32.92160415649414, 33.95900344848633, 34.99639892578125, 36.03379821777344, 37.071197509765625, 38.10859680175781, 39.14599609375, 40.18339538574219, 41.220794677734375, 42.25819396972656, 43.29559326171875, 44.33298873901367, 45.37038803100586, 46.40778732299805, 47.445186614990234, 48.482582092285156, 49.519981384277344, 50.55738067626953, 51.59477996826172, 52.63217544555664, 53.66957473754883, 54.706974029541016, 55.7443733215332, 56.78177261352539]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 11.0, 8.0, 14.0, 14.0, 16.0, 25.0, 33.0, 28.0, 42.0, 40.0, 46.0, 44.0, 57.0, 44.0, 52.0, 38.0, 55.0, 36.0, 47.0, 33.0, 28.0, 36.0, 28.0, 35.0, 20.0, 24.0, 17.0, 17.0, 16.0, 15.0, 15.0, 9.0, 11.0, 6.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-55.94017028808594, -54.101715087890625, -52.26325988769531, -50.4248046875, -48.58634948730469, -46.747894287109375, -44.90943908691406, -43.07098388671875, -41.23252868652344, -39.394073486328125, -37.55561828613281, -35.7171630859375, -33.87870788574219, -32.040252685546875, -30.201799392700195, -28.363344192504883, -26.524890899658203, -24.68643569946289, -22.847980499267578, -21.009525299072266, -19.171070098876953, -17.33261489868164, -15.494161605834961, -13.655706405639648, -11.817251205444336, -9.978796005249023, -8.140340805053711, -6.301886558532715, -4.463431358337402, -2.62497615814209, -0.7865219116210938, 1.0519332885742188, 2.8903884887695312, 4.728843688964844, 6.567298412322998, 8.405753135681152, 10.244208335876465, 12.082663536071777, 13.921117782592773, 15.759572982788086, 17.5980281829834, 19.43648338317871, 21.274938583374023, 23.113391876220703, 24.951847076416016, 26.790302276611328, 28.62875747680664, 30.467212677001953, 32.305667877197266, 34.14412307739258, 35.98257827758789, 37.8210334777832, 39.659488677978516, 41.49794387817383, 43.336395263671875, 45.17485046386719, 47.0133056640625, 48.85176086425781, 50.690216064453125, 52.52867126464844, 54.36712646484375, 56.20558166503906, 58.044036865234375, 59.88249206542969, 61.720947265625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 8.0, 4.0, 11.0, 5.0, 10.0, 14.0, 12.0, 13.0, 12.0, 30.0, 22.0, 29.0, 29.0, 28.0, 32.0, 36.0, 43.0, 45.0, 30.0, 47.0, 45.0, 46.0, 49.0, 55.0, 45.0, 44.0, 35.0, 32.0, 27.0, 30.0, 26.0, 19.0, 28.0, 6.0, 10.0, 10.0, 6.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.22265625, -5.05645751953125, -4.8902587890625, -4.72406005859375, -4.557861328125, -4.39166259765625, -4.2254638671875, -4.05926513671875, -3.89306640625, -3.72686767578125, -3.5606689453125, -3.39447021484375, -3.228271484375, -3.06207275390625, -2.8958740234375, -2.72967529296875, -2.5634765625, -2.39727783203125, -2.2310791015625, -2.06488037109375, -1.898681640625, -1.73248291015625, -1.5662841796875, -1.40008544921875, -1.23388671875, -1.06768798828125, -0.9014892578125, -0.73529052734375, -0.569091796875, -0.40289306640625, -0.2366943359375, -0.07049560546875, 0.095703125, 0.26190185546875, 0.4281005859375, 0.59429931640625, 0.760498046875, 0.92669677734375, 1.0928955078125, 1.25909423828125, 1.42529296875, 1.59149169921875, 1.7576904296875, 1.92388916015625, 2.090087890625, 2.25628662109375, 2.4224853515625, 2.58868408203125, 2.7548828125, 2.92108154296875, 3.0872802734375, 3.25347900390625, 3.419677734375, 3.58587646484375, 3.7520751953125, 3.91827392578125, 4.08447265625, 4.25067138671875, 4.4168701171875, 4.58306884765625, 4.749267578125, 4.91546630859375, 5.0816650390625, 5.24786376953125, 5.4140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 11.0, 9.0, 14.0, 14.0, 20.0, 19.0, 22.0, 18.0, 30.0, 24.0, 23.0, 31.0, 28.0, 58.0, 116.0, 824.0, 17305.0, 3149680.0, 1019371.0, 5782.0, 439.0, 90.0, 49.0, 39.0, 29.0, 28.0, 30.0, 19.0, 27.0, 23.0, 18.0, 13.0, 8.0, 15.0, 12.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.953125, -28.949951171875, -27.94677734375, -26.943603515625, -25.9404296875, -24.937255859375, -23.93408203125, -22.930908203125, -21.927734375, -20.924560546875, -19.92138671875, -18.918212890625, -17.9150390625, -16.911865234375, -15.90869140625, -14.905517578125, -13.90234375, -12.899169921875, -11.89599609375, -10.892822265625, -9.8896484375, -8.886474609375, -7.88330078125, -6.880126953125, -5.876953125, -4.873779296875, -3.87060546875, -2.867431640625, -1.8642578125, -0.861083984375, 0.14208984375, 1.145263671875, 2.1484375, 3.151611328125, 4.15478515625, 5.157958984375, 6.1611328125, 7.164306640625, 8.16748046875, 9.170654296875, 10.173828125, 11.177001953125, 12.18017578125, 13.183349609375, 14.1865234375, 15.189697265625, 16.19287109375, 17.196044921875, 18.19921875, 19.202392578125, 20.20556640625, 21.208740234375, 22.2119140625, 23.215087890625, 24.21826171875, 25.221435546875, 26.224609375, 27.227783203125, 28.23095703125, 29.234130859375, 30.2373046875, 31.240478515625, 32.24365234375, 33.246826171875, 34.25]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 8.0, 17.0, 16.0, 37.0, 41.0, 79.0, 83.0, 151.0, 234.0, 338.0, 570.0, 741.0, 611.0, 402.0, 249.0, 159.0, 114.0, 79.0, 46.0, 28.0, 24.0, 13.0, 9.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.8680419921875, -26.189208984375, -25.5103759765625, -24.83154296875, -24.1527099609375, -23.473876953125, -22.7950439453125, -22.1162109375, -21.4373779296875, -20.758544921875, -20.0797119140625, -19.40087890625, -18.7220458984375, -18.043212890625, -17.3643798828125, -16.685546875, -16.0067138671875, -15.327880859375, -14.6490478515625, -13.97021484375, -13.2913818359375, -12.612548828125, -11.9337158203125, -11.2548828125, -10.5760498046875, -9.897216796875, -9.2183837890625, -8.53955078125, -7.8607177734375, -7.181884765625, -6.5030517578125, -5.82421875, -5.1453857421875, -4.466552734375, -3.7877197265625, -3.10888671875, -2.4300537109375, -1.751220703125, -1.0723876953125, -0.3935546875, 0.2852783203125, 0.964111328125, 1.6429443359375, 2.32177734375, 3.0006103515625, 3.679443359375, 4.3582763671875, 5.037109375, 5.7159423828125, 6.394775390625, 7.0736083984375, 7.75244140625, 8.4312744140625, 9.110107421875, 9.7889404296875, 10.4677734375, 11.1466064453125, 11.825439453125, 12.5042724609375, 13.18310546875, 13.8619384765625, 14.540771484375, 15.2196044921875, 15.8984375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 13.0, 19.0, 33.0, 43.0, 77.0, 123.0, 213.0, 334.0, 795.0, 11502.0, 4165605.0, 13949.0, 714.0, 350.0, 193.0, 121.0, 69.0, 49.0, 27.0, 9.0, 12.0, 5.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.1875, -68.9814453125, -65.775390625, -62.5693359375, -59.36328125, -56.1572265625, -52.951171875, -49.7451171875, -46.5390625, -43.3330078125, -40.126953125, -36.9208984375, -33.71484375, -30.5087890625, -27.302734375, -24.0966796875, -20.890625, -17.6845703125, -14.478515625, -11.2724609375, -8.06640625, -4.8603515625, -1.654296875, 1.5517578125, 4.7578125, 7.9638671875, 11.169921875, 14.3759765625, 17.58203125, 20.7880859375, 23.994140625, 27.2001953125, 30.40625, 33.6123046875, 36.818359375, 40.0244140625, 43.23046875, 46.4365234375, 49.642578125, 52.8486328125, 56.0546875, 59.2607421875, 62.466796875, 65.6728515625, 68.87890625, 72.0849609375, 75.291015625, 78.4970703125, 81.703125, 84.9091796875, 88.115234375, 91.3212890625, 94.52734375, 97.7333984375, 100.939453125, 104.1455078125, 107.3515625, 110.5576171875, 113.763671875, 116.9697265625, 120.17578125, 123.3818359375, 126.587890625, 129.7939453125, 133.0]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 62.0, 208.0, 377.0, 253.0, 84.0, 14.0, 6.0, 0.0, 2.0, 2.0], "bins": [-271.8650207519531, -267.0650634765625, -262.26507568359375, -257.4651184082031, -252.6651611328125, -247.86520385742188, -243.0652313232422, -238.2652587890625, -233.46530151367188, -228.66534423828125, -223.86537170410156, -219.06539916992188, -214.26544189453125, -209.46548461914062, -204.66551208496094, -199.86553955078125, -195.06558227539062, -190.265625, -185.4656524658203, -180.66567993164062, -175.86572265625, -171.06576538085938, -166.2657928466797, -161.4658203125, -156.66586303710938, -151.86590576171875, -147.06593322753906, -142.26596069335938, -137.46600341796875, -132.66604614257812, -127.86607360839844, -123.06610870361328, -118.26615905761719, -113.46619415283203, -108.66622924804688, -103.86626434326172, -99.06629943847656, -94.2663345336914, -89.46636962890625, -84.6664047241211, -79.86643981933594, -75.06647491455078, -70.26651000976562, -65.46654510498047, -60.66658020019531, -55.866615295410156, -51.066650390625, -46.266685485839844, -41.46672058105469, -36.66675567626953, -31.866790771484375, -27.06682586669922, -22.266860961914062, -17.466896057128906, -12.66693115234375, -7.866966247558594, -3.0670013427734375, 1.7329635620117188, 6.532928466796875, 11.332893371582031, 16.132858276367188, 20.932823181152344, 25.7327880859375, 30.532752990722656, 35.33271789550781]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 7.0, 2.0, 2.0, 8.0, 4.0, 8.0, 11.0, 5.0, 11.0, 10.0, 11.0, 21.0, 20.0, 19.0, 22.0, 26.0, 32.0, 25.0, 38.0, 48.0, 45.0, 51.0, 33.0, 48.0, 47.0, 39.0, 45.0, 40.0, 40.0, 39.0, 34.0, 35.0, 27.0, 25.0, 24.0, 13.0, 16.0, 15.0, 14.0, 9.0, 11.0, 13.0, 10.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.365203857421875, -43.54517364501953, -41.72513961791992, -39.90510940551758, -38.085079193115234, -36.265045166015625, -34.44501495361328, -32.62498474121094, -30.804954528808594, -28.984922409057617, -27.164892196655273, -25.344860076904297, -23.524829864501953, -21.704797744750977, -19.884765625, -18.064735412597656, -16.24470329284668, -14.42467212677002, -12.60464096069336, -10.784608840942383, -8.964578628540039, -7.1445465087890625, -5.324515342712402, -3.504484176635742, -1.684453010559082, 0.13557827472686768, 1.9556095600128174, 3.7756409645080566, 5.595672130584717, 7.415703773498535, 9.235734939575195, 11.055766105651855, 12.875797271728516, 14.695828437805176, 16.515859603881836, 18.335891723632812, 20.155921936035156, 21.975954055786133, 23.79598617553711, 25.616016387939453, 27.436046600341797, 29.256078720092773, 31.076108932495117, 32.896141052246094, 34.71617126464844, 36.53620147705078, 38.35623550415039, 40.176265716552734, 41.996299743652344, 43.81632995605469, 45.6363639831543, 47.45639419555664, 49.276424407958984, 51.096458435058594, 52.91648864746094, 54.73651885986328, 56.556549072265625, 58.37657928466797, 60.19661331176758, 62.01664352416992, 63.836673736572266, 65.65670776367188, 67.47673797607422, 69.29676818847656, 71.1167984008789]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 24.0, 25.0, 53.0, 63.0, 90.0, 126.0, 195.0, 275.0, 451.0, 725.0, 1186.0, 1822.0, 2953.0, 4668.0, 7752.0, 12854.0, 20597.0, 34828.0, 60651.0, 110730.0, 211067.0, 261287.0, 137905.0, 72931.0, 41731.0, 24748.0, 14848.0, 9035.0, 5655.0, 3444.0, 2189.0, 1291.0, 860.0, 544.0, 290.0, 221.0, 130.0, 81.0, 85.0, 40.0, 29.0, 20.0, 15.0, 5.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.85107421875, -0.8228607177734375, -0.794647216796875, -0.7664337158203125, -0.73822021484375, -0.7100067138671875, -0.681793212890625, -0.6535797119140625, -0.6253662109375, -0.5971527099609375, -0.568939208984375, -0.5407257080078125, -0.51251220703125, -0.4842987060546875, -0.456085205078125, -0.4278717041015625, -0.399658203125, -0.3714447021484375, -0.343231201171875, -0.3150177001953125, -0.28680419921875, -0.2585906982421875, -0.230377197265625, -0.2021636962890625, -0.1739501953125, -0.1457366943359375, -0.117523193359375, -0.0893096923828125, -0.06109619140625, -0.0328826904296875, -0.004669189453125, 0.0235443115234375, 0.0517578125, 0.0799713134765625, 0.108184814453125, 0.1363983154296875, 0.16461181640625, 0.1928253173828125, 0.221038818359375, 0.2492523193359375, 0.2774658203125, 0.3056793212890625, 0.333892822265625, 0.3621063232421875, 0.39031982421875, 0.4185333251953125, 0.446746826171875, 0.4749603271484375, 0.503173828125, 0.5313873291015625, 0.559600830078125, 0.5878143310546875, 0.61602783203125, 0.6442413330078125, 0.672454833984375, 0.7006683349609375, 0.7288818359375, 0.7570953369140625, 0.785308837890625, 0.8135223388671875, 0.84173583984375, 0.8699493408203125, 0.898162841796875, 0.9263763427734375, 0.95458984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 1.0, 3.0, 5.0, 9.0, 9.0, 14.0, 12.0, 16.0, 23.0, 21.0, 22.0, 28.0, 30.0, 20.0, 32.0, 41.0, 21.0, 37.0, 41.0, 33.0, 36.0, 1051.0, 41.0, 38.0, 43.0, 44.0, 37.0, 33.0, 32.0, 31.0, 32.0, 21.0, 26.0, 22.0, 19.0, 17.0, 14.0, 10.0, 7.0, 14.0, 10.0, 7.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.375, -3.274688720703125, -3.17437744140625, -3.074066162109375, -2.9737548828125, -2.873443603515625, -2.77313232421875, -2.672821044921875, -2.572509765625, -2.472198486328125, -2.37188720703125, -2.271575927734375, -2.1712646484375, -2.070953369140625, -1.97064208984375, -1.870330810546875, -1.77001953125, -1.669708251953125, -1.56939697265625, -1.469085693359375, -1.3687744140625, -1.268463134765625, -1.16815185546875, -1.067840576171875, -0.967529296875, -0.867218017578125, -0.76690673828125, -0.666595458984375, -0.5662841796875, -0.465972900390625, -0.36566162109375, -0.265350341796875, -0.1650390625, -0.064727783203125, 0.03558349609375, 0.135894775390625, 0.2362060546875, 0.336517333984375, 0.43682861328125, 0.537139892578125, 0.637451171875, 0.737762451171875, 0.83807373046875, 0.938385009765625, 1.0386962890625, 1.139007568359375, 1.23931884765625, 1.339630126953125, 1.43994140625, 1.540252685546875, 1.64056396484375, 1.740875244140625, 1.8411865234375, 1.941497802734375, 2.04180908203125, 2.142120361328125, 2.242431640625, 2.342742919921875, 2.44305419921875, 2.543365478515625, 2.6436767578125, 2.743988037109375, 2.84429931640625, 2.944610595703125, 3.044921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 17.0, 17.0, 21.0, 38.0, 57.0, 81.0, 105.0, 150.0, 246.0, 332.0, 478.0, 641.0, 929.0, 1311.0, 1725.0, 2507.0, 3548.0, 5109.0, 7005.0, 10326.0, 14945.0, 21992.0, 32681.0, 49468.0, 77491.0, 125528.0, 1253785.0, 175974.0, 106980.0, 67359.0, 43701.0, 28777.0, 19481.0, 13311.0, 8981.0, 6556.0, 4511.0, 3133.0, 2279.0, 1594.0, 1176.0, 807.0, 605.0, 419.0, 283.0, 182.0, 148.0, 101.0, 70.0, 49.0, 34.0, 29.0, 20.0, 15.0, 5.0, 6.0, 4.0, 3.0], "bins": [-0.65673828125, -0.6367416381835938, -0.6167449951171875, -0.5967483520507812, -0.576751708984375, -0.5567550659179688, -0.5367584228515625, -0.5167617797851562, -0.49676513671875, -0.47676849365234375, -0.4567718505859375, -0.43677520751953125, -0.416778564453125, -0.39678192138671875, -0.3767852783203125, -0.35678863525390625, -0.3367919921875, -0.31679534912109375, -0.2967987060546875, -0.27680206298828125, -0.256805419921875, -0.23680877685546875, -0.2168121337890625, -0.19681549072265625, -0.17681884765625, -0.15682220458984375, -0.1368255615234375, -0.11682891845703125, -0.096832275390625, -0.07683563232421875, -0.0568389892578125, -0.03684234619140625, -0.016845703125, 0.00315093994140625, 0.0231475830078125, 0.04314422607421875, 0.063140869140625, 0.08313751220703125, 0.1031341552734375, 0.12313079833984375, 0.14312744140625, 0.16312408447265625, 0.1831207275390625, 0.20311737060546875, 0.223114013671875, 0.24311065673828125, 0.2631072998046875, 0.28310394287109375, 0.3031005859375, 0.32309722900390625, 0.3430938720703125, 0.36309051513671875, 0.383087158203125, 0.40308380126953125, 0.4230804443359375, 0.44307708740234375, 0.46307373046875, 0.48307037353515625, 0.5030670166015625, 0.5230636596679688, 0.543060302734375, 0.5630569458007812, 0.5830535888671875, 0.6030502319335938, 0.623046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 5.0, 10.0, 14.0, 17.0, 28.0, 24.0, 27.0, 37.0, 58.0, 58.0, 75.0, 70.0, 75.0, 75.0, 78.0, 52.0, 61.0, 46.0, 32.0, 35.0, 24.0, 9.0, 8.0, 11.0, 9.0, 11.0, 8.0, 7.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005273818969726562, -0.0005113109946250916, -0.0004952400922775269, -0.00047916918992996216, -0.00046309828758239746, -0.00044702738523483276, -0.00043095648288726807, -0.00041488558053970337, -0.00039881467819213867, -0.000382743775844574, -0.0003666728734970093, -0.0003506019711494446, -0.0003345310688018799, -0.0003184601664543152, -0.0003023892641067505, -0.0002863183617591858, -0.0002702474594116211, -0.0002541765570640564, -0.0002381056547164917, -0.000222034752368927, -0.0002059638500213623, -0.0001898929476737976, -0.0001738220453262329, -0.0001577511429786682, -0.00014168024063110352, -0.00012560933828353882, -0.00010953843593597412, -9.346753358840942e-05, -7.739663124084473e-05, -6.132572889328003e-05, -4.525482654571533e-05, -2.9183924198150635e-05, -1.3113021850585938e-05, 2.9578804969787598e-06, 1.9028782844543457e-05, 3.5099685192108154e-05, 5.117058753967285e-05, 6.724148988723755e-05, 8.331239223480225e-05, 9.938329458236694e-05, 0.00011545419692993164, 0.00013152509927749634, 0.00014759600162506104, 0.00016366690397262573, 0.00017973780632019043, 0.00019580870866775513, 0.00021187961101531982, 0.00022795051336288452, 0.00024402141571044922, 0.0002600923180580139, 0.0002761632204055786, 0.0002922341227531433, 0.000308305025100708, 0.0003243759274482727, 0.0003404468297958374, 0.0003565177321434021, 0.0003725886344909668, 0.0003886595368385315, 0.0004047304391860962, 0.0004208013415336609, 0.0004368722438812256, 0.0004529431462287903, 0.000469014048576355, 0.0004850849509239197, 0.0005011558532714844]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 8.0, 9.0, 12.0, 23.0, 24.0, 45.0, 69.0, 120.0, 163.0, 288.0, 509.0, 4461.0, 1039695.0, 1910.0, 485.0, 224.0, 146.0, 120.0, 67.0, 51.0, 38.0, 21.0, 24.0, 2.0, 8.0, 5.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01320648193359375, -0.012786149978637695, -0.01236581802368164, -0.011945486068725586, -0.011525154113769531, -0.011104822158813477, -0.010684490203857422, -0.010264158248901367, -0.009843826293945312, -0.009423494338989258, -0.009003162384033203, -0.008582830429077148, -0.008162498474121094, -0.007742166519165039, -0.007321834564208984, -0.00690150260925293, -0.006481170654296875, -0.00606083869934082, -0.005640506744384766, -0.005220174789428711, -0.004799842834472656, -0.0043795108795166016, -0.003959178924560547, -0.003538846969604492, -0.0031185150146484375, -0.002698183059692383, -0.002277851104736328, -0.0018575191497802734, -0.0014371871948242188, -0.001016855239868164, -0.0005965232849121094, -0.0001761913299560547, 0.000244140625, 0.0006644725799560547, 0.0010848045349121094, 0.001505136489868164, 0.0019254684448242188, 0.0023458003997802734, 0.002766132354736328, 0.003186464309692383, 0.0036067962646484375, 0.004027128219604492, 0.004447460174560547, 0.0048677921295166016, 0.005288124084472656, 0.005708456039428711, 0.006128787994384766, 0.00654911994934082, 0.006969451904296875, 0.00738978385925293, 0.007810115814208984, 0.008230447769165039, 0.008650779724121094, 0.009071111679077148, 0.009491443634033203, 0.009911775588989258, 0.010332107543945312, 0.010752439498901367, 0.011172771453857422, 0.011593103408813477, 0.012013435363769531, 0.012433767318725586, 0.01285409927368164, 0.013274431228637695, 0.01369476318359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 498.0, 463.0, 32.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003202585969120264, -0.003145412774756551, -0.003088239813223481, -0.003031066618859768, -0.0029738936573266983, -0.002916720462962985, -0.0028595475014299154, -0.002802374307066202, -0.0027452013455331326, -0.0026880281511694193, -0.0026308551896363497, -0.0025736819952726364, -0.002516509033739567, -0.0024593358393758535, -0.002402162877842784, -0.0023449896834790707, -0.0022878164891153574, -0.002230643294751644, -0.0021734703332185745, -0.0021162971388548613, -0.0020591241773217916, -0.0020019509829580784, -0.0019447780214250088, -0.0018876048270612955, -0.001830431865528226, -0.0017732587875798345, -0.001716085709631443, -0.0016589126316830516, -0.0016017395537346601, -0.0015445663593709469, -0.0014873933978378773, -0.001430220203474164, -0.0013730472419410944, -0.001315874163992703, -0.0012587010860443115, -0.00120152800809592, -0.0011443549301475286, -0.0010871817357838154, -0.0010300087742507458, -0.0009728355798870325, -0.0009156625019386411, -0.0008584894239902496, -0.0008013163460418582, -0.0007441432680934668, -0.0006869701319374144, -0.000629797053989023, -0.0005726239760406315, -0.0005154508398845792, -0.0004582777910400182, -0.00040110471309162676, -0.00034393160603940487, -0.00028675852809101343, -0.00022958543559070677, -0.0001724123430904001, -0.00011523926514200866, -5.806615808978677e-05, -8.930801413953304e-07, 5.628000872093253e-05, 0.00011345309758326039, 0.00017062618280760944, 0.0002277992753079161, 0.00028497236780822277, 0.0003421454457566142, 0.0003993185528088361, 0.00045649163075722754]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 16.0, 5.0, 19.0, 21.0, 27.0, 17.0, 14.0, 35.0, 32.0, 37.0, 38.0, 40.0, 39.0, 36.0, 50.0, 50.0, 33.0, 47.0, 48.0, 38.0, 42.0, 42.0, 30.0, 28.0, 30.0, 23.0, 18.0, 15.0, 12.0, 17.0, 13.0, 15.0, 9.0, 11.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0002529025077819824, -0.0002455078065395355, -0.00023811310529708862, -0.00023071840405464172, -0.00022332370281219482, -0.00021592900156974792, -0.00020853430032730103, -0.00020113959908485413, -0.00019374489784240723, -0.00018635019659996033, -0.00017895549535751343, -0.00017156079411506653, -0.00016416609287261963, -0.00015677139163017273, -0.00014937669038772583, -0.00014198198914527893, -0.00013458728790283203, -0.00012719258666038513, -0.00011979788541793823, -0.00011240318417549133, -0.00010500848293304443, -9.761378169059753e-05, -9.021908044815063e-05, -8.282437920570374e-05, -7.542967796325684e-05, -6.803497672080994e-05, -6.064027547836304e-05, -5.324557423591614e-05, -4.585087299346924e-05, -3.845617175102234e-05, -3.106147050857544e-05, -2.366676926612854e-05, -1.627206802368164e-05, -8.877366781234741e-06, -1.4826655387878418e-06, 5.912035703659058e-06, 1.3306736946105957e-05, 2.0701438188552856e-05, 2.8096139430999756e-05, 3.5490840673446655e-05, 4.2885541915893555e-05, 5.0280243158340454e-05, 5.7674944400787354e-05, 6.506964564323425e-05, 7.246434688568115e-05, 7.985904812812805e-05, 8.725374937057495e-05, 9.464845061302185e-05, 0.00010204315185546875, 0.00010943785309791565, 0.00011683255434036255, 0.00012422725558280945, 0.00013162195682525635, 0.00013901665806770325, 0.00014641135931015015, 0.00015380606055259705, 0.00016120076179504395, 0.00016859546303749084, 0.00017599016427993774, 0.00018338486552238464, 0.00019077956676483154, 0.00019817426800727844, 0.00020556896924972534, 0.00021296367049217224, 0.00022035837173461914]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 10.0, 7.0, 9.0, 15.0, 7.0, 13.0, 18.0, 14.0, 22.0, 27.0, 28.0, 21.0, 27.0, 28.0, 33.0, 46.0, 42.0, 37.0, 51.0, 50.0, 41.0, 50.0, 44.0, 49.0, 45.0, 37.0, 29.0, 29.0, 30.0, 23.0, 12.0, 18.0, 18.0, 17.0, 9.0, 17.0, 10.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.12890625, -4.96002197265625, -4.7911376953125, -4.62225341796875, -4.453369140625, -4.28448486328125, -4.1156005859375, -3.94671630859375, -3.77783203125, -3.60894775390625, -3.4400634765625, -3.27117919921875, -3.102294921875, -2.93341064453125, -2.7645263671875, -2.59564208984375, -2.4267578125, -2.25787353515625, -2.0889892578125, -1.92010498046875, -1.751220703125, -1.58233642578125, -1.4134521484375, -1.24456787109375, -1.07568359375, -0.90679931640625, -0.7379150390625, -0.56903076171875, -0.400146484375, -0.23126220703125, -0.0623779296875, 0.10650634765625, 0.275390625, 0.44427490234375, 0.6131591796875, 0.78204345703125, 0.950927734375, 1.11981201171875, 1.2886962890625, 1.45758056640625, 1.62646484375, 1.79534912109375, 1.9642333984375, 2.13311767578125, 2.302001953125, 2.47088623046875, 2.6397705078125, 2.80865478515625, 2.9775390625, 3.14642333984375, 3.3153076171875, 3.48419189453125, 3.653076171875, 3.82196044921875, 3.9908447265625, 4.15972900390625, 4.32861328125, 4.49749755859375, 4.6663818359375, 4.83526611328125, 5.004150390625, 5.17303466796875, 5.3419189453125, 5.51080322265625, 5.6796875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 5.0, 10.0, 13.0, 11.0, 23.0, 44.0, 51.0, 54.0, 78.0, 112.0, 172.0, 215.0, 344.0, 566.0, 796.0, 1415.0, 2421.0, 5063.0, 11027.0, 30647.0, 106062.0, 481712.0, 300480.0, 67911.0, 21299.0, 8435.0, 4002.0, 2128.0, 1251.0, 738.0, 485.0, 289.0, 177.0, 153.0, 97.0, 85.0, 45.0, 39.0, 26.0, 20.0, 12.0, 6.0, 8.0, 5.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.140625, -4.0145263671875, -3.888427734375, -3.7623291015625, -3.63623046875, -3.5101318359375, -3.384033203125, -3.2579345703125, -3.1318359375, -3.0057373046875, -2.879638671875, -2.7535400390625, -2.62744140625, -2.5013427734375, -2.375244140625, -2.2491455078125, -2.123046875, -1.9969482421875, -1.870849609375, -1.7447509765625, -1.61865234375, -1.4925537109375, -1.366455078125, -1.2403564453125, -1.1142578125, -0.9881591796875, -0.862060546875, -0.7359619140625, -0.60986328125, -0.4837646484375, -0.357666015625, -0.2315673828125, -0.10546875, 0.0206298828125, 0.146728515625, 0.2728271484375, 0.39892578125, 0.5250244140625, 0.651123046875, 0.7772216796875, 0.9033203125, 1.0294189453125, 1.155517578125, 1.2816162109375, 1.40771484375, 1.5338134765625, 1.659912109375, 1.7860107421875, 1.912109375, 2.0382080078125, 2.164306640625, 2.2904052734375, 2.41650390625, 2.5426025390625, 2.668701171875, 2.7947998046875, 2.9208984375, 3.0469970703125, 3.173095703125, 3.2991943359375, 3.42529296875, 3.5513916015625, 3.677490234375, 3.8035888671875, 3.9296875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 6.0, 9.0, 20.0, 13.0, 20.0, 26.0, 18.0, 34.0, 40.0, 55.0, 46.0, 53.0, 61.0, 111.0, 1926.0, 173.0, 65.0, 39.0, 50.0, 56.0, 38.0, 39.0, 34.0, 24.0, 16.0, 15.0, 15.0, 6.0, 14.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-27.484375, -26.753173828125, -26.02197265625, -25.290771484375, -24.5595703125, -23.828369140625, -23.09716796875, -22.365966796875, -21.634765625, -20.903564453125, -20.17236328125, -19.441162109375, -18.7099609375, -17.978759765625, -17.24755859375, -16.516357421875, -15.78515625, -15.053955078125, -14.32275390625, -13.591552734375, -12.8603515625, -12.129150390625, -11.39794921875, -10.666748046875, -9.935546875, -9.204345703125, -8.47314453125, -7.741943359375, -7.0107421875, -6.279541015625, -5.54833984375, -4.817138671875, -4.0859375, -3.354736328125, -2.62353515625, -1.892333984375, -1.1611328125, -0.429931640625, 0.30126953125, 1.032470703125, 1.763671875, 2.494873046875, 3.22607421875, 3.957275390625, 4.6884765625, 5.419677734375, 6.15087890625, 6.882080078125, 7.61328125, 8.344482421875, 9.07568359375, 9.806884765625, 10.5380859375, 11.269287109375, 12.00048828125, 12.731689453125, 13.462890625, 14.194091796875, 14.92529296875, 15.656494140625, 16.3876953125, 17.118896484375, 17.85009765625, 18.581298828125, 19.3125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 9.0, 12.0, 5.0, 17.0, 18.0, 15.0, 25.0, 41.0, 46.0, 68.0, 104.0, 143.0, 245.0, 590.0, 3471.0, 3014078.0, 124255.0, 1494.0, 445.0, 202.0, 118.0, 71.0, 60.0, 39.0, 14.0, 31.0, 21.0, 11.0, 18.0, 9.0, 8.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.65625, -29.513671875, -28.37109375, -27.228515625, -26.0859375, -24.943359375, -23.80078125, -22.658203125, -21.515625, -20.373046875, -19.23046875, -18.087890625, -16.9453125, -15.802734375, -14.66015625, -13.517578125, -12.375, -11.232421875, -10.08984375, -8.947265625, -7.8046875, -6.662109375, -5.51953125, -4.376953125, -3.234375, -2.091796875, -0.94921875, 0.193359375, 1.3359375, 2.478515625, 3.62109375, 4.763671875, 5.90625, 7.048828125, 8.19140625, 9.333984375, 10.4765625, 11.619140625, 12.76171875, 13.904296875, 15.046875, 16.189453125, 17.33203125, 18.474609375, 19.6171875, 20.759765625, 21.90234375, 23.044921875, 24.1875, 25.330078125, 26.47265625, 27.615234375, 28.7578125, 29.900390625, 31.04296875, 32.185546875, 33.328125, 34.470703125, 35.61328125, 36.755859375, 37.8984375, 39.041015625, 40.18359375, 41.326171875, 42.46875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 171.0, 739.0, 103.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.85891723632812, -143.07476806640625, -140.2906036376953, -137.50645446777344, -134.7222900390625, -131.93814086914062, -129.15399169921875, -126.36983489990234, -123.58567810058594, -120.80152130126953, -118.01736450195312, -115.23321533203125, -112.44905853271484, -109.66490173339844, -106.88075256347656, -104.09659576416016, -101.31243896484375, -98.52828216552734, -95.74412536621094, -92.95997619628906, -90.17581939697266, -87.39166259765625, -84.60751342773438, -81.82335662841797, -79.03919982910156, -76.25504302978516, -73.47088623046875, -70.68673706054688, -67.90258026123047, -65.11842346191406, -62.33427047729492, -59.55011749267578, -56.76596450805664, -53.9818115234375, -51.197654724121094, -48.41349792480469, -45.62934494018555, -42.845191955566406, -40.06103515625, -37.276878356933594, -34.49272537231445, -31.70857048034668, -28.924415588378906, -26.140260696411133, -23.35610580444336, -20.571950912475586, -17.787796020507812, -15.003641128540039, -12.219486236572266, -9.435331344604492, -6.651176452636719, -3.8670215606689453, -1.0828666687011719, 1.7012882232666016, 4.485443115234375, 7.269598007202148, 10.053752899169922, 12.837907791137695, 15.622062683105469, 18.406217575073242, 21.190372467041016, 23.97452735900879, 26.758682250976562, 29.542837142944336, 32.32699203491211]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 8.0, 7.0, 8.0, 7.0, 14.0, 13.0, 13.0, 21.0, 16.0, 25.0, 31.0, 28.0, 34.0, 33.0, 28.0, 46.0, 36.0, 34.0, 41.0, 45.0, 36.0, 34.0, 37.0, 30.0, 38.0, 30.0, 32.0, 25.0, 36.0, 18.0, 20.0, 27.0, 25.0, 16.0, 20.0, 16.0, 14.0, 10.0, 5.0, 10.0, 10.0, 6.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.84174346923828, -51.20581817626953, -49.56989669799805, -47.93397521972656, -46.29804992675781, -44.66212463378906, -43.02620315551758, -41.390281677246094, -39.754356384277344, -38.118431091308594, -36.48250961303711, -34.846588134765625, -33.210662841796875, -31.574739456176758, -29.93881607055664, -28.302892684936523, -26.666969299316406, -25.03104591369629, -23.395122528076172, -21.759199142456055, -20.123275756835938, -18.48735237121582, -16.851428985595703, -15.215505599975586, -13.579582214355469, -11.943658828735352, -10.307735443115234, -8.671812057495117, -7.035888671875, -5.399965286254883, -3.7640419006347656, -2.1281185150146484, -0.49219512939453125, 1.143728256225586, 2.779651641845703, 4.41557502746582, 6.0514984130859375, 7.687421798706055, 9.323345184326172, 10.959268569946289, 12.595191955566406, 14.231115341186523, 15.86703872680664, 17.502962112426758, 19.138885498046875, 20.774808883666992, 22.41073226928711, 24.046655654907227, 25.682579040527344, 27.31850242614746, 28.954425811767578, 30.590349197387695, 32.22627258300781, 33.86219787597656, 35.49811935424805, 37.13404083251953, 38.76996612548828, 40.40589141845703, 42.041812896728516, 43.677734375, 45.31365966796875, 46.9495849609375, 48.585506439208984, 50.22142791748047, 51.85735321044922]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 8.0, 11.0, 6.0, 10.0, 9.0, 15.0, 10.0, 14.0, 18.0, 20.0, 25.0, 29.0, 23.0, 23.0, 35.0, 37.0, 41.0, 34.0, 40.0, 53.0, 43.0, 57.0, 35.0, 50.0, 44.0, 48.0, 32.0, 41.0, 29.0, 25.0, 22.0, 15.0, 19.0, 22.0, 6.0, 20.0, 15.0, 6.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.1119384765625, -4.938720703125, -4.7655029296875, -4.59228515625, -4.4190673828125, -4.245849609375, -4.0726318359375, -3.8994140625, -3.7261962890625, -3.552978515625, -3.3797607421875, -3.20654296875, -3.0333251953125, -2.860107421875, -2.6868896484375, -2.513671875, -2.3404541015625, -2.167236328125, -1.9940185546875, -1.82080078125, -1.6475830078125, -1.474365234375, -1.3011474609375, -1.1279296875, -0.9547119140625, -0.781494140625, -0.6082763671875, -0.43505859375, -0.2618408203125, -0.088623046875, 0.0845947265625, 0.2578125, 0.4310302734375, 0.604248046875, 0.7774658203125, 0.95068359375, 1.1239013671875, 1.297119140625, 1.4703369140625, 1.6435546875, 1.8167724609375, 1.989990234375, 2.1632080078125, 2.33642578125, 2.5096435546875, 2.682861328125, 2.8560791015625, 3.029296875, 3.2025146484375, 3.375732421875, 3.5489501953125, 3.72216796875, 3.8953857421875, 4.068603515625, 4.2418212890625, 4.4150390625, 4.5882568359375, 4.761474609375, 4.9346923828125, 5.10791015625, 5.2811279296875, 5.454345703125, 5.6275634765625, 5.80078125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 9.0, 3.0, 10.0, 8.0, 18.0, 19.0, 26.0, 24.0, 30.0, 44.0, 71.0, 102.0, 195.0, 379.0, 1087.0, 3539.0, 14292.0, 80068.0, 662130.0, 2335069.0, 946128.0, 124343.0, 19600.0, 4553.0, 1378.0, 488.0, 230.0, 119.0, 86.0, 62.0, 31.0, 35.0, 18.0, 19.0, 14.0, 9.0, 11.0, 4.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7890625, -9.4691162109375, -9.149169921875, -8.8292236328125, -8.50927734375, -8.1893310546875, -7.869384765625, -7.5494384765625, -7.2294921875, -6.9095458984375, -6.589599609375, -6.2696533203125, -5.94970703125, -5.6297607421875, -5.309814453125, -4.9898681640625, -4.669921875, -4.3499755859375, -4.030029296875, -3.7100830078125, -3.39013671875, -3.0701904296875, -2.750244140625, -2.4302978515625, -2.1103515625, -1.7904052734375, -1.470458984375, -1.1505126953125, -0.83056640625, -0.5106201171875, -0.190673828125, 0.1292724609375, 0.44921875, 0.7691650390625, 1.089111328125, 1.4090576171875, 1.72900390625, 2.0489501953125, 2.368896484375, 2.6888427734375, 3.0087890625, 3.3287353515625, 3.648681640625, 3.9686279296875, 4.28857421875, 4.6085205078125, 4.928466796875, 5.2484130859375, 5.568359375, 5.8883056640625, 6.208251953125, 6.5281982421875, 6.84814453125, 7.1680908203125, 7.488037109375, 7.8079833984375, 8.1279296875, 8.4478759765625, 8.767822265625, 9.0877685546875, 9.40771484375, 9.7276611328125, 10.047607421875, 10.3675537109375, 10.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 6.0, 12.0, 28.0, 25.0, 52.0, 65.0, 98.0, 144.0, 260.0, 413.0, 640.0, 723.0, 598.0, 374.0, 229.0, 143.0, 88.0, 53.0, 38.0, 27.0, 14.0, 21.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.966064453125, -26.24462890625, -25.523193359375, -24.8017578125, -24.080322265625, -23.35888671875, -22.637451171875, -21.916015625, -21.194580078125, -20.47314453125, -19.751708984375, -19.0302734375, -18.308837890625, -17.58740234375, -16.865966796875, -16.14453125, -15.423095703125, -14.70166015625, -13.980224609375, -13.2587890625, -12.537353515625, -11.81591796875, -11.094482421875, -10.373046875, -9.651611328125, -8.93017578125, -8.208740234375, -7.4873046875, -6.765869140625, -6.04443359375, -5.322998046875, -4.6015625, -3.880126953125, -3.15869140625, -2.437255859375, -1.7158203125, -0.994384765625, -0.27294921875, 0.448486328125, 1.169921875, 1.891357421875, 2.61279296875, 3.334228515625, 4.0556640625, 4.777099609375, 5.49853515625, 6.219970703125, 6.94140625, 7.662841796875, 8.38427734375, 9.105712890625, 9.8271484375, 10.548583984375, 11.27001953125, 11.991455078125, 12.712890625, 13.434326171875, 14.15576171875, 14.877197265625, 15.5986328125, 16.320068359375, 17.04150390625, 17.762939453125, 18.484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 11.0, 10.0, 12.0, 19.0, 21.0, 38.0, 56.0, 93.0, 109.0, 168.0, 334.0, 988.0, 47984.0, 4132958.0, 10022.0, 659.0, 254.0, 177.0, 118.0, 85.0, 39.0, 35.0, 23.0, 19.0, 16.0, 8.0, 4.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.8125, -71.1162109375, -68.419921875, -65.7236328125, -63.02734375, -60.3310546875, -57.634765625, -54.9384765625, -52.2421875, -49.5458984375, -46.849609375, -44.1533203125, -41.45703125, -38.7607421875, -36.064453125, -33.3681640625, -30.671875, -27.9755859375, -25.279296875, -22.5830078125, -19.88671875, -17.1904296875, -14.494140625, -11.7978515625, -9.1015625, -6.4052734375, -3.708984375, -1.0126953125, 1.68359375, 4.3798828125, 7.076171875, 9.7724609375, 12.46875, 15.1650390625, 17.861328125, 20.5576171875, 23.25390625, 25.9501953125, 28.646484375, 31.3427734375, 34.0390625, 36.7353515625, 39.431640625, 42.1279296875, 44.82421875, 47.5205078125, 50.216796875, 52.9130859375, 55.609375, 58.3056640625, 61.001953125, 63.6982421875, 66.39453125, 69.0908203125, 71.787109375, 74.4833984375, 77.1796875, 79.8759765625, 82.572265625, 85.2685546875, 87.96484375, 90.6611328125, 93.357421875, 96.0537109375, 98.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 18.0, 73.0, 308.0, 369.0, 199.0, 36.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.89875030517578, -119.7562484741211, -114.61375427246094, -109.47125244140625, -104.32875061035156, -99.18624877929688, -94.04375457763672, -88.90125274658203, -83.75875854492188, -78.61625671386719, -73.47376251220703, -68.33126068115234, -63.188758850097656, -58.046260833740234, -52.90376281738281, -47.761260986328125, -42.61875915527344, -37.476261138916016, -32.33375930786133, -27.191261291503906, -22.04876136779785, -16.906261444091797, -11.763763427734375, -6.6212615966796875, -1.4787635803222656, 3.663735866546631, 8.806235313415527, 13.948734283447266, 19.09123420715332, 24.233734130859375, 29.376232147216797, 34.518733978271484, 39.66123962402344, 44.80373764038086, 49.94623947143555, 55.08873748779297, 60.231239318847656, 65.37373352050781, 70.5162353515625, 75.65873718261719, 80.80123901367188, 85.94374084472656, 91.08623504638672, 96.2287368774414, 101.3712387084961, 106.51373291015625, 111.65623474121094, 116.79873657226562, 121.94123077392578, 127.08373260498047, 132.22622680664062, 137.3687286376953, 142.51123046875, 147.6537322998047, 152.79623413085938, 157.938720703125, 163.0812225341797, 168.22372436523438, 173.36622619628906, 178.50872802734375, 183.65121459960938, 188.79371643066406, 193.93621826171875, 199.07872009277344, 204.22122192382812]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 9.0, 15.0, 15.0, 6.0, 15.0, 15.0, 23.0, 27.0, 27.0, 35.0, 38.0, 30.0, 38.0, 29.0, 42.0, 35.0, 43.0, 35.0, 51.0, 30.0, 42.0, 30.0, 29.0, 38.0, 39.0, 30.0, 40.0, 25.0, 22.0, 20.0, 19.0, 15.0, 9.0, 11.0, 14.0, 7.0, 8.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.622406005859375, -50.974788665771484, -49.32716751098633, -47.67955017089844, -46.03193283081055, -44.384315490722656, -42.7366943359375, -41.08907699584961, -39.44145965576172, -37.79384231567383, -36.14622116088867, -34.49860382080078, -32.85098648071289, -31.203367233276367, -29.555747985839844, -27.908130645751953, -26.260509490966797, -24.612890243530273, -22.965272903442383, -21.31765365600586, -19.67003631591797, -18.022417068481445, -16.374797821044922, -14.727179527282715, -13.079561233520508, -11.4319429397583, -9.784324645996094, -8.13670539855957, -6.489087104797363, -4.841468811035156, -3.193849563598633, -1.5462312698364258, 0.10138702392578125, 1.7490055561065674, 3.3966240882873535, 5.044242858886719, 6.691861152648926, 8.339479446411133, 9.987098693847656, 11.634716987609863, 13.28233528137207, 14.929953575134277, 16.577571868896484, 18.225191116333008, 19.87281036376953, 21.520427703857422, 23.168046951293945, 24.81566619873047, 26.46328353881836, 28.110902786254883, 29.758520126342773, 31.406139373779297, 33.05375671386719, 34.701377868652344, 36.348995208740234, 37.996612548828125, 39.64423370361328, 41.29185104370117, 42.93947219848633, 44.58708953857422, 46.23470687866211, 47.88232421875, 49.529945373535156, 51.17756271362305, 52.82518005371094]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 24.0, 27.0, 42.0, 66.0, 92.0, 113.0, 169.0, 271.0, 399.0, 625.0, 916.0, 1444.0, 2082.0, 3367.0, 5320.0, 8425.0, 13224.0, 21561.0, 35665.0, 61286.0, 111960.0, 218869.0, 256923.0, 130108.0, 70410.0, 40259.0, 24170.0, 14928.0, 9190.0, 5783.0, 3756.0, 2501.0, 1583.0, 1018.0, 644.0, 418.0, 311.0, 176.0, 153.0, 81.0, 55.0, 39.0, 39.0, 10.0, 9.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8407363891601562, -0.8128204345703125, -0.7849044799804688, -0.756988525390625, -0.7290725708007812, -0.7011566162109375, -0.6732406616210938, -0.64532470703125, -0.6174087524414062, -0.5894927978515625, -0.5615768432617188, -0.533660888671875, -0.5057449340820312, -0.4778289794921875, -0.44991302490234375, -0.4219970703125, -0.39408111572265625, -0.3661651611328125, -0.33824920654296875, -0.310333251953125, -0.28241729736328125, -0.2545013427734375, -0.22658538818359375, -0.19866943359375, -0.17075347900390625, -0.1428375244140625, -0.11492156982421875, -0.087005615234375, -0.05908966064453125, -0.0311737060546875, -0.00325775146484375, 0.024658203125, 0.05257415771484375, 0.0804901123046875, 0.10840606689453125, 0.136322021484375, 0.16423797607421875, 0.1921539306640625, 0.22006988525390625, 0.24798583984375, 0.27590179443359375, 0.3038177490234375, 0.33173370361328125, 0.359649658203125, 0.38756561279296875, 0.4154815673828125, 0.44339752197265625, 0.4713134765625, 0.49922943115234375, 0.5271453857421875, 0.5550613403320312, 0.582977294921875, 0.6108932495117188, 0.6388092041015625, 0.6667251586914062, 0.69464111328125, 0.7225570678710938, 0.7504730224609375, 0.7783889770507812, 0.806304931640625, 0.8342208862304688, 0.8621368408203125, 0.8900527954101562, 0.91796875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 7.0, 2.0, 6.0, 9.0, 7.0, 7.0, 15.0, 14.0, 11.0, 20.0, 13.0, 19.0, 24.0, 47.0, 31.0, 29.0, 30.0, 50.0, 51.0, 40.0, 49.0, 31.0, 1063.0, 36.0, 38.0, 41.0, 34.0, 39.0, 34.0, 23.0, 28.0, 18.0, 24.0, 18.0, 19.0, 16.0, 16.0, 15.0, 6.0, 9.0, 7.0, 10.0, 8.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.828125, -2.728302001953125, -2.62847900390625, -2.528656005859375, -2.4288330078125, -2.329010009765625, -2.22918701171875, -2.129364013671875, -2.029541015625, -1.929718017578125, -1.82989501953125, -1.730072021484375, -1.6302490234375, -1.530426025390625, -1.43060302734375, -1.330780029296875, -1.23095703125, -1.131134033203125, -1.03131103515625, -0.931488037109375, -0.8316650390625, -0.731842041015625, -0.63201904296875, -0.532196044921875, -0.432373046875, -0.332550048828125, -0.23272705078125, -0.132904052734375, -0.0330810546875, 0.066741943359375, 0.16656494140625, 0.266387939453125, 0.3662109375, 0.466033935546875, 0.56585693359375, 0.665679931640625, 0.7655029296875, 0.865325927734375, 0.96514892578125, 1.064971923828125, 1.164794921875, 1.264617919921875, 1.36444091796875, 1.464263916015625, 1.5640869140625, 1.663909912109375, 1.76373291015625, 1.863555908203125, 1.96337890625, 2.063201904296875, 2.16302490234375, 2.262847900390625, 2.3626708984375, 2.462493896484375, 2.56231689453125, 2.662139892578125, 2.761962890625, 2.861785888671875, 2.96160888671875, 3.061431884765625, 3.1612548828125, 3.261077880859375, 3.36090087890625, 3.460723876953125, 3.560546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 15.0, 13.0, 22.0, 32.0, 47.0, 67.0, 110.0, 176.0, 248.0, 352.0, 514.0, 729.0, 1040.0, 1557.0, 2174.0, 3126.0, 4583.0, 6768.0, 9845.0, 15197.0, 23305.0, 36507.0, 58957.0, 97970.0, 171060.0, 1290048.0, 144192.0, 84142.0, 50819.0, 31761.0, 20265.0, 13211.0, 9017.0, 6006.0, 3924.0, 2851.0, 2081.0, 1361.0, 924.0, 666.0, 479.0, 331.0, 200.0, 128.0, 105.0, 71.0, 49.0, 30.0, 12.0, 19.0, 7.0, 8.0, 2.0, 6.0, 0.0, 3.0], "bins": [-0.7353515625, -0.7133026123046875, -0.691253662109375, -0.6692047119140625, -0.64715576171875, -0.6251068115234375, -0.603057861328125, -0.5810089111328125, -0.5589599609375, -0.5369110107421875, -0.514862060546875, -0.4928131103515625, -0.47076416015625, -0.4487152099609375, -0.426666259765625, -0.4046173095703125, -0.382568359375, -0.3605194091796875, -0.338470458984375, -0.3164215087890625, -0.29437255859375, -0.2723236083984375, -0.250274658203125, -0.2282257080078125, -0.2061767578125, -0.1841278076171875, -0.162078857421875, -0.1400299072265625, -0.11798095703125, -0.0959320068359375, -0.073883056640625, -0.0518341064453125, -0.02978515625, -0.0077362060546875, 0.014312744140625, 0.0363616943359375, 0.05841064453125, 0.0804595947265625, 0.102508544921875, 0.1245574951171875, 0.1466064453125, 0.1686553955078125, 0.190704345703125, 0.2127532958984375, 0.23480224609375, 0.2568511962890625, 0.278900146484375, 0.3009490966796875, 0.322998046875, 0.3450469970703125, 0.367095947265625, 0.3891448974609375, 0.41119384765625, 0.4332427978515625, 0.455291748046875, 0.4773406982421875, 0.4993896484375, 0.5214385986328125, 0.543487548828125, 0.5655364990234375, 0.58758544921875, 0.6096343994140625, 0.631683349609375, 0.6537322998046875, 0.67578125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 10.0, 9.0, 11.0, 6.0, 7.0, 15.0, 16.0, 20.0, 16.0, 23.0, 20.0, 34.0, 43.0, 56.0, 49.0, 52.0, 58.0, 52.0, 69.0, 61.0, 55.0, 55.0, 37.0, 43.0, 35.0, 36.0, 25.0, 16.0, 15.0, 5.0, 8.0, 9.0, 8.0, 5.0, 7.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000400543212890625, -0.0003871545195579529, -0.00037376582622528076, -0.00036037713289260864, -0.0003469884395599365, -0.0003335997462272644, -0.0003202110528945923, -0.00030682235956192017, -0.00029343366622924805, -0.00028004497289657593, -0.0002666562795639038, -0.0002532675862312317, -0.00023987889289855957, -0.00022649019956588745, -0.00021310150623321533, -0.0001997128129005432, -0.0001863241195678711, -0.00017293542623519897, -0.00015954673290252686, -0.00014615803956985474, -0.00013276934623718262, -0.0001193806529045105, -0.00010599195957183838, -9.260326623916626e-05, -7.921457290649414e-05, -6.582587957382202e-05, -5.24371862411499e-05, -3.904849290847778e-05, -2.5659799575805664e-05, -1.2271106243133545e-05, 1.1175870895385742e-06, 1.4506280422210693e-05, 2.7894973754882812e-05, 4.128366708755493e-05, 5.467236042022705e-05, 6.806105375289917e-05, 8.144974708557129e-05, 9.483844041824341e-05, 0.00010822713375091553, 0.00012161582708358765, 0.00013500452041625977, 0.00014839321374893188, 0.000161781907081604, 0.00017517060041427612, 0.00018855929374694824, 0.00020194798707962036, 0.00021533668041229248, 0.0002287253737449646, 0.00024211406707763672, 0.00025550276041030884, 0.00026889145374298096, 0.0002822801470756531, 0.0002956688404083252, 0.0003090575337409973, 0.00032244622707366943, 0.00033583492040634155, 0.00034922361373901367, 0.0003626123070716858, 0.0003760010004043579, 0.00038938969373703003, 0.00040277838706970215, 0.00041616708040237427, 0.0004295557737350464, 0.0004429444670677185, 0.0004563331604003906]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 16.0, 19.0, 35.0, 49.0, 65.0, 82.0, 165.0, 303.0, 532.0, 3075.0, 1039797.0, 3084.0, 553.0, 240.0, 143.0, 107.0, 68.0, 44.0, 38.0, 18.0, 12.0, 9.0, 13.0, 15.0, 12.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0155487060546875, -0.015144824981689453, -0.014740943908691406, -0.01433706283569336, -0.013933181762695312, -0.013529300689697266, -0.013125419616699219, -0.012721538543701172, -0.012317657470703125, -0.011913776397705078, -0.011509895324707031, -0.011106014251708984, -0.010702133178710938, -0.01029825210571289, -0.009894371032714844, -0.009490489959716797, -0.00908660888671875, -0.008682727813720703, -0.008278846740722656, -0.00787496566772461, -0.0074710845947265625, -0.007067203521728516, -0.006663322448730469, -0.006259441375732422, -0.005855560302734375, -0.005451679229736328, -0.005047798156738281, -0.004643917083740234, -0.0042400360107421875, -0.0038361549377441406, -0.0034322738647460938, -0.003028392791748047, -0.00262451171875, -0.002220630645751953, -0.0018167495727539062, -0.0014128684997558594, -0.0010089874267578125, -0.0006051063537597656, -0.00020122528076171875, 0.00020265579223632812, 0.000606536865234375, 0.0010104179382324219, 0.0014142990112304688, 0.0018181800842285156, 0.0022220611572265625, 0.0026259422302246094, 0.0030298233032226562, 0.003433704376220703, 0.00383758544921875, 0.004241466522216797, 0.004645347595214844, 0.005049228668212891, 0.0054531097412109375, 0.005856990814208984, 0.006260871887207031, 0.006664752960205078, 0.007068634033203125, 0.007472515106201172, 0.007876396179199219, 0.008280277252197266, 0.008684158325195312, 0.00908803939819336, 0.009491920471191406, 0.009895801544189453, 0.0102996826171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 91.0, 730.0, 189.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023884994443506002, -0.002328182104974985, -0.0022678645327687263, -0.0022075471933931112, -0.002147229854017496, -0.002086912514641881, -0.002026595175266266, -0.001966277603060007, -0.001905960263684392, -0.0018456429243087769, -0.00178532546851784, -0.001725008012726903, -0.0016646906733512878, -0.0016043733339756727, -0.0015440558781847358, -0.0014837384223937988, -0.0014234210830181837, -0.0013631037436425686, -0.0013027862878516316, -0.0012424688320606947, -0.0011821514926850796, -0.0011218341533094645, -0.0010615166975185275, -0.0010011992417275906, -0.0009408819023519754, -0.0008805645047686994, -0.0008202471071854234, -0.0007599297096021473, -0.0006996123120188713, -0.0006392949144355953, -0.0005789775168523192, -0.0005186601192690432, -0.000458342838101089, -0.00039802544051781297, -0.00033770804293453693, -0.0002773906453512609, -0.00021707324776798487, -0.00015675585018470883, -9.64384526014328e-05, -3.612105501815677e-05, 2.4196342565119267e-05, 8.45137401483953e-05, 0.00014483113773167133, 0.00020514853531494737, 0.0002654659328982234, 0.00032578333048149943, 0.00038610072806477547, 0.0004464181256480515, 0.0005067355232313275, 0.0005670529208146036, 0.0006273703183978796, 0.0006876877159811556, 0.0007480051135644317, 0.0008083225111477077, 0.0008686399087309837, 0.0009289573063142598, 0.0009892747038975358, 0.0010495921596884727, 0.0011099094990640879, 0.001170226838439703, 0.00123054429423064, 0.0012908617500215769, 0.001351179089397192, 0.0014114964287728071, 0.001471813884563744]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 8.0, 21.0, 17.0, 11.0, 10.0, 22.0, 25.0, 39.0, 40.0, 37.0, 26.0, 39.0, 32.0, 43.0, 40.0, 37.0, 31.0, 44.0, 37.0, 38.0, 31.0, 24.0, 23.0, 34.0, 33.0, 33.0, 22.0, 21.0, 26.0, 16.0, 20.0, 18.0, 9.0, 15.0, 8.0, 7.0, 10.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.00021779537200927734, -0.00021124351769685745, -0.00020469166338443756, -0.00019813980907201767, -0.00019158795475959778, -0.0001850361004471779, -0.000178484246134758, -0.0001719323918223381, -0.0001653805375099182, -0.00015882868319749832, -0.00015227682888507843, -0.00014572497457265854, -0.00013917312026023865, -0.00013262126594781876, -0.00012606941163539886, -0.00011951755732297897, -0.00011296570301055908, -0.00010641384869813919, -9.98619943857193e-05, -9.331014007329941e-05, -8.675828576087952e-05, -8.020643144845963e-05, -7.365457713603973e-05, -6.710272282361984e-05, -6.055086851119995e-05, -5.399901419878006e-05, -4.744715988636017e-05, -4.089530557394028e-05, -3.4343451261520386e-05, -2.7791596949100494e-05, -2.1239742636680603e-05, -1.4687888324260712e-05, -8.13603401184082e-06, -1.584179699420929e-06, 4.967674612998962e-06, 1.1519528925418854e-05, 1.8071383237838745e-05, 2.4623237550258636e-05, 3.117509186267853e-05, 3.772694617509842e-05, 4.427880048751831e-05, 5.08306547999382e-05, 5.738250911235809e-05, 6.393436342477798e-05, 7.048621773719788e-05, 7.703807204961777e-05, 8.358992636203766e-05, 9.014178067445755e-05, 9.669363498687744e-05, 0.00010324548929929733, 0.00010979734361171722, 0.00011634919792413712, 0.000122901052236557, 0.0001294529065489769, 0.0001360047608613968, 0.00014255661517381668, 0.00014910846948623657, 0.00015566032379865646, 0.00016221217811107635, 0.00016876403242349625, 0.00017531588673591614, 0.00018186774104833603, 0.00018841959536075592, 0.0001949714496731758, 0.0002015233039855957]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 11.0, 2.0, 5.0, 9.0, 5.0, 9.0, 13.0, 15.0, 16.0, 21.0, 23.0, 29.0, 35.0, 18.0, 26.0, 28.0, 49.0, 45.0, 31.0, 49.0, 43.0, 45.0, 50.0, 45.0, 38.0, 48.0, 38.0, 34.0, 34.0, 25.0, 25.0, 27.0, 21.0, 12.0, 15.0, 12.0, 13.0, 13.0, 9.0, 4.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.00384521484375, -4.8319091796875, -4.65997314453125, -4.488037109375, -4.31610107421875, -4.1441650390625, -3.97222900390625, -3.80029296875, -3.62835693359375, -3.4564208984375, -3.28448486328125, -3.112548828125, -2.94061279296875, -2.7686767578125, -2.59674072265625, -2.4248046875, -2.25286865234375, -2.0809326171875, -1.90899658203125, -1.737060546875, -1.56512451171875, -1.3931884765625, -1.22125244140625, -1.04931640625, -0.87738037109375, -0.7054443359375, -0.53350830078125, -0.361572265625, -0.18963623046875, -0.0177001953125, 0.15423583984375, 0.326171875, 0.49810791015625, 0.6700439453125, 0.84197998046875, 1.013916015625, 1.18585205078125, 1.3577880859375, 1.52972412109375, 1.70166015625, 1.87359619140625, 2.0455322265625, 2.21746826171875, 2.389404296875, 2.56134033203125, 2.7332763671875, 2.90521240234375, 3.0771484375, 3.24908447265625, 3.4210205078125, 3.59295654296875, 3.764892578125, 3.93682861328125, 4.1087646484375, 4.28070068359375, 4.45263671875, 4.62457275390625, 4.7965087890625, 4.96844482421875, 5.140380859375, 5.31231689453125, 5.4842529296875, 5.65618896484375, 5.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 10.0, 3.0, 8.0, 10.0, 7.0, 18.0, 18.0, 28.0, 40.0, 69.0, 101.0, 191.0, 335.0, 626.0, 1269.0, 2618.0, 5253.0, 11807.0, 28155.0, 79228.0, 252014.0, 419149.0, 158916.0, 52188.0, 19926.0, 8633.0, 3864.0, 1971.0, 922.0, 483.0, 268.0, 151.0, 83.0, 65.0, 28.0, 23.0, 23.0, 11.0, 14.0, 11.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.24609375, -3.13897705078125, -3.0318603515625, -2.92474365234375, -2.817626953125, -2.71051025390625, -2.6033935546875, -2.49627685546875, -2.38916015625, -2.28204345703125, -2.1749267578125, -2.06781005859375, -1.960693359375, -1.85357666015625, -1.7464599609375, -1.63934326171875, -1.5322265625, -1.42510986328125, -1.3179931640625, -1.21087646484375, -1.103759765625, -0.99664306640625, -0.8895263671875, -0.78240966796875, -0.67529296875, -0.56817626953125, -0.4610595703125, -0.35394287109375, -0.246826171875, -0.13970947265625, -0.0325927734375, 0.07452392578125, 0.181640625, 0.28875732421875, 0.3958740234375, 0.50299072265625, 0.610107421875, 0.71722412109375, 0.8243408203125, 0.93145751953125, 1.03857421875, 1.14569091796875, 1.2528076171875, 1.35992431640625, 1.467041015625, 1.57415771484375, 1.6812744140625, 1.78839111328125, 1.8955078125, 2.00262451171875, 2.1097412109375, 2.21685791015625, 2.323974609375, 2.43109130859375, 2.5382080078125, 2.64532470703125, 2.75244140625, 2.85955810546875, 2.9666748046875, 3.07379150390625, 3.180908203125, 3.28802490234375, 3.3951416015625, 3.50225830078125, 3.609375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 5.0, 6.0, 8.0, 10.0, 14.0, 17.0, 21.0, 27.0, 17.0, 28.0, 34.0, 30.0, 45.0, 33.0, 47.0, 52.0, 56.0, 86.0, 1532.0, 462.0, 83.0, 63.0, 51.0, 42.0, 38.0, 29.0, 27.0, 18.0, 19.0, 27.0, 8.0, 24.0, 22.0, 17.0, 9.0, 9.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -18.999755859375, -18.40576171875, -17.811767578125, -17.2177734375, -16.623779296875, -16.02978515625, -15.435791015625, -14.841796875, -14.247802734375, -13.65380859375, -13.059814453125, -12.4658203125, -11.871826171875, -11.27783203125, -10.683837890625, -10.08984375, -9.495849609375, -8.90185546875, -8.307861328125, -7.7138671875, -7.119873046875, -6.52587890625, -5.931884765625, -5.337890625, -4.743896484375, -4.14990234375, -3.555908203125, -2.9619140625, -2.367919921875, -1.77392578125, -1.179931640625, -0.5859375, 0.008056640625, 0.60205078125, 1.196044921875, 1.7900390625, 2.384033203125, 2.97802734375, 3.572021484375, 4.166015625, 4.760009765625, 5.35400390625, 5.947998046875, 6.5419921875, 7.135986328125, 7.72998046875, 8.323974609375, 8.91796875, 9.511962890625, 10.10595703125, 10.699951171875, 11.2939453125, 11.887939453125, 12.48193359375, 13.075927734375, 13.669921875, 14.263916015625, 14.85791015625, 15.451904296875, 16.0458984375, 16.639892578125, 17.23388671875, 17.827880859375, 18.421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 1.0, 10.0, 3.0, 8.0, 14.0, 15.0, 24.0, 20.0, 15.0, 30.0, 31.0, 47.0, 55.0, 98.0, 148.0, 215.0, 349.0, 1009.0, 12165.0, 3080595.0, 47790.0, 1687.0, 493.0, 275.0, 160.0, 98.0, 81.0, 40.0, 46.0, 31.0, 26.0, 29.0, 25.0, 10.0, 18.0, 7.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.68603515625, -28.6845703125, -27.68310546875, -26.681640625, -25.68017578125, -24.6787109375, -23.67724609375, -22.67578125, -21.67431640625, -20.6728515625, -19.67138671875, -18.669921875, -17.66845703125, -16.6669921875, -15.66552734375, -14.6640625, -13.66259765625, -12.6611328125, -11.65966796875, -10.658203125, -9.65673828125, -8.6552734375, -7.65380859375, -6.65234375, -5.65087890625, -4.6494140625, -3.64794921875, -2.646484375, -1.64501953125, -0.6435546875, 0.35791015625, 1.359375, 2.36083984375, 3.3623046875, 4.36376953125, 5.365234375, 6.36669921875, 7.3681640625, 8.36962890625, 9.37109375, 10.37255859375, 11.3740234375, 12.37548828125, 13.376953125, 14.37841796875, 15.3798828125, 16.38134765625, 17.3828125, 18.38427734375, 19.3857421875, 20.38720703125, 21.388671875, 22.39013671875, 23.3916015625, 24.39306640625, 25.39453125, 26.39599609375, 27.3974609375, 28.39892578125, 29.400390625, 30.40185546875, 31.4033203125, 32.40478515625, 33.40625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 48.0, 802.0, 160.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.05388069152832, -6.874826431274414, -2.695772171020508, 1.4832820892333984, 5.662336349487305, 9.841390609741211, 14.020444869995117, 18.199499130249023, 22.37855339050293, 26.557607650756836, 30.736661911010742, 34.91571807861328, 39.09477233886719, 43.273826599121094, 47.452880859375, 51.631935119628906, 55.81098937988281, 59.99004364013672, 64.16909790039062, 68.34815216064453, 72.52720642089844, 76.70626068115234, 80.88531494140625, 85.06436920166016, 89.24342346191406, 93.42247772216797, 97.60153198242188, 101.78058624267578, 105.95964050292969, 110.1386947631836, 114.3177490234375, 118.4968032836914, 122.67584228515625, 126.85489654541016, 131.03395080566406, 135.2130126953125, 139.39205932617188, 143.57110595703125, 147.7501678466797, 151.92922973632812, 156.1082763671875, 160.28732299804688, 164.4663848876953, 168.64544677734375, 172.82449340820312, 177.0035400390625, 181.18260192871094, 185.36166381835938, 189.54071044921875, 193.71975708007812, 197.89881896972656, 202.077880859375, 206.25692749023438, 210.43597412109375, 214.6150360107422, 218.79409790039062, 222.97314453125, 227.15219116210938, 231.3312530517578, 235.51031494140625, 239.68936157226562, 243.868408203125, 248.04747009277344, 252.22653198242188, 256.40557861328125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 10.0, 8.0, 12.0, 15.0, 6.0, 4.0, 18.0, 18.0, 17.0, 30.0, 28.0, 21.0, 19.0, 35.0, 35.0, 48.0, 38.0, 39.0, 34.0, 29.0, 42.0, 53.0, 37.0, 32.0, 38.0, 44.0, 36.0, 25.0, 28.0, 22.0, 23.0, 28.0, 14.0, 17.0, 15.0, 13.0, 10.0, 10.0, 14.0, 9.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-63.37583923339844, -61.554351806640625, -59.73286437988281, -57.911380767822266, -56.08989334106445, -54.26840591430664, -52.446922302246094, -50.62543487548828, -48.80394744873047, -46.982460021972656, -45.160972595214844, -43.3394889831543, -41.518001556396484, -39.69651412963867, -37.875030517578125, -36.05354309082031, -34.2320556640625, -32.41056823730469, -30.589082717895508, -28.767597198486328, -26.946109771728516, -25.124622344970703, -23.303136825561523, -21.481651306152344, -19.66016387939453, -17.83867645263672, -16.01719093322754, -14.195704460144043, -12.374217987060547, -10.55273151397705, -8.731245040893555, -6.909758567810059, -5.0882720947265625, -3.2667856216430664, -1.4452991485595703, 0.3761873245239258, 2.197673797607422, 4.019160270690918, 5.840646743774414, 7.66213321685791, 9.483619689941406, 11.305106163024902, 13.126592636108398, 14.948079109191895, 16.76956558227539, 18.591053009033203, 20.412538528442383, 22.234024047851562, 24.055511474609375, 25.876998901367188, 27.698484420776367, 29.519969940185547, 31.34145736694336, 33.16294479370117, 34.98442840576172, 36.80591583251953, 38.627403259277344, 40.448890686035156, 42.27037811279297, 44.091861724853516, 45.91334915161133, 47.73483657836914, 49.55632019042969, 51.3778076171875, 53.19929504394531]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 3.0, 7.0, 9.0, 4.0, 8.0, 9.0, 18.0, 13.0, 19.0, 22.0, 32.0, 17.0, 24.0, 36.0, 25.0, 43.0, 38.0, 40.0, 29.0, 41.0, 39.0, 47.0, 52.0, 37.0, 42.0, 37.0, 42.0, 37.0, 27.0, 22.0, 35.0, 24.0, 20.0, 17.0, 12.0, 13.0, 12.0, 9.0, 11.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.904296875, -4.734375, -4.564453125, -4.39453125, -4.224609375, -4.0546875, -3.884765625, -3.71484375, -3.544921875, -3.375, -3.205078125, -3.03515625, -2.865234375, -2.6953125, -2.525390625, -2.35546875, -2.185546875, -2.015625, -1.845703125, -1.67578125, -1.505859375, -1.3359375, -1.166015625, -0.99609375, -0.826171875, -0.65625, -0.486328125, -0.31640625, -0.146484375, 0.0234375, 0.193359375, 0.36328125, 0.533203125, 0.703125, 0.873046875, 1.04296875, 1.212890625, 1.3828125, 1.552734375, 1.72265625, 1.892578125, 2.0625, 2.232421875, 2.40234375, 2.572265625, 2.7421875, 2.912109375, 3.08203125, 3.251953125, 3.421875, 3.591796875, 3.76171875, 3.931640625, 4.1015625, 4.271484375, 4.44140625, 4.611328125, 4.78125, 4.951171875, 5.12109375, 5.291015625, 5.4609375, 5.630859375, 5.80078125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 8.0, 7.0, 6.0, 10.0, 4.0, 13.0, 17.0, 22.0, 26.0, 31.0, 33.0, 38.0, 57.0, 96.0, 156.0, 331.0, 1098.0, 6321.0, 67677.0, 1612939.0, 2372440.0, 121022.0, 9339.0, 1561.0, 427.0, 201.0, 103.0, 53.0, 50.0, 45.0, 24.0, 27.0, 20.0, 14.0, 18.0, 10.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9765625, -15.4456787109375, -14.914794921875, -14.3839111328125, -13.85302734375, -13.3221435546875, -12.791259765625, -12.2603759765625, -11.7294921875, -11.1986083984375, -10.667724609375, -10.1368408203125, -9.60595703125, -9.0750732421875, -8.544189453125, -8.0133056640625, -7.482421875, -6.9515380859375, -6.420654296875, -5.8897705078125, -5.35888671875, -4.8280029296875, -4.297119140625, -3.7662353515625, -3.2353515625, -2.7044677734375, -2.173583984375, -1.6427001953125, -1.11181640625, -0.5809326171875, -0.050048828125, 0.4808349609375, 1.01171875, 1.5426025390625, 2.073486328125, 2.6043701171875, 3.13525390625, 3.6661376953125, 4.197021484375, 4.7279052734375, 5.2587890625, 5.7896728515625, 6.320556640625, 6.8514404296875, 7.38232421875, 7.9132080078125, 8.444091796875, 8.9749755859375, 9.505859375, 10.0367431640625, 10.567626953125, 11.0985107421875, 11.62939453125, 12.1602783203125, 12.691162109375, 13.2220458984375, 13.7529296875, 14.2838134765625, 14.814697265625, 15.3455810546875, 15.87646484375, 16.4073486328125, 16.938232421875, 17.4691162109375, 18.0]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 19.0, 16.0, 31.0, 34.0, 48.0, 88.0, 122.0, 192.0, 230.0, 360.0, 516.0, 609.0, 555.0, 402.0, 263.0, 195.0, 117.0, 74.0, 62.0, 40.0, 27.0, 27.0, 12.0, 8.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.646240234375, -19.04248046875, -18.438720703125, -17.8349609375, -17.231201171875, -16.62744140625, -16.023681640625, -15.419921875, -14.816162109375, -14.21240234375, -13.608642578125, -13.0048828125, -12.401123046875, -11.79736328125, -11.193603515625, -10.58984375, -9.986083984375, -9.38232421875, -8.778564453125, -8.1748046875, -7.571044921875, -6.96728515625, -6.363525390625, -5.759765625, -5.156005859375, -4.55224609375, -3.948486328125, -3.3447265625, -2.740966796875, -2.13720703125, -1.533447265625, -0.9296875, -0.325927734375, 0.27783203125, 0.881591796875, 1.4853515625, 2.089111328125, 2.69287109375, 3.296630859375, 3.900390625, 4.504150390625, 5.10791015625, 5.711669921875, 6.3154296875, 6.919189453125, 7.52294921875, 8.126708984375, 8.73046875, 9.334228515625, 9.93798828125, 10.541748046875, 11.1455078125, 11.749267578125, 12.35302734375, 12.956787109375, 13.560546875, 14.164306640625, 14.76806640625, 15.371826171875, 15.9755859375, 16.579345703125, 17.18310546875, 17.786865234375, 18.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 9.0, 2.0, 7.0, 4.0, 11.0, 12.0, 18.0, 21.0, 28.0, 40.0, 49.0, 58.0, 93.0, 103.0, 157.0, 215.0, 330.0, 835.0, 7116.0, 3160006.0, 1019411.0, 3970.0, 681.0, 319.0, 208.0, 146.0, 116.0, 78.0, 65.0, 40.0, 37.0, 23.0, 27.0, 12.0, 13.0, 8.0, 4.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.59375, -56.63525390625, -54.6767578125, -52.71826171875, -50.759765625, -48.80126953125, -46.8427734375, -44.88427734375, -42.92578125, -40.96728515625, -39.0087890625, -37.05029296875, -35.091796875, -33.13330078125, -31.1748046875, -29.21630859375, -27.2578125, -25.29931640625, -23.3408203125, -21.38232421875, -19.423828125, -17.46533203125, -15.5068359375, -13.54833984375, -11.58984375, -9.63134765625, -7.6728515625, -5.71435546875, -3.755859375, -1.79736328125, 0.1611328125, 2.11962890625, 4.078125, 6.03662109375, 7.9951171875, 9.95361328125, 11.912109375, 13.87060546875, 15.8291015625, 17.78759765625, 19.74609375, 21.70458984375, 23.6630859375, 25.62158203125, 27.580078125, 29.53857421875, 31.4970703125, 33.45556640625, 35.4140625, 37.37255859375, 39.3310546875, 41.28955078125, 43.248046875, 45.20654296875, 47.1650390625, 49.12353515625, 51.08203125, 53.04052734375, 54.9990234375, 56.95751953125, 58.916015625, 60.87451171875, 62.8330078125, 64.79150390625, 66.75]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 15.0, 24.0, 68.0, 123.0, 210.0, 178.0, 146.0, 118.0, 61.0, 38.0, 16.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.94272232055664, -50.34061050415039, -47.73849868774414, -45.13638687133789, -42.534278869628906, -39.932167053222656, -37.330055236816406, -34.727943420410156, -32.125831604003906, -29.523719787597656, -26.921607971191406, -24.31949806213379, -21.71738624572754, -19.11527442932129, -16.513164520263672, -13.911052703857422, -11.308940887451172, -8.706829071044922, -6.104718208312988, -3.5026068687438965, -0.9004955291748047, 1.7016162872314453, 4.303727149963379, 6.9058380126953125, 9.507949829101562, 12.110061645507812, 14.712172508239746, 17.31428337097168, 19.91639518737793, 22.51850700378418, 25.120616912841797, 27.722728729248047, 30.32483673095703, 32.92694854736328, 35.52906036376953, 38.13117218017578, 40.73328399658203, 43.33539581298828, 45.937503814697266, 48.539615631103516, 51.141727447509766, 53.743839263916016, 56.345951080322266, 58.948062896728516, 61.5501708984375, 64.15228271484375, 66.75439453125, 69.35650634765625, 71.9586181640625, 74.56072998046875, 77.162841796875, 79.76495361328125, 82.3670654296875, 84.96917724609375, 87.5712890625, 90.17340087890625, 92.7755126953125, 95.37762451171875, 97.979736328125, 100.58184814453125, 103.1839599609375, 105.78607177734375, 108.38818359375, 110.99029541015625, 113.59239959716797]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 7.0, 8.0, 9.0, 8.0, 8.0, 12.0, 10.0, 14.0, 14.0, 25.0, 18.0, 34.0, 21.0, 38.0, 33.0, 38.0, 43.0, 43.0, 44.0, 40.0, 43.0, 48.0, 46.0, 38.0, 36.0, 35.0, 31.0, 35.0, 37.0, 21.0, 34.0, 21.0, 13.0, 16.0, 12.0, 18.0, 14.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.909263610839844, -48.3282585144043, -46.74725341796875, -45.16624450683594, -43.58523941040039, -42.004234313964844, -40.4232292175293, -38.84222412109375, -37.2612190246582, -35.680213928222656, -34.09920883178711, -32.51820373535156, -30.937196731567383, -29.356189727783203, -27.775184631347656, -26.19417953491211, -24.61317253112793, -23.032167434692383, -21.451160430908203, -19.870155334472656, -18.28915023803711, -16.708145141601562, -15.127138137817383, -13.546133041381836, -11.965126991271973, -10.38412094116211, -8.803115844726562, -7.222109794616699, -5.641104221343994, -4.060098648071289, -2.479092597961426, -0.8980875015258789, 0.6829185485839844, 2.2639241218566895, 3.8449299335479736, 5.425935745239258, 7.006941318511963, 8.587946891784668, 10.168952941894531, 11.749958038330078, 13.330964088439941, 14.911970138549805, 16.49297523498535, 18.07398223876953, 19.654987335205078, 21.235992431640625, 22.816997528076172, 24.39800262451172, 25.9790096282959, 27.560014724731445, 29.141021728515625, 30.722026824951172, 32.30303192138672, 33.884037017822266, 35.46504211425781, 37.046051025390625, 38.62705612182617, 40.20806121826172, 41.789066314697266, 43.37007141113281, 44.951080322265625, 46.53208541870117, 48.11309051513672, 49.694095611572266, 51.27510070800781]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 11.0, 19.0, 27.0, 52.0, 54.0, 94.0, 138.0, 217.0, 294.0, 463.0, 721.0, 1118.0, 1805.0, 2591.0, 4134.0, 6490.0, 10333.0, 17389.0, 29919.0, 53212.0, 97122.0, 184213.0, 270767.0, 163479.0, 87091.0, 47589.0, 26958.0, 15897.0, 9661.0, 5912.0, 3794.0, 2482.0, 1520.0, 967.0, 689.0, 449.0, 305.0, 189.0, 136.0, 79.0, 49.0, 42.0, 27.0, 19.0, 11.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9563674926757812, -0.9259185791015625, -0.8954696655273438, -0.865020751953125, -0.8345718383789062, -0.8041229248046875, -0.7736740112304688, -0.74322509765625, -0.7127761840820312, -0.6823272705078125, -0.6518783569335938, -0.621429443359375, -0.5909805297851562, -0.5605316162109375, -0.5300827026367188, -0.4996337890625, -0.46918487548828125, -0.4387359619140625, -0.40828704833984375, -0.377838134765625, -0.34738922119140625, -0.3169403076171875, -0.28649139404296875, -0.25604248046875, -0.22559356689453125, -0.1951446533203125, -0.16469573974609375, -0.134246826171875, -0.10379791259765625, -0.0733489990234375, -0.04290008544921875, -0.012451171875, 0.01799774169921875, 0.0484466552734375, 0.07889556884765625, 0.109344482421875, 0.13979339599609375, 0.1702423095703125, 0.20069122314453125, 0.23114013671875, 0.26158905029296875, 0.2920379638671875, 0.32248687744140625, 0.352935791015625, 0.38338470458984375, 0.4138336181640625, 0.44428253173828125, 0.4747314453125, 0.5051803588867188, 0.5356292724609375, 0.5660781860351562, 0.596527099609375, 0.6269760131835938, 0.6574249267578125, 0.6878738403320312, 0.71832275390625, 0.7487716674804688, 0.7792205810546875, 0.8096694946289062, 0.840118408203125, 0.8705673217773438, 0.9010162353515625, 0.9314651489257812, 0.9619140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 5.0, 7.0, 9.0, 6.0, 10.0, 10.0, 19.0, 18.0, 14.0, 26.0, 28.0, 45.0, 30.0, 46.0, 33.0, 37.0, 36.0, 28.0, 49.0, 1065.0, 43.0, 46.0, 38.0, 47.0, 39.0, 40.0, 26.0, 26.0, 30.0, 25.0, 30.0, 24.0, 14.0, 20.0, 14.0, 10.0, 4.0, 8.0, 6.0, 6.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0], "bins": [-4.18359375, -4.06707763671875, -3.9505615234375, -3.83404541015625, -3.717529296875, -3.60101318359375, -3.4844970703125, -3.36798095703125, -3.25146484375, -3.13494873046875, -3.0184326171875, -2.90191650390625, -2.785400390625, -2.66888427734375, -2.5523681640625, -2.43585205078125, -2.3193359375, -2.20281982421875, -2.0863037109375, -1.96978759765625, -1.853271484375, -1.73675537109375, -1.6202392578125, -1.50372314453125, -1.38720703125, -1.27069091796875, -1.1541748046875, -1.03765869140625, -0.921142578125, -0.80462646484375, -0.6881103515625, -0.57159423828125, -0.455078125, -0.33856201171875, -0.2220458984375, -0.10552978515625, 0.010986328125, 0.12750244140625, 0.2440185546875, 0.36053466796875, 0.47705078125, 0.59356689453125, 0.7100830078125, 0.82659912109375, 0.943115234375, 1.05963134765625, 1.1761474609375, 1.29266357421875, 1.4091796875, 1.52569580078125, 1.6422119140625, 1.75872802734375, 1.875244140625, 1.99176025390625, 2.1082763671875, 2.22479248046875, 2.34130859375, 2.45782470703125, 2.5743408203125, 2.69085693359375, 2.807373046875, 2.92388916015625, 3.0404052734375, 3.15692138671875, 3.2734375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 12.0, 23.0, 31.0, 24.0, 72.0, 81.0, 133.0, 193.0, 325.0, 476.0, 836.0, 1276.0, 1985.0, 3081.0, 5152.0, 8236.0, 13357.0, 22130.0, 37946.0, 65216.0, 117977.0, 225570.0, 1294953.0, 127456.0, 69846.0, 39582.0, 23720.0, 14155.0, 8701.0, 5368.0, 3379.0, 2170.0, 1346.0, 821.0, 560.0, 327.0, 218.0, 142.0, 83.0, 59.0, 55.0, 16.0, 12.0, 8.0, 10.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8340911865234375, -0.805389404296875, -0.7766876220703125, -0.74798583984375, -0.7192840576171875, -0.690582275390625, -0.6618804931640625, -0.6331787109375, -0.6044769287109375, -0.575775146484375, -0.5470733642578125, -0.51837158203125, -0.4896697998046875, -0.460968017578125, -0.4322662353515625, -0.403564453125, -0.3748626708984375, -0.346160888671875, -0.3174591064453125, -0.28875732421875, -0.2600555419921875, -0.231353759765625, -0.2026519775390625, -0.1739501953125, -0.1452484130859375, -0.116546630859375, -0.0878448486328125, -0.05914306640625, -0.0304412841796875, -0.001739501953125, 0.0269622802734375, 0.0556640625, 0.0843658447265625, 0.113067626953125, 0.1417694091796875, 0.17047119140625, 0.1991729736328125, 0.227874755859375, 0.2565765380859375, 0.2852783203125, 0.3139801025390625, 0.342681884765625, 0.3713836669921875, 0.40008544921875, 0.4287872314453125, 0.457489013671875, 0.4861907958984375, 0.514892578125, 0.5435943603515625, 0.572296142578125, 0.6009979248046875, 0.62969970703125, 0.6584014892578125, 0.687103271484375, 0.7158050537109375, 0.7445068359375, 0.7732086181640625, 0.801910400390625, 0.8306121826171875, 0.85931396484375, 0.8880157470703125, 0.916717529296875, 0.9454193115234375, 0.97412109375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 3.0, 8.0, 12.0, 15.0, 6.0, 21.0, 25.0, 24.0, 32.0, 41.0, 57.0, 51.0, 60.0, 62.0, 71.0, 68.0, 58.0, 38.0, 60.0, 49.0, 43.0, 32.0, 33.0, 23.0, 10.0, 14.0, 11.0, 9.0, 15.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004563331604003906, -0.00044209882616996765, -0.0004278644919395447, -0.0004136301577091217, -0.00039939582347869873, -0.00038516148924827576, -0.0003709271550178528, -0.0003566928207874298, -0.00034245848655700684, -0.00032822415232658386, -0.0003139898180961609, -0.0002997554838657379, -0.00028552114963531494, -0.00027128681540489197, -0.000257052481174469, -0.00024281814694404602, -0.00022858381271362305, -0.00021434947848320007, -0.0002001151442527771, -0.00018588081002235413, -0.00017164647579193115, -0.00015741214156150818, -0.0001431778073310852, -0.00012894347310066223, -0.00011470913887023926, -0.00010047480463981628, -8.624047040939331e-05, -7.200613617897034e-05, -5.777180194854736e-05, -4.353746771812439e-05, -2.9303133487701416e-05, -1.5068799257278442e-05, -8.344650268554688e-07, 1.3399869203567505e-05, 2.763420343399048e-05, 4.186853766441345e-05, 5.6102871894836426e-05, 7.03372061252594e-05, 8.457154035568237e-05, 9.880587458610535e-05, 0.00011304020881652832, 0.0001272745430469513, 0.00014150887727737427, 0.00015574321150779724, 0.00016997754573822021, 0.0001842118799686432, 0.00019844621419906616, 0.00021268054842948914, 0.0002269148826599121, 0.00024114921689033508, 0.00025538355112075806, 0.00026961788535118103, 0.000283852219581604, 0.000298086553812027, 0.00031232088804244995, 0.0003265552222728729, 0.0003407895565032959, 0.00035502389073371887, 0.00036925822496414185, 0.0003834925591945648, 0.0003977268934249878, 0.00041196122765541077, 0.00042619556188583374, 0.0004404298961162567, 0.0004546642303466797]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 8.0, 9.0, 13.0, 18.0, 33.0, 34.0, 53.0, 71.0, 118.0, 213.0, 330.0, 821.0, 244133.0, 800553.0, 1071.0, 421.0, 211.0, 136.0, 72.0, 46.0, 32.0, 25.0, 18.0, 18.0, 16.0, 12.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 9.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01161956787109375, -0.01124560832977295, -0.010871648788452148, -0.010497689247131348, -0.010123729705810547, -0.009749770164489746, -0.009375810623168945, -0.009001851081848145, -0.008627891540527344, -0.008253931999206543, -0.007879972457885742, -0.007506012916564941, -0.007132053375244141, -0.00675809383392334, -0.006384134292602539, -0.006010174751281738, -0.0056362152099609375, -0.005262255668640137, -0.004888296127319336, -0.004514336585998535, -0.004140377044677734, -0.0037664175033569336, -0.003392457962036133, -0.003018498420715332, -0.0026445388793945312, -0.0022705793380737305, -0.0018966197967529297, -0.001522660255432129, -0.0011487007141113281, -0.0007747411727905273, -0.00040078163146972656, -2.682209014892578e-05, 0.000347137451171875, 0.0007210969924926758, 0.0010950565338134766, 0.0014690160751342773, 0.0018429756164550781, 0.002216935157775879, 0.0025908946990966797, 0.0029648542404174805, 0.0033388137817382812, 0.003712773323059082, 0.004086732864379883, 0.004460692405700684, 0.004834651947021484, 0.005208611488342285, 0.005582571029663086, 0.005956530570983887, 0.0063304901123046875, 0.006704449653625488, 0.007078409194946289, 0.00745236873626709, 0.00782632827758789, 0.008200287818908691, 0.008574247360229492, 0.008948206901550293, 0.009322166442871094, 0.009696125984191895, 0.010070085525512695, 0.010444045066833496, 0.010818004608154297, 0.011191964149475098, 0.011565923690795898, 0.0119398832321167, 0.0123138427734375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 76.0, 348.0, 413.0, 146.0, 23.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006749026360921562, -0.0006397803663276136, -0.0006046581547707319, -0.0005695358850061893, -0.0005344136152416468, -0.0004992913454771042, -0.00046416910481639206, -0.00042904686415567994, -0.00039392459439113736, -0.0003588023246265948, -0.00032368008396588266, -0.00028855784330517054, -0.00025343557354062796, -0.0002183133183280006, -0.00018319106311537325, -0.00014806882245466113, -0.00011294655269011855, -7.78242974774912e-05, -4.270204226486385e-05, -7.579787052236497e-06, 2.7542468160390854e-05, 6.26647233730182e-05, 9.778697858564556e-05, 0.00013290921924635768, 0.00016803148901090026, 0.0002031537442235276, 0.00023827599943615496, 0.0002733982400968671, 0.00030852050986140966, 0.00034364277962595224, 0.00037876502028666437, 0.0004138872609473765, 0.00044900947250425816, 0.00048413174226880074, 0.0005192540120333433, 0.000554376223590225, 0.0005894984933547676, 0.0006246207631193101, 0.0006597429746761918, 0.0006948652444407344, 0.000729987514205277, 0.0007651097839698195, 0.0008002320537343621, 0.0008353542652912438, 0.0008704765350557864, 0.000905598804820329, 0.0009407210163772106, 0.0009758432861417532, 0.0010109655559062958, 0.0010460878256708384, 0.001081210095435381, 0.0011163323651999235, 0.001151454634964466, 0.0011865767883136868, 0.0012216990580782294, 0.001256821327842772, 0.0012919435976073146, 0.0013270658673718572, 0.0013621881371363997, 0.0013973104069009423, 0.001432432560250163, 0.0014675548300147057, 0.0015026770997792482, 0.0015377993695437908, 0.0015729216393083334]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 3.0, 7.0, 4.0, 15.0, 13.0, 16.0, 16.0, 23.0, 21.0, 23.0, 34.0, 23.0, 33.0, 36.0, 37.0, 40.0, 38.0, 30.0, 35.0, 45.0, 53.0, 23.0, 45.0, 45.0, 34.0, 26.0, 33.0, 30.0, 37.0, 19.0, 28.0, 17.0, 16.0, 13.0, 11.0, 6.0, 18.0, 10.0, 4.0, 5.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00021910667419433594, -0.00021243561059236526, -0.0002057645469903946, -0.00019909348338842392, -0.00019242241978645325, -0.00018575135618448257, -0.0001790802925825119, -0.00017240922898054123, -0.00016573816537857056, -0.00015906710177659988, -0.0001523960381746292, -0.00014572497457265854, -0.00013905391097068787, -0.0001323828473687172, -0.00012571178376674652, -0.00011904072016477585, -0.00011236965656280518, -0.0001056985929608345, -9.902752935886383e-05, -9.235646575689316e-05, -8.568540215492249e-05, -7.901433855295181e-05, -7.234327495098114e-05, -6.567221134901047e-05, -5.9001147747039795e-05, -5.233008414506912e-05, -4.565902054309845e-05, -3.898795694112778e-05, -3.2316893339157104e-05, -2.5645829737186432e-05, -1.897476613521576e-05, -1.2303702533245087e-05, -5.632638931274414e-06, 1.0384246706962585e-06, 7.709488272666931e-06, 1.4380551874637604e-05, 2.1051615476608276e-05, 2.772267907857895e-05, 3.439374268054962e-05, 4.1064806282520294e-05, 4.773586988449097e-05, 5.440693348646164e-05, 6.107799708843231e-05, 6.774906069040298e-05, 7.442012429237366e-05, 8.109118789434433e-05, 8.7762251496315e-05, 9.443331509828568e-05, 0.00010110437870025635, 0.00010777544230222702, 0.00011444650590419769, 0.00012111756950616837, 0.00012778863310813904, 0.0001344596967101097, 0.00014113076031208038, 0.00014780182391405106, 0.00015447288751602173, 0.0001611439511179924, 0.00016781501471996307, 0.00017448607832193375, 0.00018115714192390442, 0.0001878282055258751, 0.00019449926912784576, 0.00020117033272981644, 0.0002078413963317871]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 6.0, 12.0, 11.0, 10.0, 8.0, 17.0, 22.0, 23.0, 27.0, 26.0, 29.0, 45.0, 36.0, 37.0, 39.0, 32.0, 51.0, 38.0, 44.0, 46.0, 43.0, 37.0, 39.0, 41.0, 37.0, 35.0, 31.0, 25.0, 22.0, 17.0, 18.0, 21.0, 14.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.5546875, -5.3758544921875, -5.197021484375, -5.0181884765625, -4.83935546875, -4.6605224609375, -4.481689453125, -4.3028564453125, -4.1240234375, -3.9451904296875, -3.766357421875, -3.5875244140625, -3.40869140625, -3.2298583984375, -3.051025390625, -2.8721923828125, -2.693359375, -2.5145263671875, -2.335693359375, -2.1568603515625, -1.97802734375, -1.7991943359375, -1.620361328125, -1.4415283203125, -1.2626953125, -1.0838623046875, -0.905029296875, -0.7261962890625, -0.54736328125, -0.3685302734375, -0.189697265625, -0.0108642578125, 0.16796875, 0.3468017578125, 0.525634765625, 0.7044677734375, 0.88330078125, 1.0621337890625, 1.240966796875, 1.4197998046875, 1.5986328125, 1.7774658203125, 1.956298828125, 2.1351318359375, 2.31396484375, 2.4927978515625, 2.671630859375, 2.8504638671875, 3.029296875, 3.2081298828125, 3.386962890625, 3.5657958984375, 3.74462890625, 3.9234619140625, 4.102294921875, 4.2811279296875, 4.4599609375, 4.6387939453125, 4.817626953125, 4.9964599609375, 5.17529296875, 5.3541259765625, 5.532958984375, 5.7117919921875, 5.890625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 34.0, 33.0, 53.0, 69.0, 108.0, 136.0, 194.0, 282.0, 391.0, 579.0, 907.0, 1337.0, 2202.0, 3598.0, 6162.0, 11728.0, 24533.0, 60251.0, 194739.0, 504320.0, 143932.0, 47955.0, 20478.0, 10027.0, 5499.0, 3094.0, 1955.0, 1216.0, 809.0, 546.0, 399.0, 291.0, 199.0, 116.0, 90.0, 77.0, 37.0, 37.0, 33.0, 21.0, 19.0, 11.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.65234375, -4.51300048828125, -4.3736572265625, -4.23431396484375, -4.094970703125, -3.95562744140625, -3.8162841796875, -3.67694091796875, -3.53759765625, -3.39825439453125, -3.2589111328125, -3.11956787109375, -2.980224609375, -2.84088134765625, -2.7015380859375, -2.56219482421875, -2.4228515625, -2.28350830078125, -2.1441650390625, -2.00482177734375, -1.865478515625, -1.72613525390625, -1.5867919921875, -1.44744873046875, -1.30810546875, -1.16876220703125, -1.0294189453125, -0.89007568359375, -0.750732421875, -0.61138916015625, -0.4720458984375, -0.33270263671875, -0.193359375, -0.05401611328125, 0.0853271484375, 0.22467041015625, 0.364013671875, 0.50335693359375, 0.6427001953125, 0.78204345703125, 0.92138671875, 1.06072998046875, 1.2000732421875, 1.33941650390625, 1.478759765625, 1.61810302734375, 1.7574462890625, 1.89678955078125, 2.0361328125, 2.17547607421875, 2.3148193359375, 2.45416259765625, 2.593505859375, 2.73284912109375, 2.8721923828125, 3.01153564453125, 3.15087890625, 3.29022216796875, 3.4295654296875, 3.56890869140625, 3.708251953125, 3.84759521484375, 3.9869384765625, 4.12628173828125, 4.265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 3.0, 8.0, 9.0, 11.0, 12.0, 14.0, 21.0, 27.0, 24.0, 25.0, 21.0, 32.0, 26.0, 29.0, 33.0, 29.0, 56.0, 83.0, 271.0, 1680.0, 123.0, 61.0, 55.0, 44.0, 31.0, 28.0, 32.0, 34.0, 27.0, 29.0, 16.0, 18.0, 20.0, 16.0, 8.0, 10.0, 10.0, 13.0, 8.0, 9.0, 8.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.533447265625, -16.00439453125, -15.475341796875, -14.9462890625, -14.417236328125, -13.88818359375, -13.359130859375, -12.830078125, -12.301025390625, -11.77197265625, -11.242919921875, -10.7138671875, -10.184814453125, -9.65576171875, -9.126708984375, -8.59765625, -8.068603515625, -7.53955078125, -7.010498046875, -6.4814453125, -5.952392578125, -5.42333984375, -4.894287109375, -4.365234375, -3.836181640625, -3.30712890625, -2.778076171875, -2.2490234375, -1.719970703125, -1.19091796875, -0.661865234375, -0.1328125, 0.396240234375, 0.92529296875, 1.454345703125, 1.9833984375, 2.512451171875, 3.04150390625, 3.570556640625, 4.099609375, 4.628662109375, 5.15771484375, 5.686767578125, 6.2158203125, 6.744873046875, 7.27392578125, 7.802978515625, 8.33203125, 8.861083984375, 9.39013671875, 9.919189453125, 10.4482421875, 10.977294921875, 11.50634765625, 12.035400390625, 12.564453125, 13.093505859375, 13.62255859375, 14.151611328125, 14.6806640625, 15.209716796875, 15.73876953125, 16.267822265625, 16.796875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 5.0, 7.0, 11.0, 16.0, 17.0, 23.0, 23.0, 25.0, 43.0, 41.0, 82.0, 132.0, 167.0, 283.0, 646.0, 3322.0, 609572.0, 2525340.0, 4324.0, 710.0, 313.0, 163.0, 113.0, 81.0, 62.0, 57.0, 28.0, 22.0, 14.0, 14.0, 9.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.15625, -35.78271484375, -34.4091796875, -33.03564453125, -31.662109375, -30.28857421875, -28.9150390625, -27.54150390625, -26.16796875, -24.79443359375, -23.4208984375, -22.04736328125, -20.673828125, -19.30029296875, -17.9267578125, -16.55322265625, -15.1796875, -13.80615234375, -12.4326171875, -11.05908203125, -9.685546875, -8.31201171875, -6.9384765625, -5.56494140625, -4.19140625, -2.81787109375, -1.4443359375, -0.07080078125, 1.302734375, 2.67626953125, 4.0498046875, 5.42333984375, 6.796875, 8.17041015625, 9.5439453125, 10.91748046875, 12.291015625, 13.66455078125, 15.0380859375, 16.41162109375, 17.78515625, 19.15869140625, 20.5322265625, 21.90576171875, 23.279296875, 24.65283203125, 26.0263671875, 27.39990234375, 28.7734375, 30.14697265625, 31.5205078125, 32.89404296875, 34.267578125, 35.64111328125, 37.0146484375, 38.38818359375, 39.76171875, 41.13525390625, 42.5087890625, 43.88232421875, 45.255859375, 46.62939453125, 48.0029296875, 49.37646484375, 50.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 10.0, 22.0, 55.0, 58.0, 100.0, 113.0, 176.0, 137.0, 101.0, 97.0, 55.0, 39.0, 13.0, 10.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.346296310424805, -28.64324188232422, -27.940187454223633, -27.237133026123047, -26.534076690673828, -25.831022262573242, -25.127967834472656, -24.42491340637207, -23.721858978271484, -23.0188045501709, -22.315750122070312, -21.612693786621094, -20.909639358520508, -20.206584930419922, -19.503530502319336, -18.80047607421875, -18.09741973876953, -17.394365310668945, -16.69131088256836, -15.988255500793457, -15.285201072692871, -14.582145690917969, -13.879091262817383, -13.176036834716797, -12.472982406616211, -11.769927978515625, -11.066872596740723, -10.363818168640137, -9.66076374053955, -8.957708358764648, -8.254653930664062, -7.551599502563477, -6.848544120788574, -6.14548921585083, -5.442434787750244, -4.7393798828125, -4.036325454711914, -3.33327054977417, -2.630215644836426, -1.9271612167358398, -1.2241063117980957, -0.5210515856742859, 0.18200314044952393, 0.8850579261779785, 1.5881125926971436, 2.2911672592163086, 2.9942221641540527, 3.6972765922546387, 4.400331497192383, 5.103386402130127, 5.806440830230713, 6.509495735168457, 7.212550163269043, 7.915605068206787, 8.618659973144531, 9.321714401245117, 10.024768829345703, 10.727823257446289, 11.430878639221191, 12.133933067321777, 12.836987495422363, 13.540042877197266, 14.243097305297852, 14.946151733398438, 15.64920711517334]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 5.0, 10.0, 7.0, 9.0, 16.0, 12.0, 14.0, 7.0, 13.0, 22.0, 15.0, 20.0, 38.0, 30.0, 28.0, 28.0, 37.0, 34.0, 40.0, 41.0, 40.0, 35.0, 54.0, 32.0, 37.0, 36.0, 33.0, 35.0, 27.0, 29.0, 25.0, 22.0, 28.0, 29.0, 14.0, 18.0, 19.0, 12.0, 6.0, 9.0, 7.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-57.35395812988281, -55.69116973876953, -54.028385162353516, -52.3656005859375, -50.70281219482422, -49.04002380371094, -47.37723922729492, -45.714454650878906, -44.051666259765625, -42.388877868652344, -40.72609329223633, -39.06330871582031, -37.40052032470703, -35.73773193359375, -34.074947357177734, -32.41216278076172, -30.749374389648438, -29.08658790588379, -27.42380142211914, -25.761014938354492, -24.098228454589844, -22.435441970825195, -20.772655487060547, -19.1098690032959, -17.44708251953125, -15.784296035766602, -14.121509552001953, -12.458723068237305, -10.795936584472656, -9.133150100708008, -7.470363616943359, -5.807577133178711, -4.1447906494140625, -2.482004165649414, -0.8192176818847656, 0.8435688018798828, 2.5063552856445312, 4.16914176940918, 5.831928253173828, 7.494714736938477, 9.157501220703125, 10.820287704467773, 12.483074188232422, 14.14586067199707, 15.808647155761719, 17.471433639526367, 19.134220123291016, 20.797006607055664, 22.459793090820312, 24.12257957458496, 25.78536605834961, 27.448152542114258, 29.110939025878906, 30.773725509643555, 32.4365119934082, 34.09929656982422, 35.7620849609375, 37.42487335205078, 39.0876579284668, 40.75044250488281, 42.413230895996094, 44.076019287109375, 45.73880386352539, 47.401588439941406, 49.06437683105469]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 8.0, 6.0, 14.0, 11.0, 16.0, 15.0, 27.0, 19.0, 32.0, 25.0, 30.0, 43.0, 41.0, 31.0, 40.0, 49.0, 33.0, 43.0, 44.0, 46.0, 41.0, 35.0, 49.0, 42.0, 34.0, 37.0, 25.0, 16.0, 24.0, 18.0, 21.0, 18.0, 7.0, 10.0, 9.0, 10.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.66796875, -5.4833984375, -5.298828125, -5.1142578125, -4.9296875, -4.7451171875, -4.560546875, -4.3759765625, -4.19140625, -4.0068359375, -3.822265625, -3.6376953125, -3.453125, -3.2685546875, -3.083984375, -2.8994140625, -2.71484375, -2.5302734375, -2.345703125, -2.1611328125, -1.9765625, -1.7919921875, -1.607421875, -1.4228515625, -1.23828125, -1.0537109375, -0.869140625, -0.6845703125, -0.5, -0.3154296875, -0.130859375, 0.0537109375, 0.23828125, 0.4228515625, 0.607421875, 0.7919921875, 0.9765625, 1.1611328125, 1.345703125, 1.5302734375, 1.71484375, 1.8994140625, 2.083984375, 2.2685546875, 2.453125, 2.6376953125, 2.822265625, 3.0068359375, 3.19140625, 3.3759765625, 3.560546875, 3.7451171875, 3.9296875, 4.1142578125, 4.298828125, 4.4833984375, 4.66796875, 4.8525390625, 5.037109375, 5.2216796875, 5.40625, 5.5908203125, 5.775390625, 5.9599609375, 6.14453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 8.0, 10.0, 8.0, 16.0, 22.0, 33.0, 62.0, 74.0, 120.0, 180.0, 310.0, 584.0, 1073.0, 2127.0, 4443.0, 10263.0, 27643.0, 88036.0, 324207.0, 1008811.0, 1525975.0, 835750.0, 254567.0, 70797.0, 22539.0, 8820.0, 3717.0, 1833.0, 930.0, 481.0, 310.0, 176.0, 111.0, 71.0, 46.0, 33.0, 25.0, 19.0, 11.0, 10.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.6412353515625, -5.442626953125, -5.2440185546875, -5.04541015625, -4.8468017578125, -4.648193359375, -4.4495849609375, -4.2509765625, -4.0523681640625, -3.853759765625, -3.6551513671875, -3.45654296875, -3.2579345703125, -3.059326171875, -2.8607177734375, -2.662109375, -2.4635009765625, -2.264892578125, -2.0662841796875, -1.86767578125, -1.6690673828125, -1.470458984375, -1.2718505859375, -1.0732421875, -0.8746337890625, -0.676025390625, -0.4774169921875, -0.27880859375, -0.0802001953125, 0.118408203125, 0.3170166015625, 0.515625, 0.7142333984375, 0.912841796875, 1.1114501953125, 1.31005859375, 1.5086669921875, 1.707275390625, 1.9058837890625, 2.1044921875, 2.3031005859375, 2.501708984375, 2.7003173828125, 2.89892578125, 3.0975341796875, 3.296142578125, 3.4947509765625, 3.693359375, 3.8919677734375, 4.090576171875, 4.2891845703125, 4.48779296875, 4.6864013671875, 4.885009765625, 5.0836181640625, 5.2822265625, 5.4808349609375, 5.679443359375, 5.8780517578125, 6.07666015625, 6.2752685546875, 6.473876953125, 6.6724853515625, 6.87109375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 12.0, 12.0, 10.0, 15.0, 28.0, 45.0, 61.0, 72.0, 101.0, 133.0, 168.0, 256.0, 316.0, 433.0, 507.0, 481.0, 396.0, 280.0, 209.0, 122.0, 133.0, 79.0, 54.0, 46.0, 34.0, 21.0, 17.0, 10.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.078125, -20.57275390625, -20.0673828125, -19.56201171875, -19.056640625, -18.55126953125, -18.0458984375, -17.54052734375, -17.03515625, -16.52978515625, -16.0244140625, -15.51904296875, -15.013671875, -14.50830078125, -14.0029296875, -13.49755859375, -12.9921875, -12.48681640625, -11.9814453125, -11.47607421875, -10.970703125, -10.46533203125, -9.9599609375, -9.45458984375, -8.94921875, -8.44384765625, -7.9384765625, -7.43310546875, -6.927734375, -6.42236328125, -5.9169921875, -5.41162109375, -4.90625, -4.40087890625, -3.8955078125, -3.39013671875, -2.884765625, -2.37939453125, -1.8740234375, -1.36865234375, -0.86328125, -0.35791015625, 0.1474609375, 0.65283203125, 1.158203125, 1.66357421875, 2.1689453125, 2.67431640625, 3.1796875, 3.68505859375, 4.1904296875, 4.69580078125, 5.201171875, 5.70654296875, 6.2119140625, 6.71728515625, 7.22265625, 7.72802734375, 8.2333984375, 8.73876953125, 9.244140625, 9.74951171875, 10.2548828125, 10.76025390625, 11.265625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 5.0, 8.0, 8.0, 10.0, 15.0, 18.0, 30.0, 30.0, 54.0, 75.0, 86.0, 116.0, 154.0, 266.0, 477.0, 2098.0, 224599.0, 3953174.0, 11097.0, 861.0, 352.0, 218.0, 146.0, 77.0, 70.0, 59.0, 36.0, 43.0, 19.0, 14.0, 20.0, 13.0, 11.0, 9.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.1875, -48.1181640625, -46.048828125, -43.9794921875, -41.91015625, -39.8408203125, -37.771484375, -35.7021484375, -33.6328125, -31.5634765625, -29.494140625, -27.4248046875, -25.35546875, -23.2861328125, -21.216796875, -19.1474609375, -17.078125, -15.0087890625, -12.939453125, -10.8701171875, -8.80078125, -6.7314453125, -4.662109375, -2.5927734375, -0.5234375, 1.5458984375, 3.615234375, 5.6845703125, 7.75390625, 9.8232421875, 11.892578125, 13.9619140625, 16.03125, 18.1005859375, 20.169921875, 22.2392578125, 24.30859375, 26.3779296875, 28.447265625, 30.5166015625, 32.5859375, 34.6552734375, 36.724609375, 38.7939453125, 40.86328125, 42.9326171875, 45.001953125, 47.0712890625, 49.140625, 51.2099609375, 53.279296875, 55.3486328125, 57.41796875, 59.4873046875, 61.556640625, 63.6259765625, 65.6953125, 67.7646484375, 69.833984375, 71.9033203125, 73.97265625, 76.0419921875, 78.111328125, 80.1806640625, 82.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 10.0, 63.0, 173.0, 275.0, 268.0, 159.0, 45.0, 13.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-199.8118133544922, -195.46070861816406, -191.10958862304688, -186.75848388671875, -182.40737915039062, -178.0562744140625, -173.7051544189453, -169.3540496826172, -165.00294494628906, -160.65184020996094, -156.30072021484375, -151.94961547851562, -147.5985107421875, -143.24740600585938, -138.8962860107422, -134.54518127441406, -130.19406127929688, -125.84294891357422, -121.4918441772461, -117.14073181152344, -112.78962707519531, -108.43851470947266, -104.08740234375, -99.73629760742188, -95.38519287109375, -91.0340805053711, -86.68297576904297, -82.33186340332031, -77.98075866699219, -73.62964630126953, -69.27853393554688, -64.92742919921875, -60.576324462890625, -56.225215911865234, -51.874107360839844, -47.52299499511719, -43.17189025878906, -38.820777893066406, -34.469669342041016, -30.118560791015625, -25.767452239990234, -21.416343688964844, -17.065235137939453, -12.71412467956543, -8.363016128540039, -4.011907577514648, 0.339202880859375, 4.690311431884766, 9.041419982910156, 13.392528533935547, 17.743637084960938, 22.09474754333496, 26.44585609436035, 30.796964645385742, 35.148075103759766, 39.499183654785156, 43.85029220581055, 48.20140075683594, 52.55250930786133, 56.90361785888672, 61.254730224609375, 65.6058349609375, 69.95694732666016, 74.30805969238281, 78.65916442871094]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 11.0, 7.0, 9.0, 7.0, 16.0, 18.0, 16.0, 22.0, 18.0, 20.0, 28.0, 28.0, 36.0, 36.0, 52.0, 49.0, 53.0, 38.0, 46.0, 36.0, 43.0, 33.0, 36.0, 40.0, 39.0, 34.0, 27.0, 33.0, 30.0, 19.0, 20.0, 14.0, 12.0, 13.0, 10.0, 13.0, 9.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.4869384765625, -49.87363052368164, -48.260318756103516, -46.647010803222656, -45.03369903564453, -43.42039108276367, -41.80708312988281, -40.19377136230469, -38.58046340942383, -36.96715545654297, -35.353843688964844, -33.740535736083984, -32.12722396850586, -30.513916015625, -28.900606155395508, -27.287296295166016, -25.673986434936523, -24.06067657470703, -22.44736671447754, -20.834056854248047, -19.220748901367188, -17.607439041137695, -15.994129180908203, -14.380820274353027, -12.767510414123535, -11.154200553894043, -9.540891647338867, -7.927581787109375, -6.314272403717041, -4.700963020324707, -3.087653160095215, -1.474344253540039, 0.13896560668945312, 1.7522751092910767, 3.3655846118927, 4.978894233703613, 6.592203617095947, 8.205513000488281, 9.818822860717773, 11.43213176727295, 13.045441627502441, 14.658751487731934, 16.27206039428711, 17.8853702545166, 19.498680114746094, 21.111988067626953, 22.725299835205078, 24.338607788085938, 25.95191764831543, 27.565227508544922, 29.178537368774414, 30.791847229003906, 32.405155181884766, 34.018463134765625, 35.63177490234375, 37.24508285522461, 38.858394622802734, 40.471702575683594, 42.08501434326172, 43.69832229614258, 45.3116340637207, 46.92494201660156, 48.53825378417969, 50.15156173706055, 51.764869689941406]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 9.0, 6.0, 6.0, 17.0, 22.0, 33.0, 43.0, 51.0, 95.0, 150.0, 201.0, 323.0, 468.0, 736.0, 1060.0, 1597.0, 2532.0, 3924.0, 6090.0, 9483.0, 15250.0, 24923.0, 40460.0, 69007.0, 119891.0, 215314.0, 225635.0, 126166.0, 72457.0, 43064.0, 25618.0, 15892.0, 9843.0, 6407.0, 4040.0, 2665.0, 1722.0, 1114.0, 765.0, 473.0, 331.0, 237.0, 139.0, 90.0, 76.0, 43.0, 32.0, 21.0, 17.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.86572265625, -0.8378372192382812, -0.8099517822265625, -0.7820663452148438, -0.754180908203125, -0.7262954711914062, -0.6984100341796875, -0.6705245971679688, -0.64263916015625, -0.6147537231445312, -0.5868682861328125, -0.5589828491210938, -0.531097412109375, -0.5032119750976562, -0.4753265380859375, -0.44744110107421875, -0.4195556640625, -0.39167022705078125, -0.3637847900390625, -0.33589935302734375, -0.308013916015625, -0.28012847900390625, -0.2522430419921875, -0.22435760498046875, -0.19647216796875, -0.16858673095703125, -0.1407012939453125, -0.11281585693359375, -0.084930419921875, -0.05704498291015625, -0.0291595458984375, -0.00127410888671875, 0.026611328125, 0.05449676513671875, 0.0823822021484375, 0.11026763916015625, 0.138153076171875, 0.16603851318359375, 0.1939239501953125, 0.22180938720703125, 0.24969482421875, 0.27758026123046875, 0.3054656982421875, 0.33335113525390625, 0.361236572265625, 0.38912200927734375, 0.4170074462890625, 0.44489288330078125, 0.4727783203125, 0.5006637573242188, 0.5285491943359375, 0.5564346313476562, 0.584320068359375, 0.6122055053710938, 0.6400909423828125, 0.6679763793945312, 0.69586181640625, 0.7237472534179688, 0.7516326904296875, 0.7795181274414062, 0.807403564453125, 0.8352890014648438, 0.8631744384765625, 0.8910598754882812, 0.9189453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 7.0, 2.0, 2.0, 3.0, 8.0, 10.0, 9.0, 10.0, 9.0, 18.0, 8.0, 11.0, 21.0, 25.0, 30.0, 26.0, 28.0, 33.0, 29.0, 33.0, 41.0, 39.0, 34.0, 27.0, 38.0, 1056.0, 27.0, 32.0, 43.0, 33.0, 33.0, 35.0, 36.0, 32.0, 19.0, 20.0, 20.0, 24.0, 17.0, 16.0, 19.0, 11.0, 12.0, 10.0, 8.0, 14.0, 9.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.55078125, -3.448150634765625, -3.34552001953125, -3.242889404296875, -3.1402587890625, -3.037628173828125, -2.93499755859375, -2.832366943359375, -2.729736328125, -2.627105712890625, -2.52447509765625, -2.421844482421875, -2.3192138671875, -2.216583251953125, -2.11395263671875, -2.011322021484375, -1.90869140625, -1.806060791015625, -1.70343017578125, -1.600799560546875, -1.4981689453125, -1.395538330078125, -1.29290771484375, -1.190277099609375, -1.087646484375, -0.985015869140625, -0.88238525390625, -0.779754638671875, -0.6771240234375, -0.574493408203125, -0.47186279296875, -0.369232177734375, -0.2666015625, -0.163970947265625, -0.06134033203125, 0.041290283203125, 0.1439208984375, 0.246551513671875, 0.34918212890625, 0.451812744140625, 0.554443359375, 0.657073974609375, 0.75970458984375, 0.862335205078125, 0.9649658203125, 1.067596435546875, 1.17022705078125, 1.272857666015625, 1.37548828125, 1.478118896484375, 1.58074951171875, 1.683380126953125, 1.7860107421875, 1.888641357421875, 1.99127197265625, 2.093902587890625, 2.196533203125, 2.299163818359375, 2.40179443359375, 2.504425048828125, 2.6070556640625, 2.709686279296875, 2.81231689453125, 2.914947509765625, 3.017578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 8.0, 14.0, 23.0, 25.0, 38.0, 48.0, 73.0, 126.0, 177.0, 260.0, 375.0, 544.0, 819.0, 1209.0, 1762.0, 2443.0, 3634.0, 5305.0, 7798.0, 11428.0, 17042.0, 26258.0, 39833.0, 62694.0, 100271.0, 174079.0, 1278231.0, 132673.0, 80289.0, 51215.0, 32617.0, 21592.0, 14070.0, 9557.0, 6579.0, 4383.0, 3038.0, 2099.0, 1363.0, 994.0, 697.0, 493.0, 327.0, 199.0, 161.0, 90.0, 66.0, 41.0, 24.0, 14.0, 15.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.71240234375, -0.6888656616210938, -0.6653289794921875, -0.6417922973632812, -0.618255615234375, -0.5947189331054688, -0.5711822509765625, -0.5476455688476562, -0.52410888671875, -0.5005722045898438, -0.4770355224609375, -0.45349884033203125, -0.429962158203125, -0.40642547607421875, -0.3828887939453125, -0.35935211181640625, -0.3358154296875, -0.31227874755859375, -0.2887420654296875, -0.26520538330078125, -0.241668701171875, -0.21813201904296875, -0.1945953369140625, -0.17105865478515625, -0.14752197265625, -0.12398529052734375, -0.1004486083984375, -0.07691192626953125, -0.053375244140625, -0.02983856201171875, -0.0063018798828125, 0.01723480224609375, 0.040771484375, 0.06430816650390625, 0.0878448486328125, 0.11138153076171875, 0.134918212890625, 0.15845489501953125, 0.1819915771484375, 0.20552825927734375, 0.22906494140625, 0.25260162353515625, 0.2761383056640625, 0.29967498779296875, 0.323211669921875, 0.34674835205078125, 0.3702850341796875, 0.39382171630859375, 0.4173583984375, 0.44089508056640625, 0.4644317626953125, 0.48796844482421875, 0.511505126953125, 0.5350418090820312, 0.5585784912109375, 0.5821151733398438, 0.60565185546875, 0.6291885375976562, 0.6527252197265625, 0.6762619018554688, 0.699798583984375, 0.7233352661132812, 0.7468719482421875, 0.7704086303710938, 0.7939453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 10.0, 8.0, 10.0, 13.0, 17.0, 14.0, 17.0, 19.0, 24.0, 30.0, 32.0, 36.0, 48.0, 42.0, 53.0, 60.0, 47.0, 53.0, 52.0, 50.0, 55.0, 49.0, 33.0, 38.0, 24.0, 21.0, 15.0, 11.0, 20.0, 15.0, 12.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004000663757324219, -0.0003859996795654297, -0.0003719329833984375, -0.0003578662872314453, -0.0003437995910644531, -0.00032973289489746094, -0.00031566619873046875, -0.00030159950256347656, -0.0002875328063964844, -0.0002734661102294922, -0.0002593994140625, -0.0002453327178955078, -0.00023126602172851562, -0.00021719932556152344, -0.00020313262939453125, -0.00018906593322753906, -0.00017499923706054688, -0.0001609325408935547, -0.0001468658447265625, -0.0001327991485595703, -0.00011873245239257812, -0.00010466575622558594, -9.059906005859375e-05, -7.653236389160156e-05, -6.246566772460938e-05, -4.839897155761719e-05, -3.4332275390625e-05, -2.0265579223632812e-05, -6.198883056640625e-06, 7.867813110351562e-06, 2.193450927734375e-05, 3.600120544433594e-05, 5.0067901611328125e-05, 6.413459777832031e-05, 7.82012939453125e-05, 9.226799011230469e-05, 0.00010633468627929688, 0.00012040138244628906, 0.00013446807861328125, 0.00014853477478027344, 0.00016260147094726562, 0.0001766681671142578, 0.00019073486328125, 0.0002048015594482422, 0.00021886825561523438, 0.00023293495178222656, 0.00024700164794921875, 0.00026106834411621094, 0.0002751350402832031, 0.0002892017364501953, 0.0003032684326171875, 0.0003173351287841797, 0.0003314018249511719, 0.00034546852111816406, 0.00035953521728515625, 0.00037360191345214844, 0.0003876686096191406, 0.0004017353057861328, 0.000415802001953125, 0.0004298686981201172, 0.0004439353942871094, 0.00045800209045410156, 0.00047206878662109375, 0.00048613548278808594, 0.0005002021789550781]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 9.0, 13.0, 15.0, 14.0, 15.0, 20.0, 43.0, 45.0, 64.0, 107.0, 143.0, 267.0, 495.0, 1038.0, 107731.0, 935202.0, 1854.0, 543.0, 284.0, 201.0, 112.0, 71.0, 64.0, 30.0, 32.0, 23.0, 23.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.012176513671875, -0.01179802417755127, -0.011419534683227539, -0.011041045188903809, -0.010662555694580078, -0.010284066200256348, -0.009905576705932617, -0.009527087211608887, -0.009148597717285156, -0.008770108222961426, -0.008391618728637695, -0.008013129234313965, -0.007634639739990234, -0.007256150245666504, -0.0068776607513427734, -0.006499171257019043, -0.0061206817626953125, -0.005742192268371582, -0.0053637027740478516, -0.004985213279724121, -0.004606723785400391, -0.00422823429107666, -0.0038497447967529297, -0.0034712553024291992, -0.0030927658081054688, -0.0027142763137817383, -0.002335786819458008, -0.0019572973251342773, -0.0015788078308105469, -0.0012003183364868164, -0.0008218288421630859, -0.00044333934783935547, -6.4849853515625e-05, 0.00031363964080810547, 0.0006921291351318359, 0.0010706186294555664, 0.0014491081237792969, 0.0018275976181030273, 0.002206087112426758, 0.0025845766067504883, 0.0029630661010742188, 0.0033415555953979492, 0.0037200450897216797, 0.00409853458404541, 0.004477024078369141, 0.004855513572692871, 0.0052340030670166016, 0.005612492561340332, 0.0059909820556640625, 0.006369471549987793, 0.0067479610443115234, 0.007126450538635254, 0.007504940032958984, 0.007883429527282715, 0.008261919021606445, 0.008640408515930176, 0.009018898010253906, 0.009397387504577637, 0.009775876998901367, 0.010154366493225098, 0.010532855987548828, 0.010911345481872559, 0.011289834976196289, 0.01166832447052002, 0.01204681396484375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 180.0, 417.0, 275.0, 79.0, 19.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006863728631287813, -0.0006496244459412992, -0.0006128760287538171, -0.000576127611566335, -0.0005393791943788528, -0.0005026307189837098, -0.0004658823017962277, -0.0004291338846087456, -0.00039238546742126346, -0.00035563705023378134, -0.0003188886330462992, -0.00028214018675498664, -0.0002453917695675045, -0.0002086433523800224, -0.00017189492064062506, -0.0001351464889012277, -9.83980717137456e-05, -6.164964725030586e-05, -2.490122278686613e-05, 1.1847201676573604e-05, 4.859562614001334e-05, 8.534404332749546e-05, 0.0001220924750668928, 0.00015884090680629015, 0.00019558932399377227, 0.0002323377411812544, 0.0002690861583687365, 0.0003058346046600491, 0.0003425830218475312, 0.0003793314390350133, 0.0004160798853263259, 0.000452828302513808, 0.0004895767197012901, 0.0005263251368887722, 0.0005630735540762544, 0.0005998219712637365, 0.0006365703884512186, 0.0006733188638463616, 0.0007100672810338438, 0.0007468156982213259, 0.000783564115408808, 0.0008203125325962901, 0.0008570609497837722, 0.0008938093669712543, 0.0009305578423663974, 0.0009673062013462186, 0.0010040546767413616, 0.0010408030357211828, 0.0010775515111163259, 0.0011142999865114689, 0.00115104834549129, 0.0011877968208864331, 0.0012245451798662543, 0.0012612936552613974, 0.0012980420142412186, 0.0013347904896363616, 0.0013715389650315046, 0.0014082874404266477, 0.0014450357994064689, 0.001481784274801612, 0.001518532633781433, 0.0015552811091765761, 0.0015920294681563973, 0.0016287779435515404, 0.0016655263025313616]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 10.0, 9.0, 5.0, 3.0, 4.0, 9.0, 11.0, 14.0, 20.0, 15.0, 12.0, 18.0, 21.0, 23.0, 23.0, 32.0, 26.0, 36.0, 28.0, 29.0, 35.0, 27.0, 37.0, 35.0, 47.0, 36.0, 35.0, 30.0, 25.0, 30.0, 31.0, 34.0, 32.0, 29.0, 19.0, 29.0, 17.0, 18.0, 16.0, 12.0, 15.0, 5.0, 10.0, 7.0, 9.0, 5.0, 9.0, 8.0, 8.0, 4.0, 4.0, 0.0, 1.0], "bins": [-0.0002532005310058594, -0.0002459865063428879, -0.00023877248167991638, -0.00023155845701694489, -0.0002243444323539734, -0.0002171304076910019, -0.0002099163830280304, -0.0002027023583650589, -0.0001954883337020874, -0.0001882743090391159, -0.0001810602843761444, -0.0001738462597131729, -0.00016663223505020142, -0.00015941821038722992, -0.00015220418572425842, -0.00014499016106128693, -0.00013777613639831543, -0.00013056211173534393, -0.00012334808707237244, -0.00011613406240940094, -0.00010892003774642944, -0.00010170601308345795, -9.449198842048645e-05, -8.727796375751495e-05, -8.006393909454346e-05, -7.284991443157196e-05, -6.563588976860046e-05, -5.842186510562897e-05, -5.120784044265747e-05, -4.3993815779685974e-05, -3.677979111671448e-05, -2.956576645374298e-05, -2.2351741790771484e-05, -1.5137717127799988e-05, -7.923692464828491e-06, -7.096678018569946e-07, 6.504356861114502e-06, 1.3718381524085999e-05, 2.0932406187057495e-05, 2.8146430850028992e-05, 3.536045551300049e-05, 4.2574480175971985e-05, 4.978850483894348e-05, 5.700252950191498e-05, 6.421655416488647e-05, 7.143057882785797e-05, 7.864460349082947e-05, 8.585862815380096e-05, 9.307265281677246e-05, 0.00010028667747974396, 0.00010750070214271545, 0.00011471472680568695, 0.00012192875146865845, 0.00012914277613162994, 0.00013635680079460144, 0.00014357082545757294, 0.00015078485012054443, 0.00015799887478351593, 0.00016521289944648743, 0.00017242692410945892, 0.00017964094877243042, 0.00018685497343540192, 0.0001940689980983734, 0.0002012830227613449, 0.0002084970474243164]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 8.0, 13.0, 11.0, 6.0, 22.0, 22.0, 25.0, 17.0, 35.0, 36.0, 30.0, 36.0, 37.0, 50.0, 34.0, 48.0, 44.0, 42.0, 46.0, 53.0, 45.0, 36.0, 40.0, 32.0, 29.0, 23.0, 31.0, 29.0, 17.0, 14.0, 13.0, 20.0, 7.0, 8.0, 9.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3590087890625, -6.167236328125, -5.9754638671875, -5.78369140625, -5.5919189453125, -5.400146484375, -5.2083740234375, -5.0166015625, -4.8248291015625, -4.633056640625, -4.4412841796875, -4.24951171875, -4.0577392578125, -3.865966796875, -3.6741943359375, -3.482421875, -3.2906494140625, -3.098876953125, -2.9071044921875, -2.71533203125, -2.5235595703125, -2.331787109375, -2.1400146484375, -1.9482421875, -1.7564697265625, -1.564697265625, -1.3729248046875, -1.18115234375, -0.9893798828125, -0.797607421875, -0.6058349609375, -0.4140625, -0.2222900390625, -0.030517578125, 0.1612548828125, 0.35302734375, 0.5447998046875, 0.736572265625, 0.9283447265625, 1.1201171875, 1.3118896484375, 1.503662109375, 1.6954345703125, 1.88720703125, 2.0789794921875, 2.270751953125, 2.4625244140625, 2.654296875, 2.8460693359375, 3.037841796875, 3.2296142578125, 3.42138671875, 3.6131591796875, 3.804931640625, 3.9967041015625, 4.1884765625, 4.3802490234375, 4.572021484375, 4.7637939453125, 4.95556640625, 5.1473388671875, 5.339111328125, 5.5308837890625, 5.72265625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 11.0, 15.0, 22.0, 28.0, 33.0, 63.0, 88.0, 132.0, 234.0, 400.0, 616.0, 1197.0, 2148.0, 4364.0, 9285.0, 23070.0, 69216.0, 271163.0, 470391.0, 130645.0, 38222.0, 14247.0, 6268.0, 2936.0, 1565.0, 838.0, 503.0, 314.0, 170.0, 112.0, 76.0, 57.0, 41.0, 17.0, 15.0, 14.0, 5.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.2734375, -5.11944580078125, -4.9654541015625, -4.81146240234375, -4.657470703125, -4.50347900390625, -4.3494873046875, -4.19549560546875, -4.04150390625, -3.88751220703125, -3.7335205078125, -3.57952880859375, -3.425537109375, -3.27154541015625, -3.1175537109375, -2.96356201171875, -2.8095703125, -2.65557861328125, -2.5015869140625, -2.34759521484375, -2.193603515625, -2.03961181640625, -1.8856201171875, -1.73162841796875, -1.57763671875, -1.42364501953125, -1.2696533203125, -1.11566162109375, -0.961669921875, -0.80767822265625, -0.6536865234375, -0.49969482421875, -0.345703125, -0.19171142578125, -0.0377197265625, 0.11627197265625, 0.270263671875, 0.42425537109375, 0.5782470703125, 0.73223876953125, 0.88623046875, 1.04022216796875, 1.1942138671875, 1.34820556640625, 1.502197265625, 1.65618896484375, 1.8101806640625, 1.96417236328125, 2.1181640625, 2.27215576171875, 2.4261474609375, 2.58013916015625, 2.734130859375, 2.88812255859375, 3.0421142578125, 3.19610595703125, 3.35009765625, 3.50408935546875, 3.6580810546875, 3.81207275390625, 3.966064453125, 4.12005615234375, 4.2740478515625, 4.42803955078125, 4.58203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 14.0, 6.0, 19.0, 15.0, 31.0, 21.0, 26.0, 24.0, 27.0, 40.0, 43.0, 43.0, 39.0, 62.0, 112.0, 444.0, 1519.0, 111.0, 60.0, 44.0, 34.0, 31.0, 43.0, 38.0, 27.0, 21.0, 22.0, 23.0, 12.0, 10.0, 15.0, 12.0, 9.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.796875, -22.146484375, -21.49609375, -20.845703125, -20.1953125, -19.544921875, -18.89453125, -18.244140625, -17.59375, -16.943359375, -16.29296875, -15.642578125, -14.9921875, -14.341796875, -13.69140625, -13.041015625, -12.390625, -11.740234375, -11.08984375, -10.439453125, -9.7890625, -9.138671875, -8.48828125, -7.837890625, -7.1875, -6.537109375, -5.88671875, -5.236328125, -4.5859375, -3.935546875, -3.28515625, -2.634765625, -1.984375, -1.333984375, -0.68359375, -0.033203125, 0.6171875, 1.267578125, 1.91796875, 2.568359375, 3.21875, 3.869140625, 4.51953125, 5.169921875, 5.8203125, 6.470703125, 7.12109375, 7.771484375, 8.421875, 9.072265625, 9.72265625, 10.373046875, 11.0234375, 11.673828125, 12.32421875, 12.974609375, 13.625, 14.275390625, 14.92578125, 15.576171875, 16.2265625, 16.876953125, 17.52734375, 18.177734375, 18.828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 12.0, 16.0, 16.0, 18.0, 24.0, 34.0, 33.0, 45.0, 69.0, 120.0, 116.0, 187.0, 300.0, 520.0, 2440.0, 644345.0, 2492429.0, 3273.0, 572.0, 321.0, 207.0, 132.0, 96.0, 70.0, 66.0, 46.0, 31.0, 38.0, 16.0, 22.0, 10.0, 14.0, 8.0, 11.0, 6.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.65625, -37.32568359375, -35.9951171875, -34.66455078125, -33.333984375, -32.00341796875, -30.6728515625, -29.34228515625, -28.01171875, -26.68115234375, -25.3505859375, -24.02001953125, -22.689453125, -21.35888671875, -20.0283203125, -18.69775390625, -17.3671875, -16.03662109375, -14.7060546875, -13.37548828125, -12.044921875, -10.71435546875, -9.3837890625, -8.05322265625, -6.72265625, -5.39208984375, -4.0615234375, -2.73095703125, -1.400390625, -0.06982421875, 1.2607421875, 2.59130859375, 3.921875, 5.25244140625, 6.5830078125, 7.91357421875, 9.244140625, 10.57470703125, 11.9052734375, 13.23583984375, 14.56640625, 15.89697265625, 17.2275390625, 18.55810546875, 19.888671875, 21.21923828125, 22.5498046875, 23.88037109375, 25.2109375, 26.54150390625, 27.8720703125, 29.20263671875, 30.533203125, 31.86376953125, 33.1943359375, 34.52490234375, 35.85546875, 37.18603515625, 38.5166015625, 39.84716796875, 41.177734375, 42.50830078125, 43.8388671875, 45.16943359375, 46.5]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 41.0, 225.0, 452.0, 246.0, 35.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.57462310791016, -66.5911865234375, -64.60775756835938, -62.62432098388672, -60.64088439941406, -58.657447814941406, -56.674015045166016, -54.690582275390625, -52.70714569091797, -50.72370910644531, -48.74027633666992, -46.75684356689453, -44.773406982421875, -42.78997039794922, -40.80653762817383, -38.82310485839844, -36.83966827392578, -34.856231689453125, -32.872798919677734, -30.88936424255371, -28.905929565429688, -26.922494888305664, -24.93906021118164, -22.955625534057617, -20.972190856933594, -18.98875617980957, -17.005321502685547, -15.021886825561523, -13.0384521484375, -11.055017471313477, -9.071582794189453, -7.08814811706543, -5.104709625244141, -3.121274948120117, -1.1378402709960938, 0.8455944061279297, 2.829029083251953, 4.812463760375977, 6.7958984375, 8.779333114624023, 10.762767791748047, 12.74620246887207, 14.729637145996094, 16.713071823120117, 18.69650650024414, 20.679941177368164, 22.663375854492188, 24.64681053161621, 26.630245208740234, 28.613679885864258, 30.59711456298828, 32.58055114746094, 34.56398391723633, 36.54741668701172, 38.530853271484375, 40.51428985595703, 42.49772262573242, 44.48115539550781, 46.46459197998047, 48.448028564453125, 50.431461334228516, 52.414894104003906, 54.39833068847656, 56.38176727294922, 58.36520004272461]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 8.0, 9.0, 13.0, 22.0, 17.0, 17.0, 18.0, 18.0, 26.0, 30.0, 33.0, 31.0, 40.0, 52.0, 54.0, 37.0, 51.0, 51.0, 66.0, 52.0, 39.0, 33.0, 34.0, 36.0, 26.0, 29.0, 28.0, 19.0, 14.0, 21.0, 6.0, 8.0, 15.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.504302978515625, -58.72920227050781, -56.954105377197266, -55.17900466918945, -53.403907775878906, -51.628807067871094, -49.85370635986328, -48.078609466552734, -46.30350875854492, -44.52840805053711, -42.75331115722656, -40.97821044921875, -39.2031135559082, -37.42801284790039, -35.652915954589844, -33.87781524658203, -32.10271453857422, -30.32761573791504, -28.55251693725586, -26.777416229248047, -25.002317428588867, -23.227218627929688, -21.452119827270508, -19.677021026611328, -17.90192413330078, -16.1268253326416, -14.351725578308105, -12.576626777648926, -10.80152702331543, -9.02642822265625, -7.25132942199707, -5.476229667663574, -3.701129913330078, -1.9260307550430298, -0.15093159675598145, 1.6241674423217773, 3.3992667198181152, 5.174365997314453, 6.949464797973633, 8.724564552307129, 10.499663352966309, 12.274762153625488, 14.049861907958984, 15.824960708618164, 17.600059509277344, 19.375160217285156, 21.150257110595703, 22.925357818603516, 24.700456619262695, 26.475555419921875, 28.250654220581055, 30.025753021240234, 31.800853729248047, 33.575950622558594, 35.351051330566406, 37.12615203857422, 38.901248931884766, 40.67634963989258, 42.451446533203125, 44.22654724121094, 46.001644134521484, 47.7767448425293, 49.551841735839844, 51.326942443847656, 53.10204315185547]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 3.0, 5.0, 10.0, 13.0, 9.0, 21.0, 19.0, 27.0, 19.0, 29.0, 30.0, 35.0, 39.0, 35.0, 27.0, 51.0, 52.0, 36.0, 43.0, 42.0, 41.0, 49.0, 57.0, 31.0, 24.0, 38.0, 28.0, 23.0, 26.0, 20.0, 22.0, 20.0, 19.0, 9.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6640625, -6.47216796875, -6.2802734375, -6.08837890625, -5.896484375, -5.70458984375, -5.5126953125, -5.32080078125, -5.12890625, -4.93701171875, -4.7451171875, -4.55322265625, -4.361328125, -4.16943359375, -3.9775390625, -3.78564453125, -3.59375, -3.40185546875, -3.2099609375, -3.01806640625, -2.826171875, -2.63427734375, -2.4423828125, -2.25048828125, -2.05859375, -1.86669921875, -1.6748046875, -1.48291015625, -1.291015625, -1.09912109375, -0.9072265625, -0.71533203125, -0.5234375, -0.33154296875, -0.1396484375, 0.05224609375, 0.244140625, 0.43603515625, 0.6279296875, 0.81982421875, 1.01171875, 1.20361328125, 1.3955078125, 1.58740234375, 1.779296875, 1.97119140625, 2.1630859375, 2.35498046875, 2.546875, 2.73876953125, 2.9306640625, 3.12255859375, 3.314453125, 3.50634765625, 3.6982421875, 3.89013671875, 4.08203125, 4.27392578125, 4.4658203125, 4.65771484375, 4.849609375, 5.04150390625, 5.2333984375, 5.42529296875, 5.6171875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 10.0, 12.0, 14.0, 19.0, 26.0, 27.0, 31.0, 30.0, 45.0, 62.0, 60.0, 120.0, 232.0, 862.0, 17477.0, 3487930.0, 682171.0, 4040.0, 480.0, 166.0, 98.0, 62.0, 52.0, 42.0, 41.0, 27.0, 21.0, 15.0, 18.0, 16.0, 12.0, 13.0, 8.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.8125, -37.697265625, -36.58203125, -35.466796875, -34.3515625, -33.236328125, -32.12109375, -31.005859375, -29.890625, -28.775390625, -27.66015625, -26.544921875, -25.4296875, -24.314453125, -23.19921875, -22.083984375, -20.96875, -19.853515625, -18.73828125, -17.623046875, -16.5078125, -15.392578125, -14.27734375, -13.162109375, -12.046875, -10.931640625, -9.81640625, -8.701171875, -7.5859375, -6.470703125, -5.35546875, -4.240234375, -3.125, -2.009765625, -0.89453125, 0.220703125, 1.3359375, 2.451171875, 3.56640625, 4.681640625, 5.796875, 6.912109375, 8.02734375, 9.142578125, 10.2578125, 11.373046875, 12.48828125, 13.603515625, 14.71875, 15.833984375, 16.94921875, 18.064453125, 19.1796875, 20.294921875, 21.41015625, 22.525390625, 23.640625, 24.755859375, 25.87109375, 26.986328125, 28.1015625, 29.216796875, 30.33203125, 31.447265625, 32.5625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 9.0, 17.0, 17.0, 23.0, 24.0, 35.0, 42.0, 47.0, 73.0, 84.0, 125.0, 175.0, 214.0, 287.0, 310.0, 342.0, 392.0, 405.0, 321.0, 255.0, 201.0, 137.0, 103.0, 83.0, 70.0, 52.0, 48.0, 42.0, 39.0, 20.0, 21.0, 13.0, 11.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.6640625, -11.3040771484375, -10.944091796875, -10.5841064453125, -10.22412109375, -9.8641357421875, -9.504150390625, -9.1441650390625, -8.7841796875, -8.4241943359375, -8.064208984375, -7.7042236328125, -7.34423828125, -6.9842529296875, -6.624267578125, -6.2642822265625, -5.904296875, -5.5443115234375, -5.184326171875, -4.8243408203125, -4.46435546875, -4.1043701171875, -3.744384765625, -3.3843994140625, -3.0244140625, -2.6644287109375, -2.304443359375, -1.9444580078125, -1.58447265625, -1.2244873046875, -0.864501953125, -0.5045166015625, -0.14453125, 0.2154541015625, 0.575439453125, 0.9354248046875, 1.29541015625, 1.6553955078125, 2.015380859375, 2.3753662109375, 2.7353515625, 3.0953369140625, 3.455322265625, 3.8153076171875, 4.17529296875, 4.5352783203125, 4.895263671875, 5.2552490234375, 5.615234375, 5.9752197265625, 6.335205078125, 6.6951904296875, 7.05517578125, 7.4151611328125, 7.775146484375, 8.1351318359375, 8.4951171875, 8.8551025390625, 9.215087890625, 9.5750732421875, 9.93505859375, 10.2950439453125, 10.655029296875, 11.0150146484375, 11.375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 4.0, 1.0, 13.0, 7.0, 10.0, 11.0, 16.0, 30.0, 32.0, 30.0, 54.0, 48.0, 75.0, 80.0, 103.0, 146.0, 173.0, 267.0, 399.0, 869.0, 6599.0, 2688803.0, 1489234.0, 5082.0, 800.0, 418.0, 249.0, 165.0, 117.0, 103.0, 76.0, 70.0, 36.0, 40.0, 27.0, 27.0, 12.0, 18.0, 11.0, 12.0, 5.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.625, -41.876953125, -40.12890625, -38.380859375, -36.6328125, -34.884765625, -33.13671875, -31.388671875, -29.640625, -27.892578125, -26.14453125, -24.396484375, -22.6484375, -20.900390625, -19.15234375, -17.404296875, -15.65625, -13.908203125, -12.16015625, -10.412109375, -8.6640625, -6.916015625, -5.16796875, -3.419921875, -1.671875, 0.076171875, 1.82421875, 3.572265625, 5.3203125, 7.068359375, 8.81640625, 10.564453125, 12.3125, 14.060546875, 15.80859375, 17.556640625, 19.3046875, 21.052734375, 22.80078125, 24.548828125, 26.296875, 28.044921875, 29.79296875, 31.541015625, 33.2890625, 35.037109375, 36.78515625, 38.533203125, 40.28125, 42.029296875, 43.77734375, 45.525390625, 47.2734375, 49.021484375, 50.76953125, 52.517578125, 54.265625, 56.013671875, 57.76171875, 59.509765625, 61.2578125, 63.005859375, 64.75390625, 66.501953125, 68.25]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 14.0, 41.0, 103.0, 176.0, 238.0, 231.0, 116.0, 63.0, 16.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.58984375, -22.22252082824707, -18.85519790649414, -15.487876892089844, -12.120553970336914, -8.753231048583984, -5.3859100341796875, -2.018587112426758, 1.3487358093261719, 4.716058254241943, 8.083380699157715, 11.450702667236328, 14.818025588989258, 18.185348510742188, 21.552669525146484, 24.919992446899414, 28.287315368652344, 31.654638290405273, 35.0219612121582, 38.3892822265625, 41.75660705566406, 45.12392807006836, 48.491249084472656, 51.85857391357422, 55.225894927978516, 58.59321594238281, 61.960540771484375, 65.32786560058594, 68.69518280029297, 72.06250762939453, 75.42982482910156, 78.79714965820312, 82.16447448730469, 85.53179931640625, 88.89911651611328, 92.26644134521484, 95.6337661743164, 99.00108337402344, 102.368408203125, 105.73573303222656, 109.10305786132812, 112.47038269042969, 115.83769989013672, 119.20502471923828, 122.57234954833984, 125.93966674804688, 129.30699157714844, 132.67431640625, 136.0416259765625, 139.40895080566406, 142.77627563476562, 146.14358520507812, 149.5109100341797, 152.87823486328125, 156.2455596923828, 159.61288452148438, 162.98020935058594, 166.3475341796875, 169.71485900878906, 173.08218383789062, 176.44949340820312, 179.8168182373047, 183.18414306640625, 186.5514678955078, 189.91879272460938]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 7.0, 10.0, 12.0, 12.0, 3.0, 17.0, 16.0, 15.0, 19.0, 19.0, 23.0, 22.0, 21.0, 26.0, 41.0, 34.0, 41.0, 36.0, 44.0, 38.0, 44.0, 38.0, 47.0, 43.0, 31.0, 41.0, 31.0, 30.0, 23.0, 22.0, 27.0, 20.0, 30.0, 16.0, 12.0, 8.0, 19.0, 9.0, 10.0, 12.0, 5.0, 2.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.049949645996094, -34.77021789550781, -33.49048614501953, -32.21075439453125, -30.93102264404297, -29.651290893554688, -28.371559143066406, -27.091827392578125, -25.812095642089844, -24.532363891601562, -23.25263214111328, -21.972900390625, -20.69316864013672, -19.413436889648438, -18.133705139160156, -16.853973388671875, -15.574239730834961, -14.29450798034668, -13.014776229858398, -11.735044479370117, -10.455312728881836, -9.175580978393555, -7.895848274230957, -6.616116523742676, -5.3363847732543945, -4.056653022766113, -2.776921033859253, -1.4971890449523926, -0.21745729446411133, 1.06227445602417, 2.3420066833496094, 3.6217384338378906, 4.901470184326172, 6.181201934814453, 7.460933685302734, 8.740665435791016, 10.020397186279297, 11.300128936767578, 12.579861640930176, 13.859593391418457, 15.139325141906738, 16.419057846069336, 17.698789596557617, 18.9785213470459, 20.25825309753418, 21.53798484802246, 22.817716598510742, 24.097448348999023, 25.377180099487305, 26.656911849975586, 27.936643600463867, 29.21637535095215, 30.49610710144043, 31.77583885192871, 33.055572509765625, 34.335304260253906, 35.61503601074219, 36.89476776123047, 38.17449951171875, 39.45423126220703, 40.73396301269531, 42.013694763183594, 43.293426513671875, 44.573158264160156, 45.85289001464844]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 20.0, 20.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 18.0, 26.0, 41.0, 45.0, 75.0, 118.0, 158.0, 195.0, 315.0, 476.0, 664.0, 916.0, 1365.0, 1929.0, 2785.0, 4232.0, 6430.0, 9579.0, 14449.0, 22414.0, 35127.0, 55854.0, 89463.0, 146149.0, 227960.0, 159915.0, 97740.0, 60889.0, 37760.0, 24092.0, 15798.0, 10257.0, 6864.0, 4595.0, 3073.0, 2098.0, 1467.0, 964.0, 667.0, 513.0, 286.0, 243.0, 147.0, 123.0, 82.0, 60.0, 32.0, 37.0, 16.0, 11.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0], "bins": [-0.84423828125, -0.8175125122070312, -0.7907867431640625, -0.7640609741210938, -0.737335205078125, -0.7106094360351562, -0.6838836669921875, -0.6571578979492188, -0.63043212890625, -0.6037063598632812, -0.5769805908203125, -0.5502548217773438, -0.523529052734375, -0.49680328369140625, -0.4700775146484375, -0.44335174560546875, -0.4166259765625, -0.38990020751953125, -0.3631744384765625, -0.33644866943359375, -0.309722900390625, -0.28299713134765625, -0.2562713623046875, -0.22954559326171875, -0.20281982421875, -0.17609405517578125, -0.1493682861328125, -0.12264251708984375, -0.095916748046875, -0.06919097900390625, -0.0424652099609375, -0.01573944091796875, 0.010986328125, 0.03771209716796875, 0.0644378662109375, 0.09116363525390625, 0.117889404296875, 0.14461517333984375, 0.1713409423828125, 0.19806671142578125, 0.22479248046875, 0.25151824951171875, 0.2782440185546875, 0.30496978759765625, 0.331695556640625, 0.35842132568359375, 0.3851470947265625, 0.41187286376953125, 0.4385986328125, 0.46532440185546875, 0.4920501708984375, 0.5187759399414062, 0.545501708984375, 0.5722274780273438, 0.5989532470703125, 0.6256790161132812, 0.65240478515625, 0.6791305541992188, 0.7058563232421875, 0.7325820922851562, 0.759307861328125, 0.7860336303710938, 0.8127593994140625, 0.8394851684570312, 0.8662109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 3.0, 6.0, 7.0, 16.0, 18.0, 21.0, 23.0, 31.0, 22.0, 32.0, 48.0, 38.0, 39.0, 31.0, 36.0, 45.0, 44.0, 1077.0, 41.0, 45.0, 48.0, 39.0, 29.0, 41.0, 22.0, 29.0, 27.0, 24.0, 22.0, 21.0, 16.0, 15.0, 11.0, 7.0, 8.0, 6.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.390625, -4.267822265625, -4.14501953125, -4.022216796875, -3.8994140625, -3.776611328125, -3.65380859375, -3.531005859375, -3.408203125, -3.285400390625, -3.16259765625, -3.039794921875, -2.9169921875, -2.794189453125, -2.67138671875, -2.548583984375, -2.42578125, -2.302978515625, -2.18017578125, -2.057373046875, -1.9345703125, -1.811767578125, -1.68896484375, -1.566162109375, -1.443359375, -1.320556640625, -1.19775390625, -1.074951171875, -0.9521484375, -0.829345703125, -0.70654296875, -0.583740234375, -0.4609375, -0.338134765625, -0.21533203125, -0.092529296875, 0.0302734375, 0.153076171875, 0.27587890625, 0.398681640625, 0.521484375, 0.644287109375, 0.76708984375, 0.889892578125, 1.0126953125, 1.135498046875, 1.25830078125, 1.381103515625, 1.50390625, 1.626708984375, 1.74951171875, 1.872314453125, 1.9951171875, 2.117919921875, 2.24072265625, 2.363525390625, 2.486328125, 2.609130859375, 2.73193359375, 2.854736328125, 2.9775390625, 3.100341796875, 3.22314453125, 3.345947265625, 3.46875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 9.0, 9.0, 15.0, 23.0, 33.0, 67.0, 95.0, 124.0, 186.0, 286.0, 452.0, 626.0, 967.0, 1513.0, 2239.0, 3438.0, 5013.0, 7713.0, 12092.0, 18818.0, 30214.0, 49345.0, 83538.0, 149650.0, 1311109.0, 174373.0, 96039.0, 55742.0, 33704.0, 21266.0, 13136.0, 8562.0, 5725.0, 3724.0, 2449.0, 1653.0, 1100.0, 722.0, 446.0, 298.0, 213.0, 134.0, 88.0, 69.0, 33.0, 26.0, 17.0, 13.0, 9.0, 6.0, 2.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.833984375, -0.8067474365234375, -0.779510498046875, -0.7522735595703125, -0.72503662109375, -0.6977996826171875, -0.670562744140625, -0.6433258056640625, -0.6160888671875, -0.5888519287109375, -0.561614990234375, -0.5343780517578125, -0.50714111328125, -0.4799041748046875, -0.452667236328125, -0.4254302978515625, -0.398193359375, -0.3709564208984375, -0.343719482421875, -0.3164825439453125, -0.28924560546875, -0.2620086669921875, -0.234771728515625, -0.2075347900390625, -0.1802978515625, -0.1530609130859375, -0.125823974609375, -0.0985870361328125, -0.07135009765625, -0.0441131591796875, -0.016876220703125, 0.0103607177734375, 0.03759765625, 0.0648345947265625, 0.092071533203125, 0.1193084716796875, 0.14654541015625, 0.1737823486328125, 0.201019287109375, 0.2282562255859375, 0.2554931640625, 0.2827301025390625, 0.309967041015625, 0.3372039794921875, 0.36444091796875, 0.3916778564453125, 0.418914794921875, 0.4461517333984375, 0.473388671875, 0.5006256103515625, 0.527862548828125, 0.5550994873046875, 0.58233642578125, 0.6095733642578125, 0.636810302734375, 0.6640472412109375, 0.6912841796875, 0.7185211181640625, 0.745758056640625, 0.7729949951171875, 0.80023193359375, 0.8274688720703125, 0.854705810546875, 0.8819427490234375, 0.9091796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 6.0, 6.0, 9.0, 14.0, 8.0, 13.0, 11.0, 17.0, 22.0, 26.0, 44.0, 39.0, 45.0, 45.0, 57.0, 69.0, 71.0, 54.0, 71.0, 57.0, 49.0, 45.0, 40.0, 30.0, 23.0, 26.0, 15.0, 15.0, 11.0, 9.0, 15.0, 6.0, 5.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005655288696289062, -0.0005484223365783691, -0.000531315803527832, -0.0005142092704772949, -0.0004971027374267578, -0.0004799962043762207, -0.0004628896713256836, -0.0004457831382751465, -0.0004286766052246094, -0.00041157007217407227, -0.00039446353912353516, -0.00037735700607299805, -0.00036025047302246094, -0.00034314393997192383, -0.0003260374069213867, -0.0003089308738708496, -0.0002918243408203125, -0.0002747178077697754, -0.0002576112747192383, -0.00024050474166870117, -0.00022339820861816406, -0.00020629167556762695, -0.00018918514251708984, -0.00017207860946655273, -0.00015497207641601562, -0.00013786554336547852, -0.0001207590103149414, -0.0001036524772644043, -8.654594421386719e-05, -6.943941116333008e-05, -5.233287811279297e-05, -3.522634506225586e-05, -1.811981201171875e-05, -1.0132789611816406e-06, 1.609325408935547e-05, 3.319978713989258e-05, 5.030632019042969e-05, 6.74128532409668e-05, 8.45193862915039e-05, 0.00010162591934204102, 0.00011873245239257812, 0.00013583898544311523, 0.00015294551849365234, 0.00017005205154418945, 0.00018715858459472656, 0.00020426511764526367, 0.00022137165069580078, 0.0002384781837463379, 0.000255584716796875, 0.0002726912498474121, 0.0002897977828979492, 0.00030690431594848633, 0.00032401084899902344, 0.00034111738204956055, 0.00035822391510009766, 0.00037533044815063477, 0.0003924369812011719, 0.000409543514251709, 0.0004266500473022461, 0.0004437565803527832, 0.0004608631134033203, 0.0004779696464538574, 0.0004950761795043945, 0.0005121827125549316, 0.0005292892456054688]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 12.0, 12.0, 25.0, 20.0, 28.0, 53.0, 77.0, 126.0, 210.0, 491.0, 1654.0, 1016260.0, 27997.0, 780.0, 296.0, 164.0, 102.0, 80.0, 41.0, 38.0, 12.0, 14.0, 15.0, 9.0, 9.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0157012939453125, -0.015190839767456055, -0.01468038558959961, -0.014169931411743164, -0.013659477233886719, -0.013149023056030273, -0.012638568878173828, -0.012128114700317383, -0.011617660522460938, -0.011107206344604492, -0.010596752166748047, -0.010086297988891602, -0.009575843811035156, -0.009065389633178711, -0.008554935455322266, -0.00804448127746582, -0.007534027099609375, -0.00702357292175293, -0.006513118743896484, -0.006002664566040039, -0.005492210388183594, -0.0049817562103271484, -0.004471302032470703, -0.003960847854614258, -0.0034503936767578125, -0.002939939498901367, -0.002429485321044922, -0.0019190311431884766, -0.0014085769653320312, -0.0008981227874755859, -0.0003876686096191406, 0.0001227855682373047, 0.00063323974609375, 0.0011436939239501953, 0.0016541481018066406, 0.002164602279663086, 0.0026750564575195312, 0.0031855106353759766, 0.003695964813232422, 0.004206418991088867, 0.0047168731689453125, 0.005227327346801758, 0.005737781524658203, 0.0062482357025146484, 0.006758689880371094, 0.007269144058227539, 0.007779598236083984, 0.00829005241394043, 0.008800506591796875, 0.00931096076965332, 0.009821414947509766, 0.010331869125366211, 0.010842323303222656, 0.011352777481079102, 0.011863231658935547, 0.012373685836791992, 0.012884140014648438, 0.013394594192504883, 0.013905048370361328, 0.014415502548217773, 0.014925956726074219, 0.015436410903930664, 0.01594686508178711, 0.016457319259643555, 0.0169677734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 105.0, 682.0, 215.0, 9.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009810629999265075, -0.00091396807692945, -0.0008468731539323926, -0.0007797781727276742, -0.0007126832497306168, -0.0006455883267335594, -0.000578493345528841, -0.0005113984225317836, -0.00044430349953472614, -0.0003772085765376687, -0.0003101136244367808, -0.00024301868688780814, -0.00017592374933883548, -0.00010882882634177804, -4.1733874240890145e-05, 2.536107785999775e-05, 9.245600085705519e-05, 0.00015955093840602785, 0.00022664587595500052, 0.0002937408280558884, 0.00036083575105294585, 0.0004279306740500033, 0.0004950256552547216, 0.0005621205782517791, 0.0006292155012488365, 0.000696310424245894, 0.0007634053472429514, 0.0008305003284476697, 0.0008975952514447272, 0.0009646901744417846, 0.001031785155646503, 0.0010988800786435604, 0.0011659751180559397, 0.0012330700410529971, 0.0013001649640500546, 0.001367259887047112, 0.0014343548100441694, 0.0015014498494565487, 0.0015685447724536061, 0.0016356396954506636, 0.001702734618447721, 0.0017698295414447784, 0.0018369244644418359, 0.0019040193874388933, 0.0019711144268512726, 0.002038209233433008, 0.0021053042728453875, 0.0021723993122577667, 0.0022394941188395023, 0.0023065891582518816, 0.002373683964833617, 0.0024407790042459965, 0.002507873810827732, 0.0025749688502401114, 0.002642063656821847, 0.0027091586962342262, 0.002776253502815962, 0.002843348542228341, 0.0029104433488100767, 0.002977538388222456, 0.0030446331948041916, 0.003111728234216571, 0.0031788230407983065, 0.0032459180802106857, 0.003313013119623065]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 6.0, 11.0, 3.0, 5.0, 8.0, 10.0, 15.0, 5.0, 12.0, 29.0, 13.0, 25.0, 31.0, 33.0, 37.0, 43.0, 40.0, 34.0, 38.0, 32.0, 36.0, 36.0, 37.0, 33.0, 30.0, 32.0, 47.0, 33.0, 35.0, 28.0, 24.0, 23.0, 35.0, 16.0, 17.0, 11.0, 13.0, 12.0, 14.0, 9.0, 11.0, 11.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0002714991569519043, -0.0002638213336467743, -0.0002561435103416443, -0.0002484656870365143, -0.00024078786373138428, -0.00023311004042625427, -0.00022543221712112427, -0.00021775439381599426, -0.00021007657051086426, -0.00020239874720573425, -0.00019472092390060425, -0.00018704310059547424, -0.00017936527729034424, -0.00017168745398521423, -0.00016400963068008423, -0.00015633180737495422, -0.00014865398406982422, -0.00014097616076469421, -0.0001332983374595642, -0.0001256205141544342, -0.0001179426908493042, -0.0001102648675441742, -0.00010258704423904419, -9.490922093391418e-05, -8.723139762878418e-05, -7.955357432365417e-05, -7.187575101852417e-05, -6.419792771339417e-05, -5.652010440826416e-05, -4.8842281103134155e-05, -4.116445779800415e-05, -3.3486634492874146e-05, -2.580881118774414e-05, -1.8130987882614136e-05, -1.0453164577484131e-05, -2.775341272354126e-06, 4.902482032775879e-06, 1.2580305337905884e-05, 2.025812864303589e-05, 2.7935951948165894e-05, 3.56137752532959e-05, 4.32915985584259e-05, 5.096942186355591e-05, 5.864724516868591e-05, 6.632506847381592e-05, 7.400289177894592e-05, 8.168071508407593e-05, 8.935853838920593e-05, 9.703636169433594e-05, 0.00010471418499946594, 0.00011239200830459595, 0.00012006983160972595, 0.00012774765491485596, 0.00013542547821998596, 0.00014310330152511597, 0.00015078112483024597, 0.00015845894813537598, 0.00016613677144050598, 0.00017381459474563599, 0.000181492418050766, 0.000189170241355896, 0.000196848064661026, 0.000204525887966156, 0.000212203711271286, 0.00021988153457641602]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 1.0, 13.0, 7.0, 8.0, 15.0, 13.0, 16.0, 21.0, 17.0, 25.0, 30.0, 33.0, 33.0, 36.0, 30.0, 46.0, 31.0, 35.0, 41.0, 26.0, 48.0, 40.0, 39.0, 44.0, 41.0, 27.0, 39.0, 26.0, 28.0, 29.0, 28.0, 16.0, 21.0, 19.0, 15.0, 12.0, 7.0, 14.0, 8.0, 6.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.33203125, -6.1514892578125, -5.970947265625, -5.7904052734375, -5.60986328125, -5.4293212890625, -5.248779296875, -5.0682373046875, -4.8876953125, -4.7071533203125, -4.526611328125, -4.3460693359375, -4.16552734375, -3.9849853515625, -3.804443359375, -3.6239013671875, -3.443359375, -3.2628173828125, -3.082275390625, -2.9017333984375, -2.72119140625, -2.5406494140625, -2.360107421875, -2.1795654296875, -1.9990234375, -1.8184814453125, -1.637939453125, -1.4573974609375, -1.27685546875, -1.0963134765625, -0.915771484375, -0.7352294921875, -0.5546875, -0.3741455078125, -0.193603515625, -0.0130615234375, 0.16748046875, 0.3480224609375, 0.528564453125, 0.7091064453125, 0.8896484375, 1.0701904296875, 1.250732421875, 1.4312744140625, 1.61181640625, 1.7923583984375, 1.972900390625, 2.1534423828125, 2.333984375, 2.5145263671875, 2.695068359375, 2.8756103515625, 3.05615234375, 3.2366943359375, 3.417236328125, 3.5977783203125, 3.7783203125, 3.9588623046875, 4.139404296875, 4.3199462890625, 4.50048828125, 4.6810302734375, 4.861572265625, 5.0421142578125, 5.22265625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 9.0, 10.0, 11.0, 13.0, 25.0, 39.0, 49.0, 80.0, 113.0, 144.0, 227.0, 372.0, 593.0, 969.0, 1526.0, 2629.0, 4192.0, 7286.0, 12230.0, 22611.0, 43806.0, 92643.0, 232976.0, 354338.0, 139737.0, 61580.0, 30810.0, 16265.0, 9209.0, 5593.0, 3174.0, 1956.0, 1249.0, 747.0, 447.0, 283.0, 203.0, 128.0, 85.0, 61.0, 47.0, 30.0, 18.0, 14.0, 11.0, 7.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.00390625, -2.907745361328125, -2.81158447265625, -2.715423583984375, -2.6192626953125, -2.523101806640625, -2.42694091796875, -2.330780029296875, -2.234619140625, -2.138458251953125, -2.04229736328125, -1.946136474609375, -1.8499755859375, -1.753814697265625, -1.65765380859375, -1.561492919921875, -1.46533203125, -1.369171142578125, -1.27301025390625, -1.176849365234375, -1.0806884765625, -0.984527587890625, -0.88836669921875, -0.792205810546875, -0.696044921875, -0.599884033203125, -0.50372314453125, -0.407562255859375, -0.3114013671875, -0.215240478515625, -0.11907958984375, -0.022918701171875, 0.0732421875, 0.169403076171875, 0.26556396484375, 0.361724853515625, 0.4578857421875, 0.554046630859375, 0.65020751953125, 0.746368408203125, 0.842529296875, 0.938690185546875, 1.03485107421875, 1.131011962890625, 1.2271728515625, 1.323333740234375, 1.41949462890625, 1.515655517578125, 1.61181640625, 1.707977294921875, 1.80413818359375, 1.900299072265625, 1.9964599609375, 2.092620849609375, 2.18878173828125, 2.284942626953125, 2.381103515625, 2.477264404296875, 2.57342529296875, 2.669586181640625, 2.7657470703125, 2.861907958984375, 2.95806884765625, 3.054229736328125, 3.150390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 4.0, 6.0, 7.0, 4.0, 7.0, 16.0, 12.0, 18.0, 23.0, 17.0, 27.0, 31.0, 33.0, 47.0, 52.0, 57.0, 102.0, 1565.0, 449.0, 105.0, 56.0, 53.0, 58.0, 47.0, 40.0, 31.0, 25.0, 32.0, 21.0, 22.0, 20.0, 10.0, 13.0, 6.0, 6.0, 4.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.515625, -19.781982421875, -19.04833984375, -18.314697265625, -17.5810546875, -16.847412109375, -16.11376953125, -15.380126953125, -14.646484375, -13.912841796875, -13.17919921875, -12.445556640625, -11.7119140625, -10.978271484375, -10.24462890625, -9.510986328125, -8.77734375, -8.043701171875, -7.31005859375, -6.576416015625, -5.8427734375, -5.109130859375, -4.37548828125, -3.641845703125, -2.908203125, -2.174560546875, -1.44091796875, -0.707275390625, 0.0263671875, 0.760009765625, 1.49365234375, 2.227294921875, 2.9609375, 3.694580078125, 4.42822265625, 5.161865234375, 5.8955078125, 6.629150390625, 7.36279296875, 8.096435546875, 8.830078125, 9.563720703125, 10.29736328125, 11.031005859375, 11.7646484375, 12.498291015625, 13.23193359375, 13.965576171875, 14.69921875, 15.432861328125, 16.16650390625, 16.900146484375, 17.6337890625, 18.367431640625, 19.10107421875, 19.834716796875, 20.568359375, 21.302001953125, 22.03564453125, 22.769287109375, 23.5029296875, 24.236572265625, 24.97021484375, 25.703857421875, 26.4375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 12.0, 15.0, 11.0, 19.0, 26.0, 35.0, 39.0, 49.0, 55.0, 82.0, 125.0, 170.0, 249.0, 349.0, 744.0, 7047.0, 3009985.0, 123302.0, 1951.0, 480.0, 280.0, 172.0, 123.0, 82.0, 69.0, 51.0, 29.0, 29.0, 19.0, 11.0, 11.0, 10.0, 11.0, 13.0, 7.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.6875, -44.2939453125, -42.900390625, -41.5068359375, -40.11328125, -38.7197265625, -37.326171875, -35.9326171875, -34.5390625, -33.1455078125, -31.751953125, -30.3583984375, -28.96484375, -27.5712890625, -26.177734375, -24.7841796875, -23.390625, -21.9970703125, -20.603515625, -19.2099609375, -17.81640625, -16.4228515625, -15.029296875, -13.6357421875, -12.2421875, -10.8486328125, -9.455078125, -8.0615234375, -6.66796875, -5.2744140625, -3.880859375, -2.4873046875, -1.09375, 0.2998046875, 1.693359375, 3.0869140625, 4.48046875, 5.8740234375, 7.267578125, 8.6611328125, 10.0546875, 11.4482421875, 12.841796875, 14.2353515625, 15.62890625, 17.0224609375, 18.416015625, 19.8095703125, 21.203125, 22.5966796875, 23.990234375, 25.3837890625, 26.77734375, 28.1708984375, 29.564453125, 30.9580078125, 32.3515625, 33.7451171875, 35.138671875, 36.5322265625, 37.92578125, 39.3193359375, 40.712890625, 42.1064453125, 43.5]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 51.0, 151.0, 372.0, 297.0, 112.0, 20.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.156606674194336, -27.310348510742188, -25.464088439941406, -23.617830276489258, -21.77157211303711, -19.925312042236328, -18.07905387878418, -16.23279571533203, -14.386536598205566, -12.540277481079102, -10.694019317626953, -8.847760200500488, -7.001501560211182, -5.155242919921875, -3.30898380279541, -1.4627256393432617, 0.3835334777832031, 2.2297921180725098, 4.076050758361816, 5.922309875488281, 7.768568515777588, 9.614827156066895, 11.46108627319336, 13.307344436645508, 15.153603553771973, 16.999862670898438, 18.846120834350586, 20.692378997802734, 22.538639068603516, 24.384897232055664, 26.231155395507812, 28.077415466308594, 29.92367172241211, 31.769929885864258, 33.616188049316406, 35.46244812011719, 37.30870819091797, 39.154964447021484, 41.001224517822266, 42.84748077392578, 44.69374084472656, 46.540000915527344, 48.38625717163086, 50.23251724243164, 52.07877731323242, 53.92503356933594, 55.77129364013672, 57.6175537109375, 59.46381378173828, 61.31007385253906, 63.15633010864258, 65.00259399414062, 66.84884643554688, 68.69510650634766, 70.54136657714844, 72.38762664794922, 74.23387908935547, 76.08013916015625, 77.92639923095703, 79.77265930175781, 81.61891174316406, 83.46517181396484, 85.31143188476562, 87.1576919555664, 89.00395202636719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 10.0, 7.0, 6.0, 18.0, 17.0, 24.0, 14.0, 11.0, 27.0, 26.0, 30.0, 45.0, 29.0, 34.0, 32.0, 29.0, 43.0, 45.0, 59.0, 33.0, 33.0, 38.0, 38.0, 35.0, 46.0, 25.0, 30.0, 24.0, 33.0, 22.0, 21.0, 19.0, 19.0, 8.0, 16.0, 11.0, 7.0, 5.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.529762268066406, -49.7943115234375, -48.058860778808594, -46.32341384887695, -44.58796310424805, -42.85251235961914, -41.117061614990234, -39.381614685058594, -37.64616394042969, -35.91071319580078, -34.175262451171875, -32.439815521240234, -30.704364776611328, -28.968914031982422, -27.233463287353516, -25.498014450073242, -23.762563705444336, -22.02711296081543, -20.291664123535156, -18.55621337890625, -16.820764541625977, -15.08531379699707, -13.34986400604248, -11.61441421508789, -9.8789644241333, -8.143514633178711, -6.408064842224121, -4.672614574432373, -2.937164783477783, -1.2017145156860352, 0.5337352752685547, 2.2691850662231445, 4.004634857177734, 5.740084648132324, 7.475534439086914, 9.21098518371582, 10.946434020996094, 12.681884765625, 14.41733455657959, 16.15278434753418, 17.888233184814453, 19.62368392944336, 21.359132766723633, 23.09458351135254, 24.830032348632812, 26.56548309326172, 28.300933837890625, 30.0363826751709, 31.771833419799805, 33.50728225708008, 35.242733001708984, 36.97818374633789, 38.7136344909668, 40.44908142089844, 42.184532165527344, 43.91998291015625, 45.655433654785156, 47.39088439941406, 49.12633514404297, 50.86178207397461, 52.597232818603516, 54.33268356323242, 56.06813430786133, 57.80358123779297, 59.539031982421875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 10.0, 9.0, 8.0, 16.0, 11.0, 12.0, 16.0, 24.0, 28.0, 32.0, 30.0, 32.0, 41.0, 30.0, 42.0, 39.0, 37.0, 41.0, 40.0, 39.0, 40.0, 42.0, 52.0, 33.0, 29.0, 31.0, 34.0, 31.0, 24.0, 21.0, 18.0, 20.0, 19.0, 11.0, 16.0, 10.0, 7.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.75, -6.55615234375, -6.3623046875, -6.16845703125, -5.974609375, -5.78076171875, -5.5869140625, -5.39306640625, -5.19921875, -5.00537109375, -4.8115234375, -4.61767578125, -4.423828125, -4.22998046875, -4.0361328125, -3.84228515625, -3.6484375, -3.45458984375, -3.2607421875, -3.06689453125, -2.873046875, -2.67919921875, -2.4853515625, -2.29150390625, -2.09765625, -1.90380859375, -1.7099609375, -1.51611328125, -1.322265625, -1.12841796875, -0.9345703125, -0.74072265625, -0.546875, -0.35302734375, -0.1591796875, 0.03466796875, 0.228515625, 0.42236328125, 0.6162109375, 0.81005859375, 1.00390625, 1.19775390625, 1.3916015625, 1.58544921875, 1.779296875, 1.97314453125, 2.1669921875, 2.36083984375, 2.5546875, 2.74853515625, 2.9423828125, 3.13623046875, 3.330078125, 3.52392578125, 3.7177734375, 3.91162109375, 4.10546875, 4.29931640625, 4.4931640625, 4.68701171875, 4.880859375, 5.07470703125, 5.2685546875, 5.46240234375, 5.65625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 9.0, 10.0, 22.0, 26.0, 30.0, 39.0, 51.0, 59.0, 116.0, 149.0, 206.0, 373.0, 578.0, 1210.0, 2707.0, 7473.0, 29676.0, 183918.0, 1015312.0, 1962888.0, 820835.0, 133066.0, 24050.0, 6327.0, 2372.0, 1112.0, 588.0, 338.0, 217.0, 171.0, 82.0, 63.0, 46.0, 48.0, 22.0, 14.0, 19.0, 13.0, 14.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.28125, -8.9949951171875, -8.708740234375, -8.4224853515625, -8.13623046875, -7.8499755859375, -7.563720703125, -7.2774658203125, -6.9912109375, -6.7049560546875, -6.418701171875, -6.1324462890625, -5.84619140625, -5.5599365234375, -5.273681640625, -4.9874267578125, -4.701171875, -4.4149169921875, -4.128662109375, -3.8424072265625, -3.55615234375, -3.2698974609375, -2.983642578125, -2.6973876953125, -2.4111328125, -2.1248779296875, -1.838623046875, -1.5523681640625, -1.26611328125, -0.9798583984375, -0.693603515625, -0.4073486328125, -0.12109375, 0.1651611328125, 0.451416015625, 0.7376708984375, 1.02392578125, 1.3101806640625, 1.596435546875, 1.8826904296875, 2.1689453125, 2.4552001953125, 2.741455078125, 3.0277099609375, 3.31396484375, 3.6002197265625, 3.886474609375, 4.1727294921875, 4.458984375, 4.7452392578125, 5.031494140625, 5.3177490234375, 5.60400390625, 5.8902587890625, 6.176513671875, 6.4627685546875, 6.7490234375, 7.0352783203125, 7.321533203125, 7.6077880859375, 7.89404296875, 8.1802978515625, 8.466552734375, 8.7528076171875, 9.0390625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 8.0, 11.0, 16.0, 30.0, 37.0, 56.0, 68.0, 86.0, 119.0, 134.0, 209.0, 332.0, 396.0, 535.0, 506.0, 374.0, 281.0, 245.0, 178.0, 116.0, 95.0, 66.0, 46.0, 35.0, 26.0, 19.0, 17.0, 11.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3631591796875, -11.906005859375, -11.4488525390625, -10.99169921875, -10.5345458984375, -10.077392578125, -9.6202392578125, -9.1630859375, -8.7059326171875, -8.248779296875, -7.7916259765625, -7.33447265625, -6.8773193359375, -6.420166015625, -5.9630126953125, -5.505859375, -5.0487060546875, -4.591552734375, -4.1343994140625, -3.67724609375, -3.2200927734375, -2.762939453125, -2.3057861328125, -1.8486328125, -1.3914794921875, -0.934326171875, -0.4771728515625, -0.02001953125, 0.4371337890625, 0.894287109375, 1.3514404296875, 1.80859375, 2.2657470703125, 2.722900390625, 3.1800537109375, 3.63720703125, 4.0943603515625, 4.551513671875, 5.0086669921875, 5.4658203125, 5.9229736328125, 6.380126953125, 6.8372802734375, 7.29443359375, 7.7515869140625, 8.208740234375, 8.6658935546875, 9.123046875, 9.5802001953125, 10.037353515625, 10.4945068359375, 10.95166015625, 11.4088134765625, 11.865966796875, 12.3231201171875, 12.7802734375, 13.2374267578125, 13.694580078125, 14.1517333984375, 14.60888671875, 15.0660400390625, 15.523193359375, 15.9803466796875, 16.4375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 12.0, 18.0, 24.0, 25.0, 36.0, 37.0, 54.0, 87.0, 115.0, 167.0, 267.0, 429.0, 1373.0, 137776.0, 4044247.0, 7766.0, 740.0, 361.0, 201.0, 138.0, 110.0, 63.0, 53.0, 38.0, 33.0, 20.0, 16.0, 17.0, 8.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.15625, -59.95849609375, -57.7607421875, -55.56298828125, -53.365234375, -51.16748046875, -48.9697265625, -46.77197265625, -44.57421875, -42.37646484375, -40.1787109375, -37.98095703125, -35.783203125, -33.58544921875, -31.3876953125, -29.18994140625, -26.9921875, -24.79443359375, -22.5966796875, -20.39892578125, -18.201171875, -16.00341796875, -13.8056640625, -11.60791015625, -9.41015625, -7.21240234375, -5.0146484375, -2.81689453125, -0.619140625, 1.57861328125, 3.7763671875, 5.97412109375, 8.171875, 10.36962890625, 12.5673828125, 14.76513671875, 16.962890625, 19.16064453125, 21.3583984375, 23.55615234375, 25.75390625, 27.95166015625, 30.1494140625, 32.34716796875, 34.544921875, 36.74267578125, 38.9404296875, 41.13818359375, 43.3359375, 45.53369140625, 47.7314453125, 49.92919921875, 52.126953125, 54.32470703125, 56.5224609375, 58.72021484375, 60.91796875, 63.11572265625, 65.3134765625, 67.51123046875, 69.708984375, 71.90673828125, 74.1044921875, 76.30224609375, 78.5]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 16.0, 194.0, 529.0, 245.0, 28.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.300514221191406, -44.32118225097656, -36.34185028076172, -28.362516403198242, -20.3831844329834, -12.403850555419922, -4.424518585205078, 3.5548133850097656, 11.53414535522461, 19.513477325439453, 27.492809295654297, 35.472145080566406, 43.45147705078125, 51.430809020996094, 59.41014099121094, 67.38947296142578, 75.36880493164062, 83.34813690185547, 91.32746887207031, 99.30680084228516, 107.2861328125, 115.26547241210938, 123.24479675292969, 131.22413635253906, 139.20346069335938, 147.18280029296875, 155.16212463378906, 163.14146423339844, 171.12078857421875, 179.10012817382812, 187.07945251464844, 195.0587921142578, 203.0381317138672, 211.01747131347656, 218.99679565429688, 226.97613525390625, 234.95545959472656, 242.93479919433594, 250.91412353515625, 258.8934631347656, 266.872802734375, 274.8521423339844, 282.83148193359375, 290.810791015625, 298.7901306152344, 306.76947021484375, 314.7488098144531, 322.7281188964844, 330.70745849609375, 338.6867980957031, 346.6661376953125, 354.64544677734375, 362.6247863769531, 370.6041259765625, 378.5834655761719, 386.5627746582031, 394.5421142578125, 402.5214538574219, 410.50079345703125, 418.4801025390625, 426.4594421386719, 434.43878173828125, 442.4181213378906, 450.3974304199219, 458.37677001953125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 10.0, 13.0, 12.0, 14.0, 25.0, 22.0, 22.0, 31.0, 27.0, 27.0, 37.0, 38.0, 30.0, 41.0, 38.0, 34.0, 43.0, 45.0, 53.0, 42.0, 17.0, 42.0, 41.0, 26.0, 25.0, 33.0, 29.0, 27.0, 26.0, 26.0, 14.0, 13.0, 9.0, 13.0, 8.0, 3.0, 8.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.74163055419922, -44.348087310791016, -42.95454788208008, -41.561004638671875, -40.16746520996094, -38.773921966552734, -37.38037872314453, -35.986839294433594, -34.59329605102539, -33.19975280761719, -31.80621337890625, -30.412670135498047, -29.019128799438477, -27.625587463378906, -26.232046127319336, -24.838504791259766, -23.444963455200195, -22.051422119140625, -20.657880783081055, -19.264339447021484, -17.87079620361328, -16.47725486755371, -15.08371353149414, -13.690171241760254, -12.296629905700684, -10.903088569641113, -9.509546279907227, -8.116004943847656, -6.722463130950928, -5.328921318054199, -3.935379981994629, -2.541837692260742, -1.1482963562011719, 0.2452453374862671, 1.638787031173706, 3.0323286056518555, 4.425870418548584, 5.8194122314453125, 7.212953567504883, 8.60649585723877, 10.00003719329834, 11.39357852935791, 12.787120819091797, 14.180662155151367, 15.574203491210938, 16.96774673461914, 18.361286163330078, 19.75482940673828, 21.14837074279785, 22.541912078857422, 23.935453414916992, 25.328994750976562, 26.722537994384766, 28.116079330444336, 29.509620666503906, 30.90316390991211, 32.29670333862305, 33.69024658203125, 35.08378601074219, 36.47732925415039, 37.87086868286133, 39.26441192626953, 40.65795135498047, 42.05149459838867, 43.445037841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 37.0, 43.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 15.0, 20.0, 24.0, 39.0, 61.0, 93.0, 133.0, 236.0, 333.0, 534.0, 864.0, 1294.0, 2130.0, 3409.0, 5581.0, 8892.0, 14662.0, 24440.0, 42134.0, 74351.0, 136709.0, 251402.0, 214002.0, 113439.0, 63492.0, 35997.0, 21129.0, 12519.0, 7876.0, 4749.0, 2916.0, 1851.0, 1167.0, 714.0, 469.0, 287.0, 229.0, 126.0, 77.0, 46.0, 42.0, 22.0, 15.0, 8.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95654296875, -0.9233932495117188, -0.8902435302734375, -0.8570938110351562, -0.823944091796875, -0.7907943725585938, -0.7576446533203125, -0.7244949340820312, -0.69134521484375, -0.6581954956054688, -0.6250457763671875, -0.5918960571289062, -0.558746337890625, -0.5255966186523438, -0.4924468994140625, -0.45929718017578125, -0.4261474609375, -0.39299774169921875, -0.3598480224609375, -0.32669830322265625, -0.293548583984375, -0.26039886474609375, -0.2272491455078125, -0.19409942626953125, -0.16094970703125, -0.12779998779296875, -0.0946502685546875, -0.06150054931640625, -0.028350830078125, 0.00479888916015625, 0.0379486083984375, 0.07109832763671875, 0.104248046875, 0.13739776611328125, 0.1705474853515625, 0.20369720458984375, 0.236846923828125, 0.26999664306640625, 0.3031463623046875, 0.33629608154296875, 0.36944580078125, 0.40259552001953125, 0.4357452392578125, 0.46889495849609375, 0.502044677734375, 0.5351943969726562, 0.5683441162109375, 0.6014938354492188, 0.6346435546875, 0.6677932739257812, 0.7009429931640625, 0.7340927124023438, 0.767242431640625, 0.8003921508789062, 0.8335418701171875, 0.8666915893554688, 0.89984130859375, 0.9329910278320312, 0.9661407470703125, 0.9992904663085938, 1.032440185546875, 1.0655899047851562, 1.0987396240234375, 1.1318893432617188, 1.1650390625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 11.0, 10.0, 13.0, 26.0, 27.0, 13.0, 27.0, 35.0, 29.0, 29.0, 42.0, 35.0, 40.0, 33.0, 51.0, 48.0, 1065.0, 41.0, 41.0, 32.0, 41.0, 42.0, 31.0, 28.0, 36.0, 26.0, 16.0, 26.0, 19.0, 8.0, 14.0, 14.0, 6.0, 3.0, 9.0, 5.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.443359375, -3.325775146484375, -3.20819091796875, -3.090606689453125, -2.9730224609375, -2.855438232421875, -2.73785400390625, -2.620269775390625, -2.502685546875, -2.385101318359375, -2.26751708984375, -2.149932861328125, -2.0323486328125, -1.914764404296875, -1.79718017578125, -1.679595947265625, -1.56201171875, -1.444427490234375, -1.32684326171875, -1.209259033203125, -1.0916748046875, -0.974090576171875, -0.85650634765625, -0.738922119140625, -0.621337890625, -0.503753662109375, -0.38616943359375, -0.268585205078125, -0.1510009765625, -0.033416748046875, 0.08416748046875, 0.201751708984375, 0.3193359375, 0.436920166015625, 0.55450439453125, 0.672088623046875, 0.7896728515625, 0.907257080078125, 1.02484130859375, 1.142425537109375, 1.260009765625, 1.377593994140625, 1.49517822265625, 1.612762451171875, 1.7303466796875, 1.847930908203125, 1.96551513671875, 2.083099365234375, 2.20068359375, 2.318267822265625, 2.43585205078125, 2.553436279296875, 2.6710205078125, 2.788604736328125, 2.90618896484375, 3.023773193359375, 3.141357421875, 3.258941650390625, 3.37652587890625, 3.494110107421875, 3.6116943359375, 3.729278564453125, 3.84686279296875, 3.964447021484375, 4.08203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 16.0, 11.0, 23.0, 45.0, 53.0, 97.0, 118.0, 214.0, 267.0, 421.0, 574.0, 856.0, 1314.0, 2002.0, 3115.0, 4649.0, 7316.0, 11763.0, 18493.0, 30250.0, 50059.0, 85780.0, 159367.0, 1323726.0, 170074.0, 89833.0, 52398.0, 31235.0, 19162.0, 11937.0, 7608.0, 4863.0, 3198.0, 2044.0, 1376.0, 983.0, 604.0, 392.0, 267.0, 199.0, 131.0, 100.0, 59.0, 45.0, 31.0, 27.0, 12.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.95556640625, -0.9270782470703125, -0.898590087890625, -0.8701019287109375, -0.84161376953125, -0.8131256103515625, -0.784637451171875, -0.7561492919921875, -0.7276611328125, -0.6991729736328125, -0.670684814453125, -0.6421966552734375, -0.61370849609375, -0.5852203369140625, -0.556732177734375, -0.5282440185546875, -0.499755859375, -0.4712677001953125, -0.442779541015625, -0.4142913818359375, -0.38580322265625, -0.3573150634765625, -0.328826904296875, -0.3003387451171875, -0.2718505859375, -0.2433624267578125, -0.214874267578125, -0.1863861083984375, -0.15789794921875, -0.1294097900390625, -0.100921630859375, -0.0724334716796875, -0.0439453125, -0.0154571533203125, 0.013031005859375, 0.0415191650390625, 0.07000732421875, 0.0984954833984375, 0.126983642578125, 0.1554718017578125, 0.1839599609375, 0.2124481201171875, 0.240936279296875, 0.2694244384765625, 0.29791259765625, 0.3264007568359375, 0.354888916015625, 0.3833770751953125, 0.411865234375, 0.4403533935546875, 0.468841552734375, 0.4973297119140625, 0.52581787109375, 0.5543060302734375, 0.582794189453125, 0.6112823486328125, 0.6397705078125, 0.6682586669921875, 0.696746826171875, 0.7252349853515625, 0.75372314453125, 0.7822113037109375, 0.810699462890625, 0.8391876220703125, 0.86767578125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 11.0, 11.0, 11.0, 22.0, 20.0, 26.0, 32.0, 36.0, 53.0, 71.0, 82.0, 69.0, 82.0, 78.0, 58.0, 76.0, 40.0, 41.0, 34.0, 33.0, 19.0, 21.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000858306884765625, -0.0008352473378181458, -0.0008121877908706665, -0.0007891282439231873, -0.000766068696975708, -0.0007430091500282288, -0.0007199496030807495, -0.0006968900561332703, -0.000673830509185791, -0.0006507709622383118, -0.0006277114152908325, -0.0006046518683433533, -0.000581592321395874, -0.0005585327744483948, -0.0005354732275009155, -0.0005124136805534363, -0.000489354133605957, -0.0004662945866584778, -0.00044323503971099854, -0.0004201754927635193, -0.00039711594581604004, -0.0003740563988685608, -0.00035099685192108154, -0.0003279373049736023, -0.00030487775802612305, -0.0002818182110786438, -0.00025875866413116455, -0.0002356991171836853, -0.00021263957023620605, -0.0001895800232887268, -0.00016652047634124756, -0.0001434609293937683, -0.00012040138244628906, -9.734183549880981e-05, -7.428228855133057e-05, -5.122274160385132e-05, -2.816319465637207e-05, -5.103647708892822e-06, 1.7955899238586426e-05, 4.1015446186065674e-05, 6.407499313354492e-05, 8.713454008102417e-05, 0.00011019408702850342, 0.00013325363397598267, 0.00015631318092346191, 0.00017937272787094116, 0.0002024322748184204, 0.00022549182176589966, 0.0002485513687133789, 0.00027161091566085815, 0.0002946704626083374, 0.00031773000955581665, 0.0003407895565032959, 0.00036384910345077515, 0.0003869086503982544, 0.00040996819734573364, 0.0004330277442932129, 0.00045608729124069214, 0.0004791468381881714, 0.0005022063851356506, 0.0005252659320831299, 0.0005483254790306091, 0.0005713850259780884, 0.0005944445729255676, 0.0006175041198730469]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 9.0, 4.0, 8.0, 4.0, 13.0, 15.0, 25.0, 28.0, 29.0, 45.0, 49.0, 98.0, 126.0, 229.0, 505.0, 2101.0, 1024475.0, 19171.0, 811.0, 314.0, 152.0, 94.0, 61.0, 45.0, 35.0, 24.0, 23.0, 17.0, 12.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01293182373046875, -0.01240837574005127, -0.011884927749633789, -0.011361479759216309, -0.010838031768798828, -0.010314583778381348, -0.009791135787963867, -0.009267687797546387, -0.008744239807128906, -0.008220791816711426, -0.007697343826293945, -0.007173895835876465, -0.006650447845458984, -0.006126999855041504, -0.0056035518646240234, -0.005080103874206543, -0.0045566558837890625, -0.004033207893371582, -0.0035097599029541016, -0.002986311912536621, -0.0024628639221191406, -0.0019394159317016602, -0.0014159679412841797, -0.0008925199508666992, -0.00036907196044921875, 0.00015437602996826172, 0.0006778240203857422, 0.0012012720108032227, 0.0017247200012207031, 0.0022481679916381836, 0.002771615982055664, 0.0032950639724731445, 0.003818511962890625, 0.0043419599533081055, 0.004865407943725586, 0.005388855934143066, 0.005912303924560547, 0.006435751914978027, 0.006959199905395508, 0.007482647895812988, 0.008006095886230469, 0.00852954387664795, 0.00905299186706543, 0.00957643985748291, 0.01009988784790039, 0.010623335838317871, 0.011146783828735352, 0.011670231819152832, 0.012193679809570312, 0.012717127799987793, 0.013240575790405273, 0.013764023780822754, 0.014287471771240234, 0.014810919761657715, 0.015334367752075195, 0.015857815742492676, 0.016381263732910156, 0.016904711723327637, 0.017428159713745117, 0.017951607704162598, 0.018475055694580078, 0.01899850368499756, 0.01952195167541504, 0.02004539966583252, 0.02056884765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 206.0, 599.0, 181.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001273144967854023, -0.001213787472806871, -0.001154429977759719, -0.0010950724827125669, -0.0010357149876654148, -0.0009763575508259237, -0.0009170001139864326, -0.0008576426189392805, -0.0007982851238921285, -0.0007389276288449764, -0.0006795701337978244, -0.0006202126969583333, -0.0005608552019111812, -0.0005014977068640292, -0.0004421402409207076, -0.000382782774977386, -0.00032342527993023396, -0.0002640677848830819, -0.00020471031893976033, -0.0001453528384445235, -8.59953579492867e-05, -2.6637862902134657e-05, 3.271960304118693e-05, 9.207706898450851e-05, 0.00015143456403166056, 0.00021079204452689737, 0.0002701495250221342, 0.00032950699096545577, 0.0003888644860126078, 0.00044822198105975986, 0.000507579417899251, 0.000566936912946403, 0.0006262944079935551, 0.0006856519030407071, 0.0007450093980878592, 0.0008043668349273503, 0.0008637243299745023, 0.0009230818250216544, 0.0009824392618611455, 0.0010417967569082975, 0.0011011542519554496, 0.0011605117470026016, 0.0012198692420497537, 0.0012792267370969057, 0.001338584115728736, 0.0013979417271912098, 0.00145729910582304, 0.001516656600870192, 0.001576014095917344, 0.0016353715909644961, 0.0016947290860116482, 0.0017540865810588002, 0.0018134440761059523, 0.0018728014547377825, 0.0019321589497849345, 0.0019915164448320866, 0.0020508738234639168, 0.002110231202095747, 0.002169588813558221, 0.002228946192190051, 0.002288303803652525, 0.002347661182284355, 0.002407018793746829, 0.0024663761723786592, 0.002525733783841133]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 8.0, 15.0, 13.0, 17.0, 12.0, 21.0, 20.0, 25.0, 31.0, 38.0, 41.0, 35.0, 35.0, 50.0, 38.0, 58.0, 40.0, 45.0, 39.0, 47.0, 53.0, 39.0, 48.0, 41.0, 23.0, 25.0, 28.0, 23.0, 22.0, 11.0, 13.0, 7.0, 9.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037992000579833984, -0.0003685504198074341, -0.0003571808338165283, -0.00034581124782562256, -0.0003344416618347168, -0.00032307207584381104, -0.0003117024898529053, -0.0003003329038619995, -0.00028896331787109375, -0.000277593731880188, -0.0002662241458892822, -0.00025485455989837646, -0.0002434849739074707, -0.00023211538791656494, -0.00022074580192565918, -0.00020937621593475342, -0.00019800662994384766, -0.0001866370439529419, -0.00017526745796203613, -0.00016389787197113037, -0.0001525282859802246, -0.00014115869998931885, -0.00012978911399841309, -0.00011841952800750732, -0.00010704994201660156, -9.56803560256958e-05, -8.431077003479004e-05, -7.294118404388428e-05, -6.157159805297852e-05, -5.0202012062072754e-05, -3.883242607116699e-05, -2.746284008026123e-05, -1.609325408935547e-05, -4.723668098449707e-06, 6.645917892456055e-06, 1.8015503883361816e-05, 2.9385089874267578e-05, 4.075467586517334e-05, 5.21242618560791e-05, 6.349384784698486e-05, 7.486343383789062e-05, 8.623301982879639e-05, 9.760260581970215e-05, 0.00010897219181060791, 0.00012034177780151367, 0.00013171136379241943, 0.0001430809497833252, 0.00015445053577423096, 0.00016582012176513672, 0.00017718970775604248, 0.00018855929374694824, 0.000199928879737854, 0.00021129846572875977, 0.00022266805171966553, 0.0002340376377105713, 0.00024540722370147705, 0.0002567768096923828, 0.0002681463956832886, 0.00027951598167419434, 0.0002908855676651001, 0.00030225515365600586, 0.0003136247396469116, 0.0003249943256378174, 0.00033636391162872314, 0.0003477334976196289]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 2.0, 6.0, 6.0, 14.0, 16.0, 9.0, 17.0, 15.0, 25.0, 37.0, 25.0, 25.0, 28.0, 36.0, 42.0, 49.0, 43.0, 47.0, 37.0, 51.0, 44.0, 43.0, 40.0, 38.0, 42.0, 33.0, 40.0, 24.0, 35.0, 26.0, 26.0, 17.0, 12.0, 17.0, 7.0, 8.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.90234375, -6.6944580078125, -6.486572265625, -6.2786865234375, -6.07080078125, -5.8629150390625, -5.655029296875, -5.4471435546875, -5.2392578125, -5.0313720703125, -4.823486328125, -4.6156005859375, -4.40771484375, -4.1998291015625, -3.991943359375, -3.7840576171875, -3.576171875, -3.3682861328125, -3.160400390625, -2.9525146484375, -2.74462890625, -2.5367431640625, -2.328857421875, -2.1209716796875, -1.9130859375, -1.7052001953125, -1.497314453125, -1.2894287109375, -1.08154296875, -0.8736572265625, -0.665771484375, -0.4578857421875, -0.25, -0.0421142578125, 0.165771484375, 0.3736572265625, 0.58154296875, 0.7894287109375, 0.997314453125, 1.2052001953125, 1.4130859375, 1.6209716796875, 1.828857421875, 2.0367431640625, 2.24462890625, 2.4525146484375, 2.660400390625, 2.8682861328125, 3.076171875, 3.2840576171875, 3.491943359375, 3.6998291015625, 3.90771484375, 4.1156005859375, 4.323486328125, 4.5313720703125, 4.7392578125, 4.9471435546875, 5.155029296875, 5.3629150390625, 5.57080078125, 5.7786865234375, 5.986572265625, 6.1944580078125, 6.40234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 19.0, 18.0, 14.0, 22.0, 35.0, 65.0, 92.0, 106.0, 161.0, 232.0, 362.0, 594.0, 1046.0, 1934.0, 3851.0, 8274.0, 17506.0, 37971.0, 84670.0, 199725.0, 366990.0, 180739.0, 77462.0, 35009.0, 16119.0, 7426.0, 3543.0, 1886.0, 954.0, 566.0, 384.0, 244.0, 149.0, 115.0, 74.0, 61.0, 33.0, 30.0, 13.0, 13.0, 12.0, 12.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.75177001953125, -3.6285400390625, -3.50531005859375, -3.382080078125, -3.25885009765625, -3.1356201171875, -3.01239013671875, -2.88916015625, -2.76593017578125, -2.6427001953125, -2.51947021484375, -2.396240234375, -2.27301025390625, -2.1497802734375, -2.02655029296875, -1.9033203125, -1.78009033203125, -1.6568603515625, -1.53363037109375, -1.410400390625, -1.28717041015625, -1.1639404296875, -1.04071044921875, -0.91748046875, -0.79425048828125, -0.6710205078125, -0.54779052734375, -0.424560546875, -0.30133056640625, -0.1781005859375, -0.05487060546875, 0.068359375, 0.19158935546875, 0.3148193359375, 0.43804931640625, 0.561279296875, 0.68450927734375, 0.8077392578125, 0.93096923828125, 1.05419921875, 1.17742919921875, 1.3006591796875, 1.42388916015625, 1.547119140625, 1.67034912109375, 1.7935791015625, 1.91680908203125, 2.0400390625, 2.16326904296875, 2.2864990234375, 2.40972900390625, 2.532958984375, 2.65618896484375, 2.7794189453125, 2.90264892578125, 3.02587890625, 3.14910888671875, 3.2723388671875, 3.39556884765625, 3.518798828125, 3.64202880859375, 3.7652587890625, 3.88848876953125, 4.01171875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 3.0, 1.0, 4.0, 9.0, 10.0, 11.0, 11.0, 16.0, 24.0, 33.0, 31.0, 39.0, 25.0, 44.0, 53.0, 53.0, 61.0, 111.0, 1536.0, 454.0, 121.0, 58.0, 41.0, 48.0, 37.0, 32.0, 31.0, 30.0, 28.0, 17.0, 13.0, 12.0, 9.0, 10.0, 6.0, 8.0, 9.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-28.84375, -28.063720703125, -27.28369140625, -26.503662109375, -25.7236328125, -24.943603515625, -24.16357421875, -23.383544921875, -22.603515625, -21.823486328125, -21.04345703125, -20.263427734375, -19.4833984375, -18.703369140625, -17.92333984375, -17.143310546875, -16.36328125, -15.583251953125, -14.80322265625, -14.023193359375, -13.2431640625, -12.463134765625, -11.68310546875, -10.903076171875, -10.123046875, -9.343017578125, -8.56298828125, -7.782958984375, -7.0029296875, -6.222900390625, -5.44287109375, -4.662841796875, -3.8828125, -3.102783203125, -2.32275390625, -1.542724609375, -0.7626953125, 0.017333984375, 0.79736328125, 1.577392578125, 2.357421875, 3.137451171875, 3.91748046875, 4.697509765625, 5.4775390625, 6.257568359375, 7.03759765625, 7.817626953125, 8.59765625, 9.377685546875, 10.15771484375, 10.937744140625, 11.7177734375, 12.497802734375, 13.27783203125, 14.057861328125, 14.837890625, 15.617919921875, 16.39794921875, 17.177978515625, 17.9580078125, 18.738037109375, 19.51806640625, 20.298095703125, 21.078125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 8.0, 12.0, 10.0, 10.0, 20.0, 21.0, 22.0, 30.0, 48.0, 75.0, 94.0, 125.0, 164.0, 281.0, 456.0, 1595.0, 78745.0, 3056121.0, 5950.0, 705.0, 344.0, 238.0, 174.0, 105.0, 70.0, 72.0, 44.0, 39.0, 33.0, 15.0, 19.0, 12.0, 12.0, 9.0, 4.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.25, -46.4794921875, -44.708984375, -42.9384765625, -41.16796875, -39.3974609375, -37.626953125, -35.8564453125, -34.0859375, -32.3154296875, -30.544921875, -28.7744140625, -27.00390625, -25.2333984375, -23.462890625, -21.6923828125, -19.921875, -18.1513671875, -16.380859375, -14.6103515625, -12.83984375, -11.0693359375, -9.298828125, -7.5283203125, -5.7578125, -3.9873046875, -2.216796875, -0.4462890625, 1.32421875, 3.0947265625, 4.865234375, 6.6357421875, 8.40625, 10.1767578125, 11.947265625, 13.7177734375, 15.48828125, 17.2587890625, 19.029296875, 20.7998046875, 22.5703125, 24.3408203125, 26.111328125, 27.8818359375, 29.65234375, 31.4228515625, 33.193359375, 34.9638671875, 36.734375, 38.5048828125, 40.275390625, 42.0458984375, 43.81640625, 45.5869140625, 47.357421875, 49.1279296875, 50.8984375, 52.6689453125, 54.439453125, 56.2099609375, 57.98046875, 59.7509765625, 61.521484375, 63.2919921875, 65.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 34.0, 95.0, 232.0, 364.0, 198.0, 65.0, 14.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.634822845458984, -10.941692352294922, -9.248560905456543, -7.555429935455322, -5.862298965454102, -4.169168472290039, -2.47603702545166, -0.7829055786132812, 0.9102249145507812, 2.603355884552002, 4.296486854553223, 5.989617824554443, 7.682748794555664, 9.375879287719727, 11.069010734558105, 12.762142181396484, 14.455272674560547, 16.14840316772461, 17.841533660888672, 19.534666061401367, 21.22779655456543, 22.920927047729492, 24.614059448242188, 26.30718994140625, 28.000320434570312, 29.693450927734375, 31.386581420898438, 33.0797119140625, 34.77284240722656, 36.465972900390625, 38.15910720825195, 39.852237701416016, 41.54536437988281, 43.238494873046875, 44.93162536621094, 46.624755859375, 48.31788635253906, 50.011016845703125, 51.70415115356445, 53.397281646728516, 55.09041213989258, 56.78354263305664, 58.4766731262207, 60.169803619384766, 61.862937927246094, 63.556068420410156, 65.24919891357422, 66.94232940673828, 68.63545989990234, 70.3285903930664, 72.02172088623047, 73.71485137939453, 75.4079818725586, 77.10111236572266, 78.79424285888672, 80.48738098144531, 82.18051147460938, 83.87364196777344, 85.5667724609375, 87.25990295410156, 88.95303344726562, 90.64616394042969, 92.33929443359375, 94.03242492675781, 95.72555541992188]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 2.0, 6.0, 6.0, 11.0, 9.0, 9.0, 20.0, 21.0, 22.0, 29.0, 25.0, 31.0, 32.0, 47.0, 34.0, 43.0, 48.0, 46.0, 40.0, 49.0, 49.0, 62.0, 26.0, 48.0, 49.0, 37.0, 37.0, 37.0, 25.0, 20.0, 20.0, 21.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.82101058959961, -55.9080924987793, -53.995174407958984, -52.08225631713867, -50.169334411621094, -48.25641632080078, -46.34349822998047, -44.430580139160156, -42.517662048339844, -40.60474395751953, -38.69182586669922, -36.778907775878906, -34.865989685058594, -32.95307159423828, -31.040149688720703, -29.12723159790039, -27.214313507080078, -25.301395416259766, -23.388477325439453, -21.475557327270508, -19.562639236450195, -17.649721145629883, -15.736802101135254, -13.823883056640625, -11.910964965820312, -9.998046875, -8.085127830505371, -6.1722092628479, -4.25929069519043, -2.346372604370117, -0.4334535598754883, 1.4794654846191406, 3.3923873901367188, 5.3053059577941895, 7.21822452545166, 9.131143569946289, 11.044061660766602, 12.956979751586914, 14.869898796081543, 16.782817840576172, 18.695735931396484, 20.608654022216797, 22.52157211303711, 24.434492111206055, 26.347410202026367, 28.26032829284668, 30.173248291015625, 32.08616638183594, 33.99908447265625, 35.91200256347656, 37.824920654296875, 39.73783874511719, 41.6507568359375, 43.56367492675781, 45.47659683227539, 47.3895149230957, 49.302433013916016, 51.21535110473633, 53.12826919555664, 55.04118728637695, 56.95410919189453, 58.867027282714844, 60.779945373535156, 62.69286346435547, 64.60578155517578]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 4.0, 8.0, 16.0, 14.0, 11.0, 17.0, 25.0, 19.0, 23.0, 20.0, 41.0, 31.0, 37.0, 40.0, 36.0, 47.0, 54.0, 44.0, 46.0, 55.0, 38.0, 27.0, 40.0, 46.0, 38.0, 27.0, 38.0, 28.0, 23.0, 25.0, 26.0, 11.0, 10.0, 10.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.97265625, -6.75579833984375, -6.5389404296875, -6.32208251953125, -6.105224609375, -5.88836669921875, -5.6715087890625, -5.45465087890625, -5.23779296875, -5.02093505859375, -4.8040771484375, -4.58721923828125, -4.370361328125, -4.15350341796875, -3.9366455078125, -3.71978759765625, -3.5029296875, -3.28607177734375, -3.0692138671875, -2.85235595703125, -2.635498046875, -2.41864013671875, -2.2017822265625, -1.98492431640625, -1.76806640625, -1.55120849609375, -1.3343505859375, -1.11749267578125, -0.900634765625, -0.68377685546875, -0.4669189453125, -0.25006103515625, -0.033203125, 0.18365478515625, 0.4005126953125, 0.61737060546875, 0.834228515625, 1.05108642578125, 1.2679443359375, 1.48480224609375, 1.70166015625, 1.91851806640625, 2.1353759765625, 2.35223388671875, 2.569091796875, 2.78594970703125, 3.0028076171875, 3.21966552734375, 3.4365234375, 3.65338134765625, 3.8702392578125, 4.08709716796875, 4.303955078125, 4.52081298828125, 4.7376708984375, 4.95452880859375, 5.17138671875, 5.38824462890625, 5.6051025390625, 5.82196044921875, 6.038818359375, 6.25567626953125, 6.4725341796875, 6.68939208984375, 6.90625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 4.0, 6.0, 7.0, 14.0, 19.0, 16.0, 17.0, 24.0, 28.0, 33.0, 28.0, 43.0, 47.0, 86.0, 295.0, 1455.0, 31883.0, 2953219.0, 1195165.0, 10505.0, 816.0, 193.0, 77.0, 45.0, 48.0, 33.0, 33.0, 30.0, 24.0, 17.0, 22.0, 13.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.53125, -25.642578125, -24.75390625, -23.865234375, -22.9765625, -22.087890625, -21.19921875, -20.310546875, -19.421875, -18.533203125, -17.64453125, -16.755859375, -15.8671875, -14.978515625, -14.08984375, -13.201171875, -12.3125, -11.423828125, -10.53515625, -9.646484375, -8.7578125, -7.869140625, -6.98046875, -6.091796875, -5.203125, -4.314453125, -3.42578125, -2.537109375, -1.6484375, -0.759765625, 0.12890625, 1.017578125, 1.90625, 2.794921875, 3.68359375, 4.572265625, 5.4609375, 6.349609375, 7.23828125, 8.126953125, 9.015625, 9.904296875, 10.79296875, 11.681640625, 12.5703125, 13.458984375, 14.34765625, 15.236328125, 16.125, 17.013671875, 17.90234375, 18.791015625, 19.6796875, 20.568359375, 21.45703125, 22.345703125, 23.234375, 24.123046875, 25.01171875, 25.900390625, 26.7890625, 27.677734375, 28.56640625, 29.455078125, 30.34375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 9.0, 6.0, 12.0, 18.0, 16.0, 29.0, 19.0, 54.0, 64.0, 83.0, 97.0, 160.0, 167.0, 239.0, 297.0, 397.0, 482.0, 432.0, 350.0, 286.0, 206.0, 173.0, 118.0, 82.0, 87.0, 40.0, 41.0, 33.0, 21.0, 16.0, 13.0, 6.0, 12.0, 7.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1484375, -12.7479248046875, -12.347412109375, -11.9468994140625, -11.54638671875, -11.1458740234375, -10.745361328125, -10.3448486328125, -9.9443359375, -9.5438232421875, -9.143310546875, -8.7427978515625, -8.34228515625, -7.9417724609375, -7.541259765625, -7.1407470703125, -6.740234375, -6.3397216796875, -5.939208984375, -5.5386962890625, -5.13818359375, -4.7376708984375, -4.337158203125, -3.9366455078125, -3.5361328125, -3.1356201171875, -2.735107421875, -2.3345947265625, -1.93408203125, -1.5335693359375, -1.133056640625, -0.7325439453125, -0.33203125, 0.0684814453125, 0.468994140625, 0.8695068359375, 1.27001953125, 1.6705322265625, 2.071044921875, 2.4715576171875, 2.8720703125, 3.2725830078125, 3.673095703125, 4.0736083984375, 4.47412109375, 4.8746337890625, 5.275146484375, 5.6756591796875, 6.076171875, 6.4766845703125, 6.877197265625, 7.2777099609375, 7.67822265625, 8.0787353515625, 8.479248046875, 8.8797607421875, 9.2802734375, 9.6807861328125, 10.081298828125, 10.4818115234375, 10.88232421875, 11.2828369140625, 11.683349609375, 12.0838623046875, 12.484375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 16.0, 17.0, 14.0, 26.0, 18.0, 26.0, 41.0, 49.0, 74.0, 84.0, 138.0, 173.0, 288.0, 554.0, 2531.0, 1972171.0, 2213831.0, 2561.0, 603.0, 310.0, 208.0, 136.0, 90.0, 79.0, 48.0, 26.0, 34.0, 25.0, 24.0, 9.0, 10.0, 9.0, 11.0, 14.0, 3.0, 4.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-65.375, -63.2666015625, -61.158203125, -59.0498046875, -56.94140625, -54.8330078125, -52.724609375, -50.6162109375, -48.5078125, -46.3994140625, -44.291015625, -42.1826171875, -40.07421875, -37.9658203125, -35.857421875, -33.7490234375, -31.640625, -29.5322265625, -27.423828125, -25.3154296875, -23.20703125, -21.0986328125, -18.990234375, -16.8818359375, -14.7734375, -12.6650390625, -10.556640625, -8.4482421875, -6.33984375, -4.2314453125, -2.123046875, -0.0146484375, 2.09375, 4.2021484375, 6.310546875, 8.4189453125, 10.52734375, 12.6357421875, 14.744140625, 16.8525390625, 18.9609375, 21.0693359375, 23.177734375, 25.2861328125, 27.39453125, 29.5029296875, 31.611328125, 33.7197265625, 35.828125, 37.9365234375, 40.044921875, 42.1533203125, 44.26171875, 46.3701171875, 48.478515625, 50.5869140625, 52.6953125, 54.8037109375, 56.912109375, 59.0205078125, 61.12890625, 63.2373046875, 65.345703125, 67.4541015625, 69.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [4.0, 5.0, 100.0, 481.0, 361.0, 65.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.876556396484375, -22.218677520751953, -14.560799598693848, -6.902921676635742, 0.7549571990966797, 8.412834167480469, 16.07071304321289, 23.728591918945312, 31.386470794677734, 39.044349670410156, 46.70222854614258, 54.360107421875, 62.017982482910156, 69.67585754394531, 77.333740234375, 84.99162292480469, 92.64949798583984, 100.307373046875, 107.96525573730469, 115.62313079833984, 123.28101348876953, 130.9388885498047, 138.59677124023438, 146.254638671875, 153.9125213623047, 161.57040405273438, 169.228271484375, 176.8861541748047, 184.54403686523438, 192.201904296875, 199.8597869873047, 207.51766967773438, 215.17555236816406, 222.83343505859375, 230.49130249023438, 238.14918518066406, 245.80706787109375, 253.46493530273438, 261.1228332519531, 268.78070068359375, 276.4385681152344, 284.096435546875, 291.75433349609375, 299.4122009277344, 307.070068359375, 314.72796630859375, 322.3858337402344, 330.043701171875, 337.70159912109375, 345.3594665527344, 353.0173645019531, 360.67523193359375, 368.3330993652344, 375.9909973144531, 383.64886474609375, 391.3067626953125, 398.9646301269531, 406.62249755859375, 414.2803955078125, 421.9382629394531, 429.59613037109375, 437.2540283203125, 444.9118957519531, 452.56976318359375, 460.2276611328125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 4.0, 8.0, 4.0, 13.0, 12.0, 22.0, 20.0, 16.0, 17.0, 26.0, 27.0, 19.0, 26.0, 20.0, 30.0, 44.0, 53.0, 39.0, 31.0, 43.0, 41.0, 43.0, 40.0, 40.0, 34.0, 29.0, 43.0, 31.0, 17.0, 25.0, 20.0, 28.0, 15.0, 18.0, 16.0, 17.0, 15.0, 8.0, 13.0, 5.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0], "bins": [-43.180816650390625, -41.95011520385742, -40.71941375732422, -39.488712310791016, -38.25801086425781, -37.02730941772461, -35.796607971191406, -34.56590270996094, -33.335205078125, -32.1045036315918, -30.873802185058594, -29.64310073852539, -28.412399291992188, -27.181697845458984, -25.95099449157715, -24.720293045043945, -23.48958969116211, -22.258888244628906, -21.028186798095703, -19.7974853515625, -18.566783905029297, -17.336082458496094, -16.105379104614258, -14.874677658081055, -13.643976211547852, -12.413274765014648, -11.182573318481445, -9.951870918273926, -8.721169471740723, -7.4904680252075195, -6.259766101837158, -5.029064178466797, -3.798358917236328, -2.567657232284546, -1.3369555473327637, -0.10625386238098145, 1.1244478225708008, 2.355149269104004, 3.5858511924743652, 4.816553115844727, 6.04725456237793, 7.277956008911133, 8.508657455444336, 9.739359855651855, 10.970061302185059, 12.200762748718262, 13.431465148925781, 14.662166595458984, 15.892868041992188, 17.12356948852539, 18.354270935058594, 19.584972381591797, 20.815673828125, 22.046375274658203, 23.27707862854004, 24.507780075073242, 25.738481521606445, 26.96918296813965, 28.19988441467285, 29.430585861206055, 30.66128921508789, 31.891990661621094, 33.1226921081543, 34.3533935546875, 35.5840950012207]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 13.0, 28.0, 30.0, 42.0, 59.0, 96.0, 119.0, 208.0, 312.0, 477.0, 735.0, 1123.0, 1750.0, 2727.0, 4466.0, 6779.0, 10907.0, 17343.0, 27910.0, 45204.0, 75650.0, 128731.0, 226243.0, 203187.0, 116444.0, 67905.0, 41163.0, 25756.0, 15902.0, 9932.0, 6246.0, 3893.0, 2545.0, 1611.0, 1035.0, 672.0, 477.0, 247.0, 191.0, 131.0, 80.0, 63.0, 38.0, 25.0, 14.0, 14.0, 7.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-1.0224609375, -0.9913864135742188, -0.9603118896484375, -0.9292373657226562, -0.898162841796875, -0.8670883178710938, -0.8360137939453125, -0.8049392700195312, -0.77386474609375, -0.7427902221679688, -0.7117156982421875, -0.6806411743164062, -0.649566650390625, -0.6184921264648438, -0.5874176025390625, -0.5563430786132812, -0.5252685546875, -0.49419403076171875, -0.4631195068359375, -0.43204498291015625, -0.400970458984375, -0.36989593505859375, -0.3388214111328125, -0.30774688720703125, -0.27667236328125, -0.24559783935546875, -0.2145233154296875, -0.18344879150390625, -0.152374267578125, -0.12129974365234375, -0.0902252197265625, -0.05915069580078125, -0.028076171875, 0.00299835205078125, 0.0340728759765625, 0.06514739990234375, 0.096221923828125, 0.12729644775390625, 0.1583709716796875, 0.18944549560546875, 0.22052001953125, 0.25159454345703125, 0.2826690673828125, 0.31374359130859375, 0.344818115234375, 0.37589263916015625, 0.4069671630859375, 0.43804168701171875, 0.4691162109375, 0.5001907348632812, 0.5312652587890625, 0.5623397827148438, 0.593414306640625, 0.6244888305664062, 0.6555633544921875, 0.6866378784179688, 0.71771240234375, 0.7487869262695312, 0.7798614501953125, 0.8109359741210938, 0.842010498046875, 0.8730850219726562, 0.9041595458984375, 0.9352340698242188, 0.96630859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 15.0, 10.0, 9.0, 22.0, 22.0, 31.0, 21.0, 35.0, 31.0, 28.0, 36.0, 25.0, 40.0, 44.0, 36.0, 21.0, 1074.0, 39.0, 47.0, 40.0, 45.0, 31.0, 31.0, 26.0, 33.0, 25.0, 22.0, 27.0, 15.0, 19.0, 13.0, 20.0, 10.0, 10.0, 6.0, 6.0, 1.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.23046875, -4.110504150390625, -3.99053955078125, -3.870574951171875, -3.7506103515625, -3.630645751953125, -3.51068115234375, -3.390716552734375, -3.270751953125, -3.150787353515625, -3.03082275390625, -2.910858154296875, -2.7908935546875, -2.670928955078125, -2.55096435546875, -2.430999755859375, -2.31103515625, -2.191070556640625, -2.07110595703125, -1.951141357421875, -1.8311767578125, -1.711212158203125, -1.59124755859375, -1.471282958984375, -1.351318359375, -1.231353759765625, -1.11138916015625, -0.991424560546875, -0.8714599609375, -0.751495361328125, -0.63153076171875, -0.511566162109375, -0.3916015625, -0.271636962890625, -0.15167236328125, -0.031707763671875, 0.0882568359375, 0.208221435546875, 0.32818603515625, 0.448150634765625, 0.568115234375, 0.688079833984375, 0.80804443359375, 0.928009033203125, 1.0479736328125, 1.167938232421875, 1.28790283203125, 1.407867431640625, 1.52783203125, 1.647796630859375, 1.76776123046875, 1.887725830078125, 2.0076904296875, 2.127655029296875, 2.24761962890625, 2.367584228515625, 2.487548828125, 2.607513427734375, 2.72747802734375, 2.847442626953125, 2.9674072265625, 3.087371826171875, 3.20733642578125, 3.327301025390625, 3.447265625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 1.0, 12.0, 9.0, 16.0, 36.0, 42.0, 60.0, 100.0, 137.0, 226.0, 321.0, 480.0, 745.0, 1147.0, 1760.0, 2647.0, 4067.0, 6166.0, 9447.0, 14891.0, 23799.0, 38560.0, 63901.0, 110809.0, 207837.0, 1290866.0, 128780.0, 73040.0, 43675.0, 26538.0, 16804.0, 10623.0, 6832.0, 4327.0, 2890.0, 1933.0, 1219.0, 840.0, 520.0, 336.0, 214.0, 177.0, 104.0, 82.0, 37.0, 36.0, 16.0, 11.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.89013671875, -0.8605880737304688, -0.8310394287109375, -0.8014907836914062, -0.771942138671875, -0.7423934936523438, -0.7128448486328125, -0.6832962036132812, -0.65374755859375, -0.6241989135742188, -0.5946502685546875, -0.5651016235351562, -0.535552978515625, -0.5060043334960938, -0.4764556884765625, -0.44690704345703125, -0.4173583984375, -0.38780975341796875, -0.3582611083984375, -0.32871246337890625, -0.299163818359375, -0.26961517333984375, -0.2400665283203125, -0.21051788330078125, -0.18096923828125, -0.15142059326171875, -0.1218719482421875, -0.09232330322265625, -0.062774658203125, -0.03322601318359375, -0.0036773681640625, 0.02587127685546875, 0.055419921875, 0.08496856689453125, 0.1145172119140625, 0.14406585693359375, 0.173614501953125, 0.20316314697265625, 0.2327117919921875, 0.26226043701171875, 0.29180908203125, 0.32135772705078125, 0.3509063720703125, 0.38045501708984375, 0.410003662109375, 0.43955230712890625, 0.4691009521484375, 0.49864959716796875, 0.5281982421875, 0.5577468872070312, 0.5872955322265625, 0.6168441772460938, 0.646392822265625, 0.6759414672851562, 0.7054901123046875, 0.7350387573242188, 0.76458740234375, 0.7941360473632812, 0.8236846923828125, 0.8532333374023438, 0.882781982421875, 0.9123306274414062, 0.9418792724609375, 0.9714279174804688, 1.0009765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 11.0, 8.0, 6.0, 14.0, 11.0, 16.0, 14.0, 23.0, 21.0, 31.0, 40.0, 57.0, 56.0, 68.0, 59.0, 74.0, 92.0, 77.0, 61.0, 63.0, 37.0, 29.0, 28.0, 25.0, 17.0, 14.0, 5.0, 10.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0008139610290527344, -0.0007902905344963074, -0.0007666200399398804, -0.0007429495453834534, -0.0007192790508270264, -0.0006956085562705994, -0.0006719380617141724, -0.0006482675671577454, -0.0006245970726013184, -0.0006009265780448914, -0.0005772560834884644, -0.0005535855889320374, -0.0005299150943756104, -0.0005062445998191833, -0.00048257410526275635, -0.00045890361070632935, -0.00043523311614990234, -0.00041156262159347534, -0.00038789212703704834, -0.00036422163248062134, -0.00034055113792419434, -0.00031688064336776733, -0.00029321014881134033, -0.00026953965425491333, -0.00024586915969848633, -0.00022219866514205933, -0.00019852817058563232, -0.00017485767602920532, -0.00015118718147277832, -0.00012751668691635132, -0.00010384619235992432, -8.017569780349731e-05, -5.650520324707031e-05, -3.283470869064331e-05, -9.164214134216309e-06, 1.4506280422210693e-05, 3.8176774978637695e-05, 6.18472695350647e-05, 8.55177640914917e-05, 0.0001091882586479187, 0.0001328587532043457, 0.0001565292477607727, 0.0001801997423171997, 0.0002038702368736267, 0.0002275407314300537, 0.0002512112259864807, 0.0002748817205429077, 0.0002985522150993347, 0.0003222227096557617, 0.0003458932042121887, 0.0003695636987686157, 0.0003932341933250427, 0.0004169046878814697, 0.00044057518243789673, 0.00046424567699432373, 0.00048791617155075073, 0.0005115866661071777, 0.0005352571606636047, 0.0005589276552200317, 0.0005825981497764587, 0.0006062686443328857, 0.0006299391388893127, 0.0006536096334457397, 0.0006772801280021667, 0.0007009506225585938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 11.0, 15.0, 18.0, 20.0, 40.0, 41.0, 80.0, 133.0, 251.0, 602.0, 3234.0, 1037664.0, 5091.0, 679.0, 228.0, 115.0, 77.0, 60.0, 36.0, 31.0, 16.0, 15.0, 6.0, 15.0, 9.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.017578125, -0.01702094078063965, -0.016463756561279297, -0.015906572341918945, -0.015349388122558594, -0.014792203903198242, -0.01423501968383789, -0.013677835464477539, -0.013120651245117188, -0.012563467025756836, -0.012006282806396484, -0.011449098587036133, -0.010891914367675781, -0.01033473014831543, -0.009777545928955078, -0.009220361709594727, -0.008663177490234375, -0.008105993270874023, -0.007548809051513672, -0.00699162483215332, -0.006434440612792969, -0.005877256393432617, -0.005320072174072266, -0.004762887954711914, -0.0042057037353515625, -0.003648519515991211, -0.0030913352966308594, -0.002534151077270508, -0.0019769668579101562, -0.0014197826385498047, -0.0008625984191894531, -0.00030541419982910156, 0.00025177001953125, 0.0008089542388916016, 0.0013661384582519531, 0.0019233226776123047, 0.0024805068969726562, 0.003037691116333008, 0.0035948753356933594, 0.004152059555053711, 0.0047092437744140625, 0.005266427993774414, 0.005823612213134766, 0.006380796432495117, 0.006937980651855469, 0.00749516487121582, 0.008052349090576172, 0.008609533309936523, 0.009166717529296875, 0.009723901748657227, 0.010281085968017578, 0.01083827018737793, 0.011395454406738281, 0.011952638626098633, 0.012509822845458984, 0.013067007064819336, 0.013624191284179688, 0.014181375503540039, 0.01473855972290039, 0.015295743942260742, 0.015852928161621094, 0.016410112380981445, 0.016967296600341797, 0.01752448081970215, 0.0180816650390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 231.0, 734.0, 47.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005053344066254795, -0.0004097155178897083, -0.0003140966291539371, -0.00021847771131433547, -0.00012285882257856429, -2.7239933842793107e-05, 6.837898399680853e-05, 0.0001639978727325797, 0.0002596167614683509, 0.00035523565020412207, 0.00045085453893989325, 0.0005464734276756644, 0.0006420923164114356, 0.0007377112051472068, 0.0008333301520906389, 0.0009289490408264101, 0.0010245679877698421, 0.0011201868765056133, 0.0012158057652413845, 0.0013114246539771557, 0.0014070435427129269, 0.001502662431448698, 0.0015982813201844692, 0.0016939002089202404, 0.0017895190976560116, 0.0018851379863917828, 0.001980756875127554, 0.002076375763863325, 0.0021719946525990963, 0.0022676135413348675, 0.0023632324300706387, 0.00245885131880641, 0.0025544704403728247, 0.002650089329108596, 0.002745708217844367, 0.002841327106580138, 0.0029369459953159094, 0.0030325648840516806, 0.0031281837727874517, 0.003223802661523223, 0.003319421550258994, 0.0034150404389947653, 0.0035106593277305365, 0.0036062782164663076, 0.003701897105202079, 0.00379751599393785, 0.003893134882673621, 0.003988754004240036, 0.004084372892975807, 0.004179991781711578, 0.0042756106704473495, 0.004371229559183121, 0.004466848447918892, 0.004562467336654663, 0.004658086225390434, 0.0047537051141262054, 0.004849324002861977, 0.004944942891597748, 0.005040561780333519, 0.00513618066906929, 0.005231799557805061, 0.0053274184465408325, 0.005423037335276604, 0.005518656224012375, 0.005614275112748146]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 1.0, 2.0, 9.0, 8.0, 8.0, 9.0, 9.0, 16.0, 12.0, 22.0, 19.0, 25.0, 31.0, 39.0, 35.0, 35.0, 32.0, 24.0, 34.0, 40.0, 33.0, 36.0, 54.0, 54.0, 41.0, 32.0, 35.0, 39.0, 27.0, 21.0, 23.0, 22.0, 17.0, 28.0, 17.0, 12.0, 17.0, 13.0, 8.0, 9.0, 11.0, 5.0, 9.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00034803152084350586, -0.00033771153539419174, -0.0003273915499448776, -0.0003170715644955635, -0.0003067515790462494, -0.00029643159359693527, -0.00028611160814762115, -0.00027579162269830704, -0.0002654716372489929, -0.0002551516517996788, -0.0002448316663503647, -0.00023451168090105057, -0.00022419169545173645, -0.00021387171000242233, -0.00020355172455310822, -0.0001932317391037941, -0.00018291175365447998, -0.00017259176820516586, -0.00016227178275585175, -0.00015195179730653763, -0.0001416318118572235, -0.0001313118264079094, -0.00012099184095859528, -0.00011067185550928116, -0.00010035187005996704, -9.003188461065292e-05, -7.97118991613388e-05, -6.939191371202469e-05, -5.907192826271057e-05, -4.8751942813396454e-05, -3.8431957364082336e-05, -2.811197191476822e-05, -1.77919864654541e-05, -7.472001016139984e-06, 2.8479844331741333e-06, 1.316796988248825e-05, 2.3487955331802368e-05, 3.3807940781116486e-05, 4.41279262304306e-05, 5.444791167974472e-05, 6.476789712905884e-05, 7.508788257837296e-05, 8.540786802768707e-05, 9.572785347700119e-05, 0.00010604783892631531, 0.00011636782437562943, 0.00012668780982494354, 0.00013700779527425766, 0.00014732778072357178, 0.0001576477661728859, 0.0001679677516222, 0.00017828773707151413, 0.00018860772252082825, 0.00019892770797014236, 0.00020924769341945648, 0.0002195676788687706, 0.00022988766431808472, 0.00024020764976739883, 0.00025052763521671295, 0.00026084762066602707, 0.0002711676061153412, 0.0002814875915646553, 0.0002918075770139694, 0.00030212756246328354, 0.00031244754791259766]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 16.0, 14.0, 23.0, 18.0, 30.0, 24.0, 28.0, 35.0, 36.0, 33.0, 42.0, 46.0, 50.0, 44.0, 41.0, 45.0, 50.0, 38.0, 34.0, 41.0, 40.0, 37.0, 37.0, 31.0, 27.0, 26.0, 18.0, 13.0, 11.0, 11.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.40625, -7.18658447265625, -6.9669189453125, -6.74725341796875, -6.527587890625, -6.30792236328125, -6.0882568359375, -5.86859130859375, -5.64892578125, -5.42926025390625, -5.2095947265625, -4.98992919921875, -4.770263671875, -4.55059814453125, -4.3309326171875, -4.11126708984375, -3.8916015625, -3.67193603515625, -3.4522705078125, -3.23260498046875, -3.012939453125, -2.79327392578125, -2.5736083984375, -2.35394287109375, -2.13427734375, -1.91461181640625, -1.6949462890625, -1.47528076171875, -1.255615234375, -1.03594970703125, -0.8162841796875, -0.59661865234375, -0.376953125, -0.15728759765625, 0.0623779296875, 0.28204345703125, 0.501708984375, 0.72137451171875, 0.9410400390625, 1.16070556640625, 1.38037109375, 1.60003662109375, 1.8197021484375, 2.03936767578125, 2.259033203125, 2.47869873046875, 2.6983642578125, 2.91802978515625, 3.1376953125, 3.35736083984375, 3.5770263671875, 3.79669189453125, 4.016357421875, 4.23602294921875, 4.4556884765625, 4.67535400390625, 4.89501953125, 5.11468505859375, 5.3343505859375, 5.55401611328125, 5.773681640625, 5.99334716796875, 6.2130126953125, 6.43267822265625, 6.65234375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 4.0, 6.0, 10.0, 13.0, 15.0, 35.0, 28.0, 52.0, 47.0, 86.0, 107.0, 177.0, 235.0, 363.0, 543.0, 940.0, 1699.0, 3707.0, 9049.0, 23893.0, 69892.0, 207955.0, 466905.0, 170120.0, 57509.0, 20433.0, 7543.0, 3199.0, 1536.0, 851.0, 491.0, 314.0, 241.0, 165.0, 103.0, 68.0, 61.0, 51.0, 32.0, 21.0, 16.0, 4.0, 8.0, 9.0, 10.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.453125, -5.2899169921875, -5.126708984375, -4.9635009765625, -4.80029296875, -4.6370849609375, -4.473876953125, -4.3106689453125, -4.1474609375, -3.9842529296875, -3.821044921875, -3.6578369140625, -3.49462890625, -3.3314208984375, -3.168212890625, -3.0050048828125, -2.841796875, -2.6785888671875, -2.515380859375, -2.3521728515625, -2.18896484375, -2.0257568359375, -1.862548828125, -1.6993408203125, -1.5361328125, -1.3729248046875, -1.209716796875, -1.0465087890625, -0.88330078125, -0.7200927734375, -0.556884765625, -0.3936767578125, -0.23046875, -0.0672607421875, 0.095947265625, 0.2591552734375, 0.42236328125, 0.5855712890625, 0.748779296875, 0.9119873046875, 1.0751953125, 1.2384033203125, 1.401611328125, 1.5648193359375, 1.72802734375, 1.8912353515625, 2.054443359375, 2.2176513671875, 2.380859375, 2.5440673828125, 2.707275390625, 2.8704833984375, 3.03369140625, 3.1968994140625, 3.360107421875, 3.5233154296875, 3.6865234375, 3.8497314453125, 4.012939453125, 4.1761474609375, 4.33935546875, 4.5025634765625, 4.665771484375, 4.8289794921875, 4.9921875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 8.0, 15.0, 13.0, 14.0, 13.0, 18.0, 28.0, 20.0, 26.0, 26.0, 37.0, 36.0, 38.0, 57.0, 80.0, 74.0, 317.0, 1597.0, 125.0, 70.0, 57.0, 59.0, 37.0, 45.0, 37.0, 28.0, 25.0, 23.0, 16.0, 20.0, 10.0, 8.0, 11.0, 11.0, 3.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.46875, -23.792236328125, -23.11572265625, -22.439208984375, -21.7626953125, -21.086181640625, -20.40966796875, -19.733154296875, -19.056640625, -18.380126953125, -17.70361328125, -17.027099609375, -16.3505859375, -15.674072265625, -14.99755859375, -14.321044921875, -13.64453125, -12.968017578125, -12.29150390625, -11.614990234375, -10.9384765625, -10.261962890625, -9.58544921875, -8.908935546875, -8.232421875, -7.555908203125, -6.87939453125, -6.202880859375, -5.5263671875, -4.849853515625, -4.17333984375, -3.496826171875, -2.8203125, -2.143798828125, -1.46728515625, -0.790771484375, -0.1142578125, 0.562255859375, 1.23876953125, 1.915283203125, 2.591796875, 3.268310546875, 3.94482421875, 4.621337890625, 5.2978515625, 5.974365234375, 6.65087890625, 7.327392578125, 8.00390625, 8.680419921875, 9.35693359375, 10.033447265625, 10.7099609375, 11.386474609375, 12.06298828125, 12.739501953125, 13.416015625, 14.092529296875, 14.76904296875, 15.445556640625, 16.1220703125, 16.798583984375, 17.47509765625, 18.151611328125, 18.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 20.0, 16.0, 19.0, 45.0, 53.0, 67.0, 105.0, 163.0, 217.0, 342.0, 694.0, 6205.0, 3121553.0, 14089.0, 876.0, 359.0, 227.0, 161.0, 124.0, 94.0, 54.0, 53.0, 30.0, 30.0, 26.0, 20.0, 14.0, 11.0, 4.0, 7.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-73.8125, -71.79443359375, -69.7763671875, -67.75830078125, -65.740234375, -63.72216796875, -61.7041015625, -59.68603515625, -57.66796875, -55.64990234375, -53.6318359375, -51.61376953125, -49.595703125, -47.57763671875, -45.5595703125, -43.54150390625, -41.5234375, -39.50537109375, -37.4873046875, -35.46923828125, -33.451171875, -31.43310546875, -29.4150390625, -27.39697265625, -25.37890625, -23.36083984375, -21.3427734375, -19.32470703125, -17.306640625, -15.28857421875, -13.2705078125, -11.25244140625, -9.234375, -7.21630859375, -5.1982421875, -3.18017578125, -1.162109375, 0.85595703125, 2.8740234375, 4.89208984375, 6.91015625, 8.92822265625, 10.9462890625, 12.96435546875, 14.982421875, 17.00048828125, 19.0185546875, 21.03662109375, 23.0546875, 25.07275390625, 27.0908203125, 29.10888671875, 31.126953125, 33.14501953125, 35.1630859375, 37.18115234375, 39.19921875, 41.21728515625, 43.2353515625, 45.25341796875, 47.271484375, 49.28955078125, 51.3076171875, 53.32568359375, 55.34375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 24.0, 117.0, 426.0, 339.0, 96.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.97565841674805, -46.39053726196289, -43.805416107177734, -41.22029113769531, -38.635169982910156, -36.050048828125, -33.464927673339844, -30.879804611206055, -28.2946834564209, -25.709562301635742, -23.124439239501953, -20.539318084716797, -17.95419692993164, -15.369073867797852, -12.783952713012695, -10.198829650878906, -7.61370849609375, -5.028586387634277, -2.443464756011963, 0.14165687561035156, 2.726778984069824, 5.311901092529297, 7.897022247314453, 10.482145309448242, 13.067266464233398, 15.652388572692871, 18.237510681152344, 20.8226318359375, 23.407752990722656, 25.992876052856445, 28.5779972076416, 31.16312026977539, 33.74823760986328, 36.33335876464844, 38.918479919433594, 41.50360107421875, 44.08872604370117, 46.67384719848633, 49.258968353271484, 51.844093322753906, 54.42921447753906, 57.01433563232422, 59.599456787109375, 62.18457794189453, 64.76969909667969, 67.35482788085938, 69.93994140625, 72.52507019042969, 75.11018371582031, 77.69530487060547, 80.28042602539062, 82.86554718017578, 85.45066833496094, 88.03579711914062, 90.62091064453125, 93.20603942871094, 95.7911605834961, 98.37628173828125, 100.9614028930664, 103.54652404785156, 106.13164520263672, 108.71676635742188, 111.30189514160156, 113.88701629638672, 116.47213745117188]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 7.0, 8.0, 8.0, 3.0, 7.0, 10.0, 13.0, 17.0, 15.0, 26.0, 20.0, 29.0, 21.0, 32.0, 36.0, 39.0, 39.0, 35.0, 35.0, 42.0, 41.0, 40.0, 28.0, 44.0, 52.0, 46.0, 26.0, 40.0, 27.0, 32.0, 22.0, 27.0, 24.0, 19.0, 12.0, 12.0, 16.0, 7.0, 9.0, 1.0, 11.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-63.36546325683594, -61.41703414916992, -59.46860885620117, -57.520179748535156, -55.571754455566406, -53.62332534790039, -51.674896240234375, -49.726470947265625, -47.77804183959961, -45.829612731933594, -43.881187438964844, -41.93275833129883, -39.98432922363281, -38.03590393066406, -36.08747482299805, -34.13904571533203, -32.19062042236328, -30.2421932220459, -28.293766021728516, -26.3453369140625, -24.396909713745117, -22.448482513427734, -20.50005340576172, -18.551626205444336, -16.603199005126953, -14.65477180480957, -12.706343650817871, -10.757915496826172, -8.809488296508789, -6.861061096191406, -4.912632942199707, -2.964204788208008, -1.015777587890625, 0.932650089263916, 2.881077766418457, 4.829505443572998, 6.777933120727539, 8.726360321044922, 10.674788475036621, 12.62321662902832, 14.571643829345703, 16.520071029663086, 18.46849822998047, 20.416927337646484, 22.365354537963867, 24.31378173828125, 26.262210845947266, 28.21063804626465, 30.15906524658203, 32.10749435424805, 34.0559196472168, 36.00434875488281, 37.95277404785156, 39.90120315551758, 41.849632263183594, 43.798057556152344, 45.74648666381836, 47.694915771484375, 49.643341064453125, 51.59177017211914, 53.540199279785156, 55.488624572753906, 57.43705368041992, 59.38548278808594, 61.33390808105469]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 17.0, 19.0, 21.0, 22.0, 16.0, 28.0, 20.0, 44.0, 30.0, 30.0, 41.0, 47.0, 48.0, 44.0, 50.0, 41.0, 34.0, 34.0, 38.0, 37.0, 37.0, 40.0, 41.0, 32.0, 28.0, 21.0, 20.0, 18.0, 20.0, 14.0, 9.0, 9.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.2109375, -6.98712158203125, -6.7633056640625, -6.53948974609375, -6.315673828125, -6.09185791015625, -5.8680419921875, -5.64422607421875, -5.42041015625, -5.19659423828125, -4.9727783203125, -4.74896240234375, -4.525146484375, -4.30133056640625, -4.0775146484375, -3.85369873046875, -3.6298828125, -3.40606689453125, -3.1822509765625, -2.95843505859375, -2.734619140625, -2.51080322265625, -2.2869873046875, -2.06317138671875, -1.83935546875, -1.61553955078125, -1.3917236328125, -1.16790771484375, -0.944091796875, -0.72027587890625, -0.4964599609375, -0.27264404296875, -0.048828125, 0.17498779296875, 0.3988037109375, 0.62261962890625, 0.846435546875, 1.07025146484375, 1.2940673828125, 1.51788330078125, 1.74169921875, 1.96551513671875, 2.1893310546875, 2.41314697265625, 2.636962890625, 2.86077880859375, 3.0845947265625, 3.30841064453125, 3.5322265625, 3.75604248046875, 3.9798583984375, 4.20367431640625, 4.427490234375, 4.65130615234375, 4.8751220703125, 5.09893798828125, 5.32275390625, 5.54656982421875, 5.7703857421875, 5.99420166015625, 6.218017578125, 6.44183349609375, 6.6656494140625, 6.88946533203125, 7.11328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 16.0, 11.0, 10.0, 17.0, 18.0, 24.0, 28.0, 23.0, 31.0, 40.0, 41.0, 72.0, 169.0, 553.0, 2700.0, 61131.0, 3086468.0, 1028382.0, 12504.0, 1251.0, 338.0, 106.0, 62.0, 41.0, 33.0, 35.0, 30.0, 12.0, 21.0, 23.0, 19.0, 11.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.171875, -24.3544921875, -23.537109375, -22.7197265625, -21.90234375, -21.0849609375, -20.267578125, -19.4501953125, -18.6328125, -17.8154296875, -16.998046875, -16.1806640625, -15.36328125, -14.5458984375, -13.728515625, -12.9111328125, -12.09375, -11.2763671875, -10.458984375, -9.6416015625, -8.82421875, -8.0068359375, -7.189453125, -6.3720703125, -5.5546875, -4.7373046875, -3.919921875, -3.1025390625, -2.28515625, -1.4677734375, -0.650390625, 0.1669921875, 0.984375, 1.8017578125, 2.619140625, 3.4365234375, 4.25390625, 5.0712890625, 5.888671875, 6.7060546875, 7.5234375, 8.3408203125, 9.158203125, 9.9755859375, 10.79296875, 11.6103515625, 12.427734375, 13.2451171875, 14.0625, 14.8798828125, 15.697265625, 16.5146484375, 17.33203125, 18.1494140625, 18.966796875, 19.7841796875, 20.6015625, 21.4189453125, 22.236328125, 23.0537109375, 23.87109375, 24.6884765625, 25.505859375, 26.3232421875, 27.140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 11.0, 7.0, 15.0, 19.0, 17.0, 32.0, 46.0, 43.0, 91.0, 103.0, 129.0, 168.0, 230.0, 320.0, 378.0, 442.0, 487.0, 385.0, 304.0, 218.0, 162.0, 123.0, 78.0, 64.0, 45.0, 46.0, 28.0, 20.0, 14.0, 10.0, 10.0, 5.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.071533203125, -10.65869140625, -10.245849609375, -9.8330078125, -9.420166015625, -9.00732421875, -8.594482421875, -8.181640625, -7.768798828125, -7.35595703125, -6.943115234375, -6.5302734375, -6.117431640625, -5.70458984375, -5.291748046875, -4.87890625, -4.466064453125, -4.05322265625, -3.640380859375, -3.2275390625, -2.814697265625, -2.40185546875, -1.989013671875, -1.576171875, -1.163330078125, -0.75048828125, -0.337646484375, 0.0751953125, 0.488037109375, 0.90087890625, 1.313720703125, 1.7265625, 2.139404296875, 2.55224609375, 2.965087890625, 3.3779296875, 3.790771484375, 4.20361328125, 4.616455078125, 5.029296875, 5.442138671875, 5.85498046875, 6.267822265625, 6.6806640625, 7.093505859375, 7.50634765625, 7.919189453125, 8.33203125, 8.744873046875, 9.15771484375, 9.570556640625, 9.9833984375, 10.396240234375, 10.80908203125, 11.221923828125, 11.634765625, 12.047607421875, 12.46044921875, 12.873291015625, 13.2861328125, 13.698974609375, 14.11181640625, 14.524658203125, 14.9375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 16.0, 18.0, 24.0, 23.0, 42.0, 51.0, 64.0, 82.0, 97.0, 139.0, 191.0, 237.0, 403.0, 732.0, 6149.0, 4022252.0, 160889.0, 1190.0, 476.0, 314.0, 206.0, 154.0, 121.0, 90.0, 73.0, 48.0, 38.0, 31.0, 29.0, 17.0, 13.0, 13.0, 14.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.59375, -60.48876953125, -58.3837890625, -56.27880859375, -54.173828125, -52.06884765625, -49.9638671875, -47.85888671875, -45.75390625, -43.64892578125, -41.5439453125, -39.43896484375, -37.333984375, -35.22900390625, -33.1240234375, -31.01904296875, -28.9140625, -26.80908203125, -24.7041015625, -22.59912109375, -20.494140625, -18.38916015625, -16.2841796875, -14.17919921875, -12.07421875, -9.96923828125, -7.8642578125, -5.75927734375, -3.654296875, -1.54931640625, 0.5556640625, 2.66064453125, 4.765625, 6.87060546875, 8.9755859375, 11.08056640625, 13.185546875, 15.29052734375, 17.3955078125, 19.50048828125, 21.60546875, 23.71044921875, 25.8154296875, 27.92041015625, 30.025390625, 32.13037109375, 34.2353515625, 36.34033203125, 38.4453125, 40.55029296875, 42.6552734375, 44.76025390625, 46.865234375, 48.97021484375, 51.0751953125, 53.18017578125, 55.28515625, 57.39013671875, 59.4951171875, 61.60009765625, 63.705078125, 65.81005859375, 67.9150390625, 70.02001953125, 72.125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 26.0, 204.0, 473.0, 267.0, 38.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.7817611694336, -80.40135955810547, -74.02095794677734, -67.64056396484375, -61.26015853881836, -54.879756927490234, -48.499359130859375, -42.11895751953125, -35.738555908203125, -29.358154296875, -22.977754592895508, -16.597354888916016, -10.21695327758789, -3.8365516662597656, 2.5438461303710938, 8.924247741699219, 15.304649353027344, 21.68505096435547, 28.06545066833496, 34.44585037231445, 40.82625198364258, 47.2066535949707, 53.58705139160156, 59.96745300292969, 66.34785461425781, 72.72825622558594, 79.10865783691406, 85.48905944824219, 91.86946105957031, 98.24986267089844, 104.63025665283203, 111.01065826416016, 117.39105224609375, 123.77145385742188, 130.15185546875, 136.53225708007812, 142.91265869140625, 149.29306030273438, 155.6734619140625, 162.05386352539062, 168.43426513671875, 174.81466674804688, 181.195068359375, 187.57546997070312, 193.95587158203125, 200.33627319335938, 206.7166748046875, 213.09707641601562, 219.4774627685547, 225.8578643798828, 232.23826599121094, 238.61866760253906, 244.9990692138672, 251.3794708251953, 257.7598571777344, 264.1402587890625, 270.5206604003906, 276.90106201171875, 283.2814636230469, 289.661865234375, 296.0422668457031, 302.42266845703125, 308.8030700683594, 315.1834716796875, 321.5638732910156]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 6.0, 12.0, 13.0, 17.0, 20.0, 17.0, 13.0, 29.0, 24.0, 23.0, 29.0, 35.0, 33.0, 29.0, 40.0, 39.0, 39.0, 28.0, 40.0, 41.0, 37.0, 32.0, 46.0, 41.0, 30.0, 32.0, 27.0, 30.0, 12.0, 36.0, 25.0, 22.0, 16.0, 5.0, 12.0, 11.0, 6.0, 7.0, 8.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.13287353515625, -38.885887145996094, -37.6389045715332, -36.39191818237305, -35.144935607910156, -33.89794921875, -32.650962829589844, -31.40397834777832, -30.156993865966797, -28.910009384155273, -27.66302490234375, -26.416038513183594, -25.16905403137207, -23.922069549560547, -22.67508316040039, -21.428098678588867, -20.181114196777344, -18.93412971496582, -17.687145233154297, -16.44015884399414, -15.193174362182617, -13.946189880371094, -12.699204444885254, -11.452219009399414, -10.20523452758789, -8.958250045776367, -7.711264610290527, -6.464279651641846, -5.217294692993164, -3.9703097343444824, -2.723324775695801, -1.476339340209961, -0.2293548583984375, 1.0176301002502441, 2.264615058898926, 3.5116000175476074, 4.758584976196289, 6.005569934844971, 7.252554893493652, 8.499540328979492, 9.746524810791016, 10.993509292602539, 12.240494728088379, 13.487480163574219, 14.734464645385742, 15.981449127197266, 17.228435516357422, 18.475419998168945, 19.72240447998047, 20.969388961791992, 22.216373443603516, 23.463359832763672, 24.710344314575195, 25.95732879638672, 27.204315185546875, 28.4512996673584, 29.698284149169922, 30.945268630981445, 32.19225311279297, 33.439239501953125, 34.68622589111328, 35.93320846557617, 37.18019485473633, 38.42717742919922, 39.674163818359375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 21.0, 32.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 10.0, 15.0, 11.0, 26.0, 34.0, 45.0, 93.0, 132.0, 163.0, 278.0, 359.0, 503.0, 746.0, 1191.0, 1588.0, 2343.0, 3371.0, 5073.0, 7756.0, 11658.0, 17886.0, 27850.0, 43930.0, 69396.0, 114518.0, 196334.0, 210764.0, 124608.0, 74774.0, 46853.0, 29598.0, 19131.0, 12575.0, 8177.0, 5334.0, 3716.0, 2416.0, 1658.0, 1124.0, 725.0, 549.0, 382.0, 265.0, 198.0, 132.0, 89.0, 63.0, 43.0, 32.0, 16.0, 6.0, 8.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.95849609375, -0.9286117553710938, -0.8987274169921875, -0.8688430786132812, -0.838958740234375, -0.8090744018554688, -0.7791900634765625, -0.7493057250976562, -0.71942138671875, -0.6895370483398438, -0.6596527099609375, -0.6297683715820312, -0.599884033203125, -0.5699996948242188, -0.5401153564453125, -0.5102310180664062, -0.4803466796875, -0.45046234130859375, -0.4205780029296875, -0.39069366455078125, -0.360809326171875, -0.33092498779296875, -0.3010406494140625, -0.27115631103515625, -0.24127197265625, -0.21138763427734375, -0.1815032958984375, -0.15161895751953125, -0.121734619140625, -0.09185028076171875, -0.0619659423828125, -0.03208160400390625, -0.002197265625, 0.02768707275390625, 0.0575714111328125, 0.08745574951171875, 0.117340087890625, 0.14722442626953125, 0.1771087646484375, 0.20699310302734375, 0.23687744140625, 0.26676177978515625, 0.2966461181640625, 0.32653045654296875, 0.356414794921875, 0.38629913330078125, 0.4161834716796875, 0.44606781005859375, 0.4759521484375, 0.5058364868164062, 0.5357208251953125, 0.5656051635742188, 0.595489501953125, 0.6253738403320312, 0.6552581787109375, 0.6851425170898438, 0.71502685546875, 0.7449111938476562, 0.7747955322265625, 0.8046798706054688, 0.834564208984375, 0.8644485473632812, 0.8943328857421875, 0.9242172241210938, 0.9541015625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 0.0, 3.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 12.0, 12.0, 17.0, 20.0, 18.0, 23.0, 32.0, 35.0, 36.0, 36.0, 33.0, 41.0, 35.0, 61.0, 35.0, 1077.0, 41.0, 42.0, 47.0, 40.0, 27.0, 50.0, 26.0, 26.0, 25.0, 25.0, 19.0, 17.0, 11.0, 14.0, 8.0, 13.0, 6.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.41015625, -4.27276611328125, -4.1353759765625, -3.99798583984375, -3.860595703125, -3.72320556640625, -3.5858154296875, -3.44842529296875, -3.31103515625, -3.17364501953125, -3.0362548828125, -2.89886474609375, -2.761474609375, -2.62408447265625, -2.4866943359375, -2.34930419921875, -2.2119140625, -2.07452392578125, -1.9371337890625, -1.79974365234375, -1.662353515625, -1.52496337890625, -1.3875732421875, -1.25018310546875, -1.11279296875, -0.97540283203125, -0.8380126953125, -0.70062255859375, -0.563232421875, -0.42584228515625, -0.2884521484375, -0.15106201171875, -0.013671875, 0.12371826171875, 0.2611083984375, 0.39849853515625, 0.535888671875, 0.67327880859375, 0.8106689453125, 0.94805908203125, 1.08544921875, 1.22283935546875, 1.3602294921875, 1.49761962890625, 1.635009765625, 1.77239990234375, 1.9097900390625, 2.04718017578125, 2.1845703125, 2.32196044921875, 2.4593505859375, 2.59674072265625, 2.734130859375, 2.87152099609375, 3.0089111328125, 3.14630126953125, 3.28369140625, 3.42108154296875, 3.5584716796875, 3.69586181640625, 3.833251953125, 3.97064208984375, 4.1080322265625, 4.24542236328125, 4.3828125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 15.0, 20.0, 26.0, 47.0, 78.0, 120.0, 142.0, 252.0, 351.0, 507.0, 855.0, 1294.0, 2107.0, 3119.0, 4958.0, 7604.0, 12587.0, 20164.0, 34104.0, 58667.0, 107009.0, 209666.0, 1317679.0, 135846.0, 73397.0, 41919.0, 24468.0, 14898.0, 9211.0, 5696.0, 3616.0, 2314.0, 1574.0, 1021.0, 612.0, 396.0, 254.0, 174.0, 135.0, 68.0, 52.0, 44.0, 19.0, 19.0, 8.0, 8.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0498046875, -1.016143798828125, -0.98248291015625, -0.948822021484375, -0.9151611328125, -0.881500244140625, -0.84783935546875, -0.814178466796875, -0.780517578125, -0.746856689453125, -0.71319580078125, -0.679534912109375, -0.6458740234375, -0.612213134765625, -0.57855224609375, -0.544891357421875, -0.51123046875, -0.477569580078125, -0.44390869140625, -0.410247802734375, -0.3765869140625, -0.342926025390625, -0.30926513671875, -0.275604248046875, -0.241943359375, -0.208282470703125, -0.17462158203125, -0.140960693359375, -0.1072998046875, -0.073638916015625, -0.03997802734375, -0.006317138671875, 0.02734375, 0.061004638671875, 0.09466552734375, 0.128326416015625, 0.1619873046875, 0.195648193359375, 0.22930908203125, 0.262969970703125, 0.296630859375, 0.330291748046875, 0.36395263671875, 0.397613525390625, 0.4312744140625, 0.464935302734375, 0.49859619140625, 0.532257080078125, 0.56591796875, 0.599578857421875, 0.63323974609375, 0.666900634765625, 0.7005615234375, 0.734222412109375, 0.76788330078125, 0.801544189453125, 0.835205078125, 0.868865966796875, 0.90252685546875, 0.936187744140625, 0.9698486328125, 1.003509521484375, 1.03717041015625, 1.070831298828125, 1.1044921875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 5.0, 15.0, 11.0, 16.0, 17.0, 21.0, 27.0, 26.0, 41.0, 32.0, 34.0, 49.0, 90.0, 70.0, 77.0, 54.0, 67.0, 55.0, 51.0, 49.0, 27.0, 25.0, 21.0, 16.0, 12.0, 10.0, 14.0, 6.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006728172302246094, -0.0006508305668830872, -0.0006288439035415649, -0.0006068572402000427, -0.0005848705768585205, -0.0005628839135169983, -0.0005408972501754761, -0.0005189105868339539, -0.0004969239234924316, -0.0004749372601509094, -0.0004529505968093872, -0.000430963933467865, -0.0004089772701263428, -0.00038699060678482056, -0.00036500394344329834, -0.0003430172801017761, -0.0003210306167602539, -0.0002990439534187317, -0.00027705729007720947, -0.00025507062673568726, -0.00023308396339416504, -0.00021109730005264282, -0.0001891106367111206, -0.0001671239733695984, -0.00014513731002807617, -0.00012315064668655396, -0.00010116398334503174, -7.917732000350952e-05, -5.7190656661987305e-05, -3.520399332046509e-05, -1.3217329978942871e-05, 8.769333362579346e-06, 3.075599670410156e-05, 5.274266004562378e-05, 7.4729323387146e-05, 9.671598672866821e-05, 0.00011870265007019043, 0.00014068931341171265, 0.00016267597675323486, 0.00018466264009475708, 0.0002066493034362793, 0.00022863596677780151, 0.00025062263011932373, 0.00027260929346084595, 0.00029459595680236816, 0.0003165826201438904, 0.0003385692834854126, 0.0003605559468269348, 0.00038254261016845703, 0.00040452927350997925, 0.00042651593685150146, 0.0004485026001930237, 0.0004704892635345459, 0.0004924759268760681, 0.0005144625902175903, 0.0005364492535591125, 0.0005584359169006348, 0.000580422580242157, 0.0006024092435836792, 0.0006243959069252014, 0.0006463825702667236, 0.0006683692336082458, 0.0006903558969497681, 0.0007123425602912903, 0.0007343292236328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 1.0, 8.0, 7.0, 6.0, 9.0, 10.0, 15.0, 10.0, 23.0, 28.0, 31.0, 40.0, 60.0, 89.0, 120.0, 252.0, 799.0, 9936.0, 1033213.0, 2591.0, 610.0, 230.0, 106.0, 80.0, 64.0, 34.0, 26.0, 38.0, 15.0, 22.0, 12.0, 15.0, 13.0, 7.0, 10.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.016326904296875, -0.015822649002075195, -0.01531839370727539, -0.014814138412475586, -0.014309883117675781, -0.013805627822875977, -0.013301372528076172, -0.012797117233276367, -0.012292861938476562, -0.011788606643676758, -0.011284351348876953, -0.010780096054077148, -0.010275840759277344, -0.009771585464477539, -0.009267330169677734, -0.00876307487487793, -0.008258819580078125, -0.00775456428527832, -0.007250308990478516, -0.006746053695678711, -0.006241798400878906, -0.0057375431060791016, -0.005233287811279297, -0.004729032516479492, -0.0042247772216796875, -0.003720521926879883, -0.003216266632080078, -0.0027120113372802734, -0.0022077560424804688, -0.001703500747680664, -0.0011992454528808594, -0.0006949901580810547, -0.00019073486328125, 0.0003135204315185547, 0.0008177757263183594, 0.001322031021118164, 0.0018262863159179688, 0.0023305416107177734, 0.002834796905517578, 0.003339052200317383, 0.0038433074951171875, 0.004347562789916992, 0.004851818084716797, 0.0053560733795166016, 0.005860328674316406, 0.006364583969116211, 0.006868839263916016, 0.00737309455871582, 0.007877349853515625, 0.00838160514831543, 0.008885860443115234, 0.009390115737915039, 0.009894371032714844, 0.010398626327514648, 0.010902881622314453, 0.011407136917114258, 0.011911392211914062, 0.012415647506713867, 0.012919902801513672, 0.013424158096313477, 0.013928413391113281, 0.014432668685913086, 0.01493692398071289, 0.015441179275512695, 0.0159454345703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 14.0, 81.0, 199.0, 341.0, 241.0, 99.0, 26.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013728872872889042, -0.0013427898520603776, -0.001312692416831851, -0.0012825950980186462, -0.0012524976627901196, -0.001222400227561593, -0.0011923027923330665, -0.0011622053571045399, -0.0011321079218760133, -0.0011020104866474867, -0.00107191305141896, -0.0010418156161904335, -0.0010117182973772287, -0.0009816208621487021, -0.0009515234269201756, -0.000921425991691649, -0.0008913286728784442, -0.0008612312376499176, -0.0008311338606290519, -0.0008010364254005253, -0.0007709389901719987, -0.0007408416131511331, -0.0007107441779226065, -0.0006806467426940799, -0.0006505493074655533, -0.0006204518722370267, -0.000590354495216161, -0.0005602570599876344, -0.0005301596247591078, -0.0005000622477382421, -0.00046996481250971556, -0.0004398674063850194, -0.0004097700002603233, -0.00037967259413562715, -0.00034957515890710056, -0.0003194777527824044, -0.0002893803466577083, -0.00025928294053301215, -0.00022918550530448556, -0.00019908809917978942, -0.00016899067850317806, -0.0001388932578265667, -0.00010879585170187056, -7.86984310252592e-05, -4.860101762460545e-05, -1.8503604223951697e-05, 1.1593816452659667e-05, 4.16912225773558e-05, 7.178864325396717e-05, 0.00010188605665462092, 0.00013198347005527467, 0.00016208089073188603, 0.00019217829685658216, 0.00022227571753319353, 0.0002523731382098049, 0.00028247054433450103, 0.0003125679795630276, 0.00034266538568772376, 0.00037276282091625035, 0.0004028602270409465, 0.0004329576331656426, 0.00046305503929033875, 0.0004931524745188653, 0.000523249851539731, 0.0005533472867682576]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 6.0, 4.0, 5.0, 2.0, 3.0, 9.0, 13.0, 11.0, 11.0, 15.0, 18.0, 25.0, 26.0, 18.0, 30.0, 25.0, 26.0, 29.0, 37.0, 27.0, 44.0, 38.0, 41.0, 56.0, 40.0, 39.0, 32.0, 37.0, 25.0, 26.0, 16.0, 19.0, 34.0, 21.0, 28.0, 25.0, 21.0, 15.0, 15.0, 17.0, 11.0, 6.0, 17.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0003209710121154785, -0.0003109695389866829, -0.00030096806585788727, -0.00029096659272909164, -0.000280965119600296, -0.0002709636464715004, -0.0002609621733427048, -0.00025096070021390915, -0.00024095922708511353, -0.0002309577539563179, -0.00022095628082752228, -0.00021095480769872665, -0.00020095333456993103, -0.0001909518614411354, -0.00018095038831233978, -0.00017094891518354416, -0.00016094744205474854, -0.0001509459689259529, -0.0001409444957971573, -0.00013094302266836166, -0.00012094154953956604, -0.00011094007641077042, -0.00010093860328197479, -9.093713015317917e-05, -8.093565702438354e-05, -7.093418389558792e-05, -6.09327107667923e-05, -5.0931237637996674e-05, -4.092976450920105e-05, -3.0928291380405426e-05, -2.0926818251609802e-05, -1.0925345122814178e-05, -9.238719940185547e-07, 9.077601134777069e-06, 1.9079074263572693e-05, 2.9080547392368317e-05, 3.908202052116394e-05, 4.9083493649959564e-05, 5.908496677875519e-05, 6.908643990755081e-05, 7.908791303634644e-05, 8.908938616514206e-05, 9.909085929393768e-05, 0.00010909233242273331, 0.00011909380555152893, 0.00012909527868032455, 0.00013909675180912018, 0.0001490982249379158, 0.00015909969806671143, 0.00016910117119550705, 0.00017910264432430267, 0.0001891041174530983, 0.00019910559058189392, 0.00020910706371068954, 0.00021910853683948517, 0.0002291100099682808, 0.00023911148309707642, 0.00024911295622587204, 0.00025911442935466766, 0.0002691159024834633, 0.0002791173756122589, 0.00028911884874105453, 0.00029912032186985016, 0.0003091217949986458, 0.0003191232681274414]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 4.0, 11.0, 15.0, 13.0, 24.0, 22.0, 31.0, 19.0, 33.0, 26.0, 44.0, 29.0, 41.0, 48.0, 41.0, 41.0, 32.0, 43.0, 43.0, 39.0, 36.0, 33.0, 42.0, 30.0, 30.0, 47.0, 33.0, 25.0, 13.0, 15.0, 14.0, 13.0, 12.0, 7.0, 11.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.84375, -6.6307373046875, -6.417724609375, -6.2047119140625, -5.99169921875, -5.7786865234375, -5.565673828125, -5.3526611328125, -5.1396484375, -4.9266357421875, -4.713623046875, -4.5006103515625, -4.28759765625, -4.0745849609375, -3.861572265625, -3.6485595703125, -3.435546875, -3.2225341796875, -3.009521484375, -2.7965087890625, -2.58349609375, -2.3704833984375, -2.157470703125, -1.9444580078125, -1.7314453125, -1.5184326171875, -1.305419921875, -1.0924072265625, -0.87939453125, -0.6663818359375, -0.453369140625, -0.2403564453125, -0.02734375, 0.1856689453125, 0.398681640625, 0.6116943359375, 0.82470703125, 1.0377197265625, 1.250732421875, 1.4637451171875, 1.6767578125, 1.8897705078125, 2.102783203125, 2.3157958984375, 2.52880859375, 2.7418212890625, 2.954833984375, 3.1678466796875, 3.380859375, 3.5938720703125, 3.806884765625, 4.0198974609375, 4.23291015625, 4.4459228515625, 4.658935546875, 4.8719482421875, 5.0849609375, 5.2979736328125, 5.510986328125, 5.7239990234375, 5.93701171875, 6.1500244140625, 6.363037109375, 6.5760498046875, 6.7890625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 32.0, 49.0, 73.0, 91.0, 131.0, 138.0, 227.0, 404.0, 658.0, 1118.0, 1902.0, 3429.0, 6830.0, 14724.0, 35121.0, 93736.0, 283319.0, 387929.0, 132503.0, 47770.0, 19549.0, 8787.0, 4395.0, 2235.0, 1255.0, 709.0, 444.0, 306.0, 195.0, 116.0, 101.0, 70.0, 40.0, 31.0, 25.0, 20.0, 18.0, 10.0, 3.0, 4.0, 5.0, 0.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.12109375, -4.97119140625, -4.8212890625, -4.67138671875, -4.521484375, -4.37158203125, -4.2216796875, -4.07177734375, -3.921875, -3.77197265625, -3.6220703125, -3.47216796875, -3.322265625, -3.17236328125, -3.0224609375, -2.87255859375, -2.72265625, -2.57275390625, -2.4228515625, -2.27294921875, -2.123046875, -1.97314453125, -1.8232421875, -1.67333984375, -1.5234375, -1.37353515625, -1.2236328125, -1.07373046875, -0.923828125, -0.77392578125, -0.6240234375, -0.47412109375, -0.32421875, -0.17431640625, -0.0244140625, 0.12548828125, 0.275390625, 0.42529296875, 0.5751953125, 0.72509765625, 0.875, 1.02490234375, 1.1748046875, 1.32470703125, 1.474609375, 1.62451171875, 1.7744140625, 1.92431640625, 2.07421875, 2.22412109375, 2.3740234375, 2.52392578125, 2.673828125, 2.82373046875, 2.9736328125, 3.12353515625, 3.2734375, 3.42333984375, 3.5732421875, 3.72314453125, 3.873046875, 4.02294921875, 4.1728515625, 4.32275390625, 4.47265625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 14.0, 12.0, 10.0, 16.0, 18.0, 29.0, 21.0, 23.0, 23.0, 47.0, 35.0, 51.0, 45.0, 56.0, 93.0, 316.0, 1582.0, 123.0, 94.0, 57.0, 47.0, 38.0, 39.0, 33.0, 34.0, 32.0, 23.0, 15.0, 27.0, 10.0, 14.0, 8.0, 7.0, 7.0, 9.0, 6.0, 1.0, 1.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.484375, -21.80712890625, -21.1298828125, -20.45263671875, -19.775390625, -19.09814453125, -18.4208984375, -17.74365234375, -17.06640625, -16.38916015625, -15.7119140625, -15.03466796875, -14.357421875, -13.68017578125, -13.0029296875, -12.32568359375, -11.6484375, -10.97119140625, -10.2939453125, -9.61669921875, -8.939453125, -8.26220703125, -7.5849609375, -6.90771484375, -6.23046875, -5.55322265625, -4.8759765625, -4.19873046875, -3.521484375, -2.84423828125, -2.1669921875, -1.48974609375, -0.8125, -0.13525390625, 0.5419921875, 1.21923828125, 1.896484375, 2.57373046875, 3.2509765625, 3.92822265625, 4.60546875, 5.28271484375, 5.9599609375, 6.63720703125, 7.314453125, 7.99169921875, 8.6689453125, 9.34619140625, 10.0234375, 10.70068359375, 11.3779296875, 12.05517578125, 12.732421875, 13.40966796875, 14.0869140625, 14.76416015625, 15.44140625, 16.11865234375, 16.7958984375, 17.47314453125, 18.150390625, 18.82763671875, 19.5048828125, 20.18212890625, 20.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 12.0, 13.0, 32.0, 54.0, 95.0, 182.0, 273.0, 495.0, 1754.0, 3133674.0, 7738.0, 613.0, 311.0, 187.0, 109.0, 59.0, 36.0, 21.0, 20.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.875, -137.41015625, -133.9453125, -130.48046875, -127.015625, -123.55078125, -120.0859375, -116.62109375, -113.15625, -109.69140625, -106.2265625, -102.76171875, -99.296875, -95.83203125, -92.3671875, -88.90234375, -85.4375, -81.97265625, -78.5078125, -75.04296875, -71.578125, -68.11328125, -64.6484375, -61.18359375, -57.71875, -54.25390625, -50.7890625, -47.32421875, -43.859375, -40.39453125, -36.9296875, -33.46484375, -30.0, -26.53515625, -23.0703125, -19.60546875, -16.140625, -12.67578125, -9.2109375, -5.74609375, -2.28125, 1.18359375, 4.6484375, 8.11328125, 11.578125, 15.04296875, 18.5078125, 21.97265625, 25.4375, 28.90234375, 32.3671875, 35.83203125, 39.296875, 42.76171875, 46.2265625, 49.69140625, 53.15625, 56.62109375, 60.0859375, 63.55078125, 67.015625, 70.48046875, 73.9453125, 77.41015625, 80.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [4.0, 937.0, 80.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.38177490234375, -7.355345726013184, 2.671083450317383, 12.697513580322266, 22.723941802978516, 32.750370025634766, 42.77680206298828, 52.80323028564453, 62.82965850830078, 72.85608673095703, 82.88251495361328, 92.90895080566406, 102.93537902832031, 112.96180725097656, 122.98823547363281, 133.01466369628906, 143.0410919189453, 153.06752014160156, 163.0939483642578, 173.12037658691406, 183.1468048095703, 193.17323303222656, 203.19967651367188, 213.22610473632812, 223.25253295898438, 233.27896118164062, 243.30538940429688, 253.33181762695312, 263.3582458496094, 273.3846740722656, 283.4111022949219, 293.4375305175781, 303.4639587402344, 313.4903869628906, 323.5168151855469, 333.5432434082031, 343.5696716308594, 353.5960998535156, 363.6225280761719, 373.6489562988281, 383.6753845214844, 393.7018127441406, 403.7282409667969, 413.7546691894531, 423.7810974121094, 433.8075256347656, 443.8339538574219, 453.8603820800781, 463.8868408203125, 473.91326904296875, 483.939697265625, 493.96612548828125, 503.9925537109375, 514.0189819335938, 524.04541015625, 534.0718383789062, 544.0982666015625, 554.1246948242188, 564.151123046875, 574.1775512695312, 584.2039794921875, 594.2304077148438, 604.2568359375, 614.2832641601562, 624.3096923828125]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 8.0, 10.0, 14.0, 14.0, 14.0, 18.0, 20.0, 35.0, 25.0, 26.0, 30.0, 32.0, 29.0, 32.0, 45.0, 48.0, 43.0, 51.0, 43.0, 37.0, 45.0, 37.0, 35.0, 33.0, 32.0, 28.0, 31.0, 22.0, 23.0, 24.0, 12.0, 17.0, 10.0, 15.0, 14.0, 10.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.804561614990234, -57.924407958984375, -56.044254302978516, -54.164100646972656, -52.2839469909668, -50.40379333496094, -48.523643493652344, -46.64348602294922, -44.763336181640625, -42.883182525634766, -41.003028869628906, -39.12287521362305, -37.24272155761719, -35.36256790161133, -33.48241424560547, -31.602262496948242, -29.72210693359375, -27.84195327758789, -25.96179962158203, -24.081645965576172, -22.201492309570312, -20.321338653564453, -18.441186904907227, -16.561033248901367, -14.680879592895508, -12.800725936889648, -10.920572280883789, -9.040419578552246, -7.160265922546387, -5.280112266540527, -3.3999595642089844, -1.519805908203125, 0.3603477478027344, 2.2405011653900146, 4.120654582977295, 6.000807762145996, 7.8809614181518555, 9.761115074157715, 11.641267776489258, 13.521421432495117, 15.401575088500977, 17.281728744506836, 19.161882400512695, 21.042034149169922, 22.92218780517578, 24.80234146118164, 26.6824951171875, 28.56264877319336, 30.44280242919922, 32.32295608520508, 34.20310974121094, 36.0832633972168, 37.963417053222656, 39.843570709228516, 41.723724365234375, 43.60387420654297, 45.484031677246094, 47.36418533325195, 49.24433898925781, 51.12449264526367, 53.00464630126953, 54.88479995727539, 56.76495361328125, 58.645103454589844, 60.5252571105957]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 11.0, 6.0, 8.0, 16.0, 16.0, 17.0, 14.0, 21.0, 28.0, 30.0, 37.0, 42.0, 31.0, 43.0, 44.0, 41.0, 47.0, 42.0, 43.0, 37.0, 44.0, 33.0, 32.0, 33.0, 35.0, 33.0, 44.0, 36.0, 31.0, 16.0, 15.0, 8.0, 6.0, 16.0, 12.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12109375, -6.8931884765625, -6.665283203125, -6.4373779296875, -6.20947265625, -5.9815673828125, -5.753662109375, -5.5257568359375, -5.2978515625, -5.0699462890625, -4.842041015625, -4.6141357421875, -4.38623046875, -4.1583251953125, -3.930419921875, -3.7025146484375, -3.474609375, -3.2467041015625, -3.018798828125, -2.7908935546875, -2.56298828125, -2.3350830078125, -2.107177734375, -1.8792724609375, -1.6513671875, -1.4234619140625, -1.195556640625, -0.9676513671875, -0.73974609375, -0.5118408203125, -0.283935546875, -0.0560302734375, 0.171875, 0.3997802734375, 0.627685546875, 0.8555908203125, 1.08349609375, 1.3114013671875, 1.539306640625, 1.7672119140625, 1.9951171875, 2.2230224609375, 2.450927734375, 2.6788330078125, 2.90673828125, 3.1346435546875, 3.362548828125, 3.5904541015625, 3.818359375, 4.0462646484375, 4.274169921875, 4.5020751953125, 4.72998046875, 4.9578857421875, 5.185791015625, 5.4136962890625, 5.6416015625, 5.8695068359375, 6.097412109375, 6.3253173828125, 6.55322265625, 6.7811279296875, 7.009033203125, 7.2369384765625, 7.46484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 12.0, 12.0, 10.0, 19.0, 27.0, 21.0, 31.0, 43.0, 49.0, 87.0, 116.0, 279.0, 796.0, 3136.0, 34569.0, 1201812.0, 2781809.0, 161368.0, 7689.0, 1352.0, 414.0, 176.0, 102.0, 76.0, 48.0, 33.0, 29.0, 24.0, 24.0, 18.0, 13.0, 9.0, 10.0, 6.0, 9.0, 6.0, 3.0, 7.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.540283203125, -16.93994140625, -16.339599609375, -15.7392578125, -15.138916015625, -14.53857421875, -13.938232421875, -13.337890625, -12.737548828125, -12.13720703125, -11.536865234375, -10.9365234375, -10.336181640625, -9.73583984375, -9.135498046875, -8.53515625, -7.934814453125, -7.33447265625, -6.734130859375, -6.1337890625, -5.533447265625, -4.93310546875, -4.332763671875, -3.732421875, -3.132080078125, -2.53173828125, -1.931396484375, -1.3310546875, -0.730712890625, -0.13037109375, 0.469970703125, 1.0703125, 1.670654296875, 2.27099609375, 2.871337890625, 3.4716796875, 4.072021484375, 4.67236328125, 5.272705078125, 5.873046875, 6.473388671875, 7.07373046875, 7.674072265625, 8.2744140625, 8.874755859375, 9.47509765625, 10.075439453125, 10.67578125, 11.276123046875, 11.87646484375, 12.476806640625, 13.0771484375, 13.677490234375, 14.27783203125, 14.878173828125, 15.478515625, 16.078857421875, 16.67919921875, 17.279541015625, 17.8798828125, 18.480224609375, 19.08056640625, 19.680908203125, 20.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 13.0, 6.0, 3.0, 9.0, 17.0, 12.0, 28.0, 24.0, 33.0, 39.0, 34.0, 63.0, 73.0, 90.0, 108.0, 140.0, 184.0, 232.0, 269.0, 372.0, 364.0, 344.0, 286.0, 280.0, 238.0, 165.0, 125.0, 112.0, 90.0, 63.0, 65.0, 41.0, 32.0, 29.0, 22.0, 14.0, 14.0, 5.0, 9.0, 6.0, 6.0, 7.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5743408203125, -8.265869140625, -7.9573974609375, -7.64892578125, -7.3404541015625, -7.031982421875, -6.7235107421875, -6.4150390625, -6.1065673828125, -5.798095703125, -5.4896240234375, -5.18115234375, -4.8726806640625, -4.564208984375, -4.2557373046875, -3.947265625, -3.6387939453125, -3.330322265625, -3.0218505859375, -2.71337890625, -2.4049072265625, -2.096435546875, -1.7879638671875, -1.4794921875, -1.1710205078125, -0.862548828125, -0.5540771484375, -0.24560546875, 0.0628662109375, 0.371337890625, 0.6798095703125, 0.98828125, 1.2967529296875, 1.605224609375, 1.9136962890625, 2.22216796875, 2.5306396484375, 2.839111328125, 3.1475830078125, 3.4560546875, 3.7645263671875, 4.072998046875, 4.3814697265625, 4.68994140625, 4.9984130859375, 5.306884765625, 5.6153564453125, 5.923828125, 6.2322998046875, 6.540771484375, 6.8492431640625, 7.15771484375, 7.4661865234375, 7.774658203125, 8.0831298828125, 8.3916015625, 8.7000732421875, 9.008544921875, 9.3170166015625, 9.62548828125, 9.9339599609375, 10.242431640625, 10.5509033203125, 10.859375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 20.0, 25.0, 28.0, 38.0, 38.0, 78.0, 108.0, 117.0, 160.0, 195.0, 344.0, 641.0, 3144.0, 4060837.0, 126119.0, 894.0, 441.0, 254.0, 188.0, 148.0, 114.0, 73.0, 58.0, 46.0, 40.0, 29.0, 19.0, 20.0, 10.0, 7.0, 3.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.625, -81.21875, -78.8125, -76.40625, -74.0, -71.59375, -69.1875, -66.78125, -64.375, -61.96875, -59.5625, -57.15625, -54.75, -52.34375, -49.9375, -47.53125, -45.125, -42.71875, -40.3125, -37.90625, -35.5, -33.09375, -30.6875, -28.28125, -25.875, -23.46875, -21.0625, -18.65625, -16.25, -13.84375, -11.4375, -9.03125, -6.625, -4.21875, -1.8125, 0.59375, 3.0, 5.40625, 7.8125, 10.21875, 12.625, 15.03125, 17.4375, 19.84375, 22.25, 24.65625, 27.0625, 29.46875, 31.875, 34.28125, 36.6875, 39.09375, 41.5, 43.90625, 46.3125, 48.71875, 51.125, 53.53125, 55.9375, 58.34375, 60.75, 63.15625, 65.5625, 67.96875, 70.375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 17.0, 31.0, 31.0, 47.0, 59.0, 90.0, 85.0, 104.0, 91.0, 87.0, 76.0, 78.0, 66.0, 36.0, 31.0, 21.0, 10.0, 12.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.27195739746094, -32.10111999511719, -30.930282592773438, -29.759445190429688, -28.588607788085938, -27.417770385742188, -26.24693489074707, -25.07609748840332, -23.90526008605957, -22.73442268371582, -21.56358528137207, -20.39274787902832, -19.221912384033203, -18.051074981689453, -16.880237579345703, -15.709400177001953, -14.538562774658203, -13.367725372314453, -12.196887969970703, -11.02605152130127, -9.85521411895752, -8.68437671661377, -7.513539791107178, -6.342702865600586, -5.171865463256836, -4.001028060913086, -2.830191135406494, -1.6593539714813232, -0.48851680755615234, 0.6823205947875977, 1.8531575202941895, 3.0239944458007812, 4.194828033447266, 5.365665435791016, 6.536502361297607, 7.707339286804199, 8.87817668914795, 10.0490140914917, 11.219850540161133, 12.390687942504883, 13.561525344848633, 14.732362747192383, 15.903200149536133, 17.074037551879883, 18.244873046875, 19.41571044921875, 20.5865478515625, 21.75738525390625, 22.92822265625, 24.09906005859375, 25.2698974609375, 26.44073486328125, 27.611572265625, 28.78240966796875, 29.953245162963867, 31.124082565307617, 32.294921875, 33.46575927734375, 34.6365966796875, 35.80743408203125, 36.978271484375, 38.14910888671875, 39.3199462890625, 40.49078369140625, 41.661617279052734]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 10.0, 5.0, 9.0, 6.0, 11.0, 14.0, 12.0, 17.0, 17.0, 27.0, 25.0, 15.0, 29.0, 28.0, 38.0, 33.0, 31.0, 37.0, 49.0, 36.0, 33.0, 39.0, 47.0, 36.0, 47.0, 37.0, 29.0, 35.0, 24.0, 32.0, 28.0, 28.0, 25.0, 21.0, 11.0, 14.0, 16.0, 14.0, 7.0, 5.0, 5.0, 5.0, 6.0, 7.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.13691711425781, -37.85509490966797, -36.57327651977539, -35.29145431518555, -34.0096321105957, -32.72780990600586, -31.44599151611328, -30.164169311523438, -28.882347106933594, -27.600526809692383, -26.31870460510254, -25.036884307861328, -23.755062103271484, -22.473241806030273, -21.191421508789062, -19.90959930419922, -18.627779006958008, -17.345958709716797, -16.064136505126953, -14.782316207885742, -13.500494003295898, -12.218673706054688, -10.93685245513916, -9.655031204223633, -8.373209953308105, -7.091388702392578, -5.809567451477051, -4.527746677398682, -3.2459254264831543, -1.964104175567627, -0.6822834014892578, 0.5995378494262695, 1.8813591003417969, 3.163180351257324, 4.445001602172852, 5.726822376251221, 7.008643627166748, 8.290464401245117, 9.572285652160645, 10.854106903076172, 12.1359281539917, 13.417749404907227, 14.699570655822754, 15.981391906738281, 17.263212203979492, 18.545034408569336, 19.826854705810547, 21.10867691040039, 22.3904972076416, 23.672317504882812, 24.954139709472656, 26.235960006713867, 27.51778221130371, 28.799602508544922, 30.081424713134766, 31.363245010375977, 32.64506530761719, 33.92688751220703, 35.20870590209961, 36.49052810668945, 37.7723503112793, 39.05417251586914, 40.33599090576172, 41.61781311035156, 42.899635314941406]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 0.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 12.0, 10.0, 22.0, 42.0, 36.0, 74.0, 109.0, 172.0, 292.0, 463.0, 720.0, 1156.0, 1990.0, 3265.0, 5284.0, 8844.0, 15321.0, 26684.0, 47120.0, 85639.0, 162992.0, 283631.0, 185092.0, 95783.0, 52748.0, 29515.0, 16812.0, 9780.0, 5862.0, 3493.0, 2084.0, 1284.0, 825.0, 482.0, 336.0, 188.0, 129.0, 91.0, 56.0, 37.0, 25.0, 15.0, 12.0, 18.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.3193359375, -1.280059814453125, -1.24078369140625, -1.201507568359375, -1.1622314453125, -1.122955322265625, -1.08367919921875, -1.044403076171875, -1.005126953125, -0.965850830078125, -0.92657470703125, -0.887298583984375, -0.8480224609375, -0.808746337890625, -0.76947021484375, -0.730194091796875, -0.69091796875, -0.651641845703125, -0.61236572265625, -0.573089599609375, -0.5338134765625, -0.494537353515625, -0.45526123046875, -0.415985107421875, -0.376708984375, -0.337432861328125, -0.29815673828125, -0.258880615234375, -0.2196044921875, -0.180328369140625, -0.14105224609375, -0.101776123046875, -0.0625, -0.023223876953125, 0.01605224609375, 0.055328369140625, 0.0946044921875, 0.133880615234375, 0.17315673828125, 0.212432861328125, 0.251708984375, 0.290985107421875, 0.33026123046875, 0.369537353515625, 0.4088134765625, 0.448089599609375, 0.48736572265625, 0.526641845703125, 0.56591796875, 0.605194091796875, 0.64447021484375, 0.683746337890625, 0.7230224609375, 0.762298583984375, 0.80157470703125, 0.840850830078125, 0.880126953125, 0.919403076171875, 0.95867919921875, 0.997955322265625, 1.0372314453125, 1.076507568359375, 1.11578369140625, 1.155059814453125, 1.1943359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 5.0, 7.0, 12.0, 7.0, 14.0, 13.0, 14.0, 20.0, 19.0, 24.0, 24.0, 29.0, 30.0, 31.0, 28.0, 36.0, 29.0, 25.0, 50.0, 33.0, 1061.0, 56.0, 51.0, 39.0, 41.0, 42.0, 29.0, 27.0, 37.0, 17.0, 24.0, 19.0, 21.0, 19.0, 9.0, 18.0, 16.0, 9.0, 7.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.67169189453125, -3.5465087890625, -3.42132568359375, -3.296142578125, -3.17095947265625, -3.0457763671875, -2.92059326171875, -2.79541015625, -2.67022705078125, -2.5450439453125, -2.41986083984375, -2.294677734375, -2.16949462890625, -2.0443115234375, -1.91912841796875, -1.7939453125, -1.66876220703125, -1.5435791015625, -1.41839599609375, -1.293212890625, -1.16802978515625, -1.0428466796875, -0.91766357421875, -0.79248046875, -0.66729736328125, -0.5421142578125, -0.41693115234375, -0.291748046875, -0.16656494140625, -0.0413818359375, 0.08380126953125, 0.208984375, 0.33416748046875, 0.4593505859375, 0.58453369140625, 0.709716796875, 0.83489990234375, 0.9600830078125, 1.08526611328125, 1.21044921875, 1.33563232421875, 1.4608154296875, 1.58599853515625, 1.711181640625, 1.83636474609375, 1.9615478515625, 2.08673095703125, 2.2119140625, 2.33709716796875, 2.4622802734375, 2.58746337890625, 2.712646484375, 2.83782958984375, 2.9630126953125, 3.08819580078125, 3.21337890625, 3.33856201171875, 3.4637451171875, 3.58892822265625, 3.714111328125, 3.83929443359375, 3.9644775390625, 4.08966064453125, 4.21484375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 12.0, 4.0, 9.0, 21.0, 28.0, 38.0, 56.0, 98.0, 139.0, 210.0, 315.0, 411.0, 636.0, 858.0, 1263.0, 1948.0, 2850.0, 4228.0, 6351.0, 9725.0, 14716.0, 22595.0, 35422.0, 57620.0, 95504.0, 173869.0, 1296970.0, 146503.0, 83497.0, 50449.0, 31439.0, 19929.0, 13267.0, 8578.0, 5797.0, 3756.0, 2492.0, 1715.0, 1206.0, 847.0, 562.0, 373.0, 262.0, 172.0, 136.0, 79.0, 65.0, 37.0, 20.0, 23.0, 18.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9287109375, -0.9000167846679688, -0.8713226318359375, -0.8426284790039062, -0.813934326171875, -0.7852401733398438, -0.7565460205078125, -0.7278518676757812, -0.69915771484375, -0.6704635620117188, -0.6417694091796875, -0.6130752563476562, -0.584381103515625, -0.5556869506835938, -0.5269927978515625, -0.49829864501953125, -0.4696044921875, -0.44091033935546875, -0.4122161865234375, -0.38352203369140625, -0.354827880859375, -0.32613372802734375, -0.2974395751953125, -0.26874542236328125, -0.24005126953125, -0.21135711669921875, -0.1826629638671875, -0.15396881103515625, -0.125274658203125, -0.09658050537109375, -0.0678863525390625, -0.03919219970703125, -0.010498046875, 0.01819610595703125, 0.0468902587890625, 0.07558441162109375, 0.104278564453125, 0.13297271728515625, 0.1616668701171875, 0.19036102294921875, 0.21905517578125, 0.24774932861328125, 0.2764434814453125, 0.30513763427734375, 0.333831787109375, 0.36252593994140625, 0.3912200927734375, 0.41991424560546875, 0.4486083984375, 0.47730255126953125, 0.5059967041015625, 0.5346908569335938, 0.563385009765625, 0.5920791625976562, 0.6207733154296875, 0.6494674682617188, 0.67816162109375, 0.7068557739257812, 0.7355499267578125, 0.7642440795898438, 0.792938232421875, 0.8216323852539062, 0.8503265380859375, 0.8790206909179688, 0.90771484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 10.0, 12.0, 15.0, 20.0, 16.0, 31.0, 41.0, 39.0, 56.0, 67.0, 77.0, 75.0, 78.0, 77.0, 61.0, 56.0, 44.0, 44.0, 25.0, 30.0, 20.0, 19.0, 16.0, 6.0, 10.0, 10.0, 9.0, 6.0, 1.0, 4.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.0007271766662597656, -0.0007058605551719666, -0.0006845444440841675, -0.0006632283329963684, -0.0006419122219085693, -0.0006205961108207703, -0.0005992799997329712, -0.0005779638886451721, -0.000556647777557373, -0.000535331666469574, -0.0005140155553817749, -0.0004926994442939758, -0.00047138333320617676, -0.0004500672221183777, -0.0004287511110305786, -0.00040743499994277954, -0.00038611888885498047, -0.0003648027777671814, -0.0003434866666793823, -0.00032217055559158325, -0.0003008544445037842, -0.0002795383334159851, -0.00025822222232818604, -0.00023690611124038696, -0.0002155900001525879, -0.00019427388906478882, -0.00017295777797698975, -0.00015164166688919067, -0.0001303255558013916, -0.00010900944471359253, -8.769333362579346e-05, -6.637722253799438e-05, -4.506111145019531e-05, -2.374500036239624e-05, -2.428889274597168e-06, 1.8887221813201904e-05, 4.0203332901000977e-05, 6.151944398880005e-05, 8.283555507659912e-05, 0.0001041516661643982, 0.00012546777725219727, 0.00014678388833999634, 0.0001680999994277954, 0.00018941611051559448, 0.00021073222160339355, 0.00023204833269119263, 0.0002533644437789917, 0.00027468055486679077, 0.00029599666595458984, 0.0003173127770423889, 0.000338628888130188, 0.00035994499921798706, 0.00038126111030578613, 0.0004025772213935852, 0.0004238933324813843, 0.00044520944356918335, 0.0004665255546569824, 0.0004878416657447815, 0.0005091577768325806, 0.0005304738879203796, 0.0005517899990081787, 0.0005731061100959778, 0.0005944222211837769, 0.0006157383322715759, 0.000637054443359375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 5.0, 12.0, 11.0, 12.0, 17.0, 19.0, 21.0, 26.0, 35.0, 57.0, 64.0, 91.0, 162.0, 267.0, 784.0, 27787.0, 1016309.0, 1830.0, 431.0, 205.0, 120.0, 83.0, 46.0, 33.0, 32.0, 17.0, 16.0, 8.0, 14.0, 11.0, 4.0, 2.0, 2.0, 3.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01488494873046875, -0.014392971992492676, -0.013900995254516602, -0.013409018516540527, -0.012917041778564453, -0.012425065040588379, -0.011933088302612305, -0.01144111156463623, -0.010949134826660156, -0.010457158088684082, -0.009965181350708008, -0.009473204612731934, -0.00898122787475586, -0.008489251136779785, -0.007997274398803711, -0.007505297660827637, -0.0070133209228515625, -0.006521344184875488, -0.006029367446899414, -0.00553739070892334, -0.005045413970947266, -0.004553437232971191, -0.004061460494995117, -0.003569483757019043, -0.0030775070190429688, -0.0025855302810668945, -0.0020935535430908203, -0.001601576805114746, -0.0011096000671386719, -0.0006176233291625977, -0.00012564659118652344, 0.0003663301467895508, 0.000858306884765625, 0.0013502836227416992, 0.0018422603607177734, 0.0023342370986938477, 0.002826213836669922, 0.003318190574645996, 0.0038101673126220703, 0.0043021440505981445, 0.004794120788574219, 0.005286097526550293, 0.005778074264526367, 0.006270051002502441, 0.006762027740478516, 0.00725400447845459, 0.007745981216430664, 0.008237957954406738, 0.008729934692382812, 0.009221911430358887, 0.009713888168334961, 0.010205864906311035, 0.01069784164428711, 0.011189818382263184, 0.011681795120239258, 0.012173771858215332, 0.012665748596191406, 0.01315772533416748, 0.013649702072143555, 0.014141678810119629, 0.014633655548095703, 0.015125632286071777, 0.015617609024047852, 0.016109585762023926, 0.0166015625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 20.0, 33.0, 74.0, 99.0, 139.0, 186.0, 153.0, 128.0, 75.0, 46.0, 18.0, 17.0, 8.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003211433067917824, -0.00030575686832889915, -0.00029037045896984637, -0.00027498402050696313, -0.00025959761114791036, -0.0002442111726850271, -0.00022882474877405912, -0.0002134383248630911, -0.0001980519009521231, -0.0001826654770411551, -0.0001672790531301871, -0.0001518926292192191, -0.00013650619075633585, -0.00012111977412132546, -0.00010573334293439984, -9.034691902343184e-05, -7.496049511246383e-05, -5.9574071201495826e-05, -4.4187643652549013e-05, -2.88012161036022e-05, -1.3414792192634195e-05, 1.9716317183338106e-06, 1.735806290525943e-05, 3.2744486816227436e-05, 4.813091072719544e-05, 6.351733463816345e-05, 7.890375854913145e-05, 9.429018973605707e-05, 0.00010967661364702508, 0.00012506303028203547, 0.0001404494687449187, 0.0001558358926558867, 0.00017122231656685472, 0.00018660874047782272, 0.00020199516438879073, 0.00021738160285167396, 0.00023276801221072674, 0.00024815445067360997, 0.0002635408891364932, 0.000278927298495546, 0.00029431370785459876, 0.000309700146317482, 0.00032508655567653477, 0.000340472994139418, 0.0003558594034984708, 0.000371245841961354, 0.00038663228042423725, 0.00040201868978329003, 0.00041740512824617326, 0.0004327915667090565, 0.0004481779760681093, 0.0004635644145309925, 0.0004789508238900453, 0.0004943372332490981, 0.0005097236717119813, 0.0005251101101748645, 0.0005404965486377478, 0.000555882987100631, 0.0005712694255635142, 0.0005866558058187366, 0.0006020422442816198, 0.000617428682744503, 0.0006328151212073863, 0.0006482015596702695, 0.0006635879399254918]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 9.0, 14.0, 7.0, 10.0, 14.0, 15.0, 15.0, 20.0, 26.0, 27.0, 27.0, 24.0, 35.0, 24.0, 27.0, 28.0, 38.0, 30.0, 33.0, 32.0, 36.0, 33.0, 44.0, 48.0, 29.0, 41.0, 21.0, 29.0, 24.0, 22.0, 34.0, 22.0, 14.0, 22.0, 14.0, 21.0, 17.0, 19.0, 11.0, 7.0, 3.0, 3.0, 9.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00028628110885620117, -0.0002773944288492203, -0.0002685077488422394, -0.0002596210688352585, -0.0002507343888282776, -0.0002418477088212967, -0.0002329610288143158, -0.0002240743488073349, -0.000215187668800354, -0.0002063009887933731, -0.0001974143087863922, -0.00018852762877941132, -0.00017964094877243042, -0.00017075426876544952, -0.00016186758875846863, -0.00015298090875148773, -0.00014409422874450684, -0.00013520754873752594, -0.00012632086873054504, -0.00011743418872356415, -0.00010854750871658325, -9.966082870960236e-05, -9.077414870262146e-05, -8.188746869564056e-05, -7.300078868865967e-05, -6.411410868167877e-05, -5.5227428674697876e-05, -4.634074866771698e-05, -3.7454068660736084e-05, -2.8567388653755188e-05, -1.9680708646774292e-05, -1.0794028639793396e-05, -1.9073486328125e-06, 6.979331374168396e-06, 1.5866011381149292e-05, 2.4752691388130188e-05, 3.3639371395111084e-05, 4.252605140209198e-05, 5.1412731409072876e-05, 6.029941141605377e-05, 6.918609142303467e-05, 7.807277143001556e-05, 8.695945143699646e-05, 9.584613144397736e-05, 0.00010473281145095825, 0.00011361949145793915, 0.00012250617146492004, 0.00013139285147190094, 0.00014027953147888184, 0.00014916621148586273, 0.00015805289149284363, 0.00016693957149982452, 0.00017582625150680542, 0.00018471293151378632, 0.0001935996115207672, 0.0002024862915277481, 0.000211372971534729, 0.0002202596515417099, 0.0002291463315486908, 0.0002380330115556717, 0.0002469196915626526, 0.0002558063715696335, 0.0002646930515766144, 0.0002735797315835953, 0.00028246641159057617]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 8.0, 10.0, 7.0, 6.0, 10.0, 9.0, 14.0, 25.0, 29.0, 21.0, 39.0, 35.0, 29.0, 33.0, 45.0, 53.0, 45.0, 39.0, 46.0, 47.0, 32.0, 43.0, 38.0, 36.0, 36.0, 48.0, 27.0, 38.0, 21.0, 27.0, 13.0, 20.0, 15.0, 16.0, 8.0, 13.0, 5.0, 10.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.73858642578125, -6.5162353515625, -6.29388427734375, -6.071533203125, -5.84918212890625, -5.6268310546875, -5.40447998046875, -5.18212890625, -4.95977783203125, -4.7374267578125, -4.51507568359375, -4.292724609375, -4.07037353515625, -3.8480224609375, -3.62567138671875, -3.4033203125, -3.18096923828125, -2.9586181640625, -2.73626708984375, -2.513916015625, -2.29156494140625, -2.0692138671875, -1.84686279296875, -1.62451171875, -1.40216064453125, -1.1798095703125, -0.95745849609375, -0.735107421875, -0.51275634765625, -0.2904052734375, -0.06805419921875, 0.154296875, 0.37664794921875, 0.5989990234375, 0.82135009765625, 1.043701171875, 1.26605224609375, 1.4884033203125, 1.71075439453125, 1.93310546875, 2.15545654296875, 2.3778076171875, 2.60015869140625, 2.822509765625, 3.04486083984375, 3.2672119140625, 3.48956298828125, 3.7119140625, 3.93426513671875, 4.1566162109375, 4.37896728515625, 4.601318359375, 4.82366943359375, 5.0460205078125, 5.26837158203125, 5.49072265625, 5.71307373046875, 5.9354248046875, 6.15777587890625, 6.380126953125, 6.60247802734375, 6.8248291015625, 7.04718017578125, 7.26953125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 0.0, 8.0, 10.0, 8.0, 10.0, 19.0, 27.0, 27.0, 50.0, 60.0, 81.0, 143.0, 238.0, 332.0, 682.0, 1499.0, 4242.0, 13220.0, 51743.0, 250789.0, 555620.0, 127779.0, 28861.0, 7977.0, 2707.0, 1118.0, 529.0, 266.0, 162.0, 94.0, 68.0, 44.0, 38.0, 21.0, 23.0, 13.0, 19.0, 6.0, 13.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.5380859375, -6.322265625, -6.1064453125, -5.890625, -5.6748046875, -5.458984375, -5.2431640625, -5.02734375, -4.8115234375, -4.595703125, -4.3798828125, -4.1640625, -3.9482421875, -3.732421875, -3.5166015625, -3.30078125, -3.0849609375, -2.869140625, -2.6533203125, -2.4375, -2.2216796875, -2.005859375, -1.7900390625, -1.57421875, -1.3583984375, -1.142578125, -0.9267578125, -0.7109375, -0.4951171875, -0.279296875, -0.0634765625, 0.15234375, 0.3681640625, 0.583984375, 0.7998046875, 1.015625, 1.2314453125, 1.447265625, 1.6630859375, 1.87890625, 2.0947265625, 2.310546875, 2.5263671875, 2.7421875, 2.9580078125, 3.173828125, 3.3896484375, 3.60546875, 3.8212890625, 4.037109375, 4.2529296875, 4.46875, 4.6845703125, 4.900390625, 5.1162109375, 5.33203125, 5.5478515625, 5.763671875, 5.9794921875, 6.1953125, 6.4111328125, 6.626953125, 6.8427734375, 7.05859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 11.0, 10.0, 16.0, 21.0, 19.0, 28.0, 40.0, 40.0, 31.0, 37.0, 27.0, 45.0, 59.0, 110.0, 371.0, 1586.0, 111.0, 51.0, 42.0, 46.0, 32.0, 34.0, 39.0, 23.0, 29.0, 23.0, 15.0, 19.0, 21.0, 18.0, 9.0, 7.0, 11.0, 8.0, 5.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.5, -19.819580078125, -19.13916015625, -18.458740234375, -17.7783203125, -17.097900390625, -16.41748046875, -15.737060546875, -15.056640625, -14.376220703125, -13.69580078125, -13.015380859375, -12.3349609375, -11.654541015625, -10.97412109375, -10.293701171875, -9.61328125, -8.932861328125, -8.25244140625, -7.572021484375, -6.8916015625, -6.211181640625, -5.53076171875, -4.850341796875, -4.169921875, -3.489501953125, -2.80908203125, -2.128662109375, -1.4482421875, -0.767822265625, -0.08740234375, 0.593017578125, 1.2734375, 1.953857421875, 2.63427734375, 3.314697265625, 3.9951171875, 4.675537109375, 5.35595703125, 6.036376953125, 6.716796875, 7.397216796875, 8.07763671875, 8.758056640625, 9.4384765625, 10.118896484375, 10.79931640625, 11.479736328125, 12.16015625, 12.840576171875, 13.52099609375, 14.201416015625, 14.8818359375, 15.562255859375, 16.24267578125, 16.923095703125, 17.603515625, 18.283935546875, 18.96435546875, 19.644775390625, 20.3251953125, 21.005615234375, 21.68603515625, 22.366455078125, 23.046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 9.0, 13.0, 19.0, 28.0, 49.0, 58.0, 87.0, 133.0, 260.0, 422.0, 1275.0, 94034.0, 3046052.0, 2007.0, 512.0, 263.0, 179.0, 97.0, 63.0, 43.0, 28.0, 18.0, 11.0, 12.0, 6.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.3125, -76.5888671875, -73.865234375, -71.1416015625, -68.41796875, -65.6943359375, -62.970703125, -60.2470703125, -57.5234375, -54.7998046875, -52.076171875, -49.3525390625, -46.62890625, -43.9052734375, -41.181640625, -38.4580078125, -35.734375, -33.0107421875, -30.287109375, -27.5634765625, -24.83984375, -22.1162109375, -19.392578125, -16.6689453125, -13.9453125, -11.2216796875, -8.498046875, -5.7744140625, -3.05078125, -0.3271484375, 2.396484375, 5.1201171875, 7.84375, 10.5673828125, 13.291015625, 16.0146484375, 18.73828125, 21.4619140625, 24.185546875, 26.9091796875, 29.6328125, 32.3564453125, 35.080078125, 37.8037109375, 40.52734375, 43.2509765625, 45.974609375, 48.6982421875, 51.421875, 54.1455078125, 56.869140625, 59.5927734375, 62.31640625, 65.0400390625, 67.763671875, 70.4873046875, 73.2109375, 75.9345703125, 78.658203125, 81.3818359375, 84.10546875, 86.8291015625, 89.552734375, 92.2763671875, 95.0]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1010.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.07209396362305, -45.55060958862305, -33.02912139892578, -20.50763702392578, -7.986152648925781, 4.535331726074219, 17.056819915771484, 29.578304290771484, 42.099788665771484, 54.621273040771484, 67.14276123046875, 79.66424560546875, 92.18572998046875, 104.70721435546875, 117.22869873046875, 129.75018310546875, 142.27166748046875, 154.79315185546875, 167.31463623046875, 179.83612060546875, 192.35760498046875, 204.87908935546875, 217.40057373046875, 229.92205810546875, 242.4435577392578, 254.9650421142578, 267.4865417480469, 280.0080261230469, 292.5295104980469, 305.0509948730469, 317.5724792480469, 330.0939636230469, 342.6154479980469, 355.1369323730469, 367.6584167480469, 380.1799011230469, 392.7013854980469, 405.2228698730469, 417.7443542480469, 430.2658386230469, 442.7873229980469, 455.3088073730469, 467.8302917480469, 480.3517761230469, 492.8732604980469, 505.3947448730469, 517.916259765625, 530.437744140625, 542.959228515625, 555.480712890625, 568.002197265625, 580.523681640625, 593.045166015625, 605.566650390625, 618.088134765625, 630.609619140625, 643.131103515625, 655.652587890625, 668.174072265625, 680.695556640625, 693.217041015625, 705.738525390625, 718.260009765625, 730.781494140625, 743.302978515625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 9.0, 12.0, 17.0, 18.0, 15.0, 26.0, 23.0, 24.0, 33.0, 31.0, 25.0, 34.0, 40.0, 37.0, 30.0, 39.0, 39.0, 40.0, 43.0, 41.0, 44.0, 33.0, 29.0, 50.0, 34.0, 21.0, 23.0, 26.0, 22.0, 19.0, 19.0, 14.0, 8.0, 9.0, 17.0, 4.0, 3.0, 6.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-65.43413543701172, -63.51478576660156, -61.59543991088867, -59.676090240478516, -57.756744384765625, -55.83739471435547, -53.91804504394531, -51.99869918823242, -50.07935333251953, -48.160003662109375, -46.240657806396484, -44.32130813598633, -42.40196228027344, -40.48261260986328, -38.563262939453125, -36.643917083740234, -34.72456741333008, -32.80521774291992, -30.88587188720703, -28.966522216796875, -27.047176361083984, -25.127826690673828, -23.208478927612305, -21.28913116455078, -19.369783401489258, -17.450435638427734, -15.531087875366211, -13.611739158630371, -11.692391395568848, -9.773043632507324, -7.853694915771484, -5.934347152709961, -4.0149993896484375, -2.095651388168335, -0.17630338668823242, 1.7430448532104492, 3.6623926162719727, 5.581740379333496, 7.501089096069336, 9.42043685913086, 11.339784622192383, 13.259132385253906, 15.17848014831543, 17.097827911376953, 19.01717758178711, 20.9365234375, 22.855873107910156, 24.77522087097168, 26.694568634033203, 28.613916397094727, 30.53326416015625, 32.452613830566406, 34.3719596862793, 36.29130935668945, 38.210655212402344, 40.1300048828125, 42.049354553222656, 43.96870422363281, 45.8880500793457, 47.80739974975586, 49.72674560546875, 51.646095275878906, 53.56544494628906, 55.48479080200195, 57.404136657714844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 10.0, 9.0, 4.0, 7.0, 8.0, 16.0, 18.0, 21.0, 28.0, 30.0, 21.0, 45.0, 34.0, 39.0, 50.0, 42.0, 46.0, 54.0, 44.0, 42.0, 40.0, 39.0, 35.0, 37.0, 34.0, 37.0, 38.0, 35.0, 18.0, 20.0, 15.0, 19.0, 13.0, 15.0, 15.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.72265625, -6.48919677734375, -6.2557373046875, -6.02227783203125, -5.788818359375, -5.55535888671875, -5.3218994140625, -5.08843994140625, -4.85498046875, -4.62152099609375, -4.3880615234375, -4.15460205078125, -3.921142578125, -3.68768310546875, -3.4542236328125, -3.22076416015625, -2.9873046875, -2.75384521484375, -2.5203857421875, -2.28692626953125, -2.053466796875, -1.82000732421875, -1.5865478515625, -1.35308837890625, -1.11962890625, -0.88616943359375, -0.6527099609375, -0.41925048828125, -0.185791015625, 0.04766845703125, 0.2811279296875, 0.51458740234375, 0.748046875, 0.98150634765625, 1.2149658203125, 1.44842529296875, 1.681884765625, 1.91534423828125, 2.1488037109375, 2.38226318359375, 2.61572265625, 2.84918212890625, 3.0826416015625, 3.31610107421875, 3.549560546875, 3.78302001953125, 4.0164794921875, 4.24993896484375, 4.4833984375, 4.71685791015625, 4.9503173828125, 5.18377685546875, 5.417236328125, 5.65069580078125, 5.8841552734375, 6.11761474609375, 6.35107421875, 6.58453369140625, 6.8179931640625, 7.05145263671875, 7.284912109375, 7.51837158203125, 7.7518310546875, 7.98529052734375, 8.21875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 0.0, 13.0, 10.0, 19.0, 18.0, 21.0, 32.0, 34.0, 37.0, 48.0, 60.0, 70.0, 136.0, 140.0, 246.0, 425.0, 1276.0, 6121.0, 110931.0, 2250592.0, 1753481.0, 63394.0, 4861.0, 1052.0, 391.0, 226.0, 151.0, 92.0, 72.0, 51.0, 46.0, 40.0, 40.0, 34.0, 34.0, 14.0, 12.0, 14.0, 10.0, 11.0, 6.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.1875, -15.60791015625, -15.0283203125, -14.44873046875, -13.869140625, -13.28955078125, -12.7099609375, -12.13037109375, -11.55078125, -10.97119140625, -10.3916015625, -9.81201171875, -9.232421875, -8.65283203125, -8.0732421875, -7.49365234375, -6.9140625, -6.33447265625, -5.7548828125, -5.17529296875, -4.595703125, -4.01611328125, -3.4365234375, -2.85693359375, -2.27734375, -1.69775390625, -1.1181640625, -0.53857421875, 0.041015625, 0.62060546875, 1.2001953125, 1.77978515625, 2.359375, 2.93896484375, 3.5185546875, 4.09814453125, 4.677734375, 5.25732421875, 5.8369140625, 6.41650390625, 6.99609375, 7.57568359375, 8.1552734375, 8.73486328125, 9.314453125, 9.89404296875, 10.4736328125, 11.05322265625, 11.6328125, 12.21240234375, 12.7919921875, 13.37158203125, 13.951171875, 14.53076171875, 15.1103515625, 15.68994140625, 16.26953125, 16.84912109375, 17.4287109375, 18.00830078125, 18.587890625, 19.16748046875, 19.7470703125, 20.32666015625, 20.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 13.0, 16.0, 14.0, 8.0, 21.0, 27.0, 38.0, 52.0, 69.0, 75.0, 97.0, 145.0, 192.0, 259.0, 335.0, 417.0, 428.0, 431.0, 343.0, 241.0, 219.0, 129.0, 110.0, 93.0, 79.0, 56.0, 37.0, 18.0, 24.0, 18.0, 16.0, 9.0, 8.0, 8.0, 6.0, 4.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.453125, -10.087158203125, -9.72119140625, -9.355224609375, -8.9892578125, -8.623291015625, -8.25732421875, -7.891357421875, -7.525390625, -7.159423828125, -6.79345703125, -6.427490234375, -6.0615234375, -5.695556640625, -5.32958984375, -4.963623046875, -4.59765625, -4.231689453125, -3.86572265625, -3.499755859375, -3.1337890625, -2.767822265625, -2.40185546875, -2.035888671875, -1.669921875, -1.303955078125, -0.93798828125, -0.572021484375, -0.2060546875, 0.159912109375, 0.52587890625, 0.891845703125, 1.2578125, 1.623779296875, 1.98974609375, 2.355712890625, 2.7216796875, 3.087646484375, 3.45361328125, 3.819580078125, 4.185546875, 4.551513671875, 4.91748046875, 5.283447265625, 5.6494140625, 6.015380859375, 6.38134765625, 6.747314453125, 7.11328125, 7.479248046875, 7.84521484375, 8.211181640625, 8.5771484375, 8.943115234375, 9.30908203125, 9.675048828125, 10.041015625, 10.406982421875, 10.77294921875, 11.138916015625, 11.5048828125, 11.870849609375, 12.23681640625, 12.602783203125, 12.96875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 7.0, 7.0, 10.0, 7.0, 13.0, 19.0, 14.0, 23.0, 26.0, 42.0, 50.0, 61.0, 97.0, 89.0, 121.0, 154.0, 177.0, 235.0, 367.0, 582.0, 3389.0, 3810469.0, 375065.0, 1336.0, 536.0, 336.0, 219.0, 165.0, 134.0, 104.0, 72.0, 78.0, 59.0, 45.0, 39.0, 36.0, 26.0, 18.0, 23.0, 10.0, 7.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.875, -61.8037109375, -59.732421875, -57.6611328125, -55.58984375, -53.5185546875, -51.447265625, -49.3759765625, -47.3046875, -45.2333984375, -43.162109375, -41.0908203125, -39.01953125, -36.9482421875, -34.876953125, -32.8056640625, -30.734375, -28.6630859375, -26.591796875, -24.5205078125, -22.44921875, -20.3779296875, -18.306640625, -16.2353515625, -14.1640625, -12.0927734375, -10.021484375, -7.9501953125, -5.87890625, -3.8076171875, -1.736328125, 0.3349609375, 2.40625, 4.4775390625, 6.548828125, 8.6201171875, 10.69140625, 12.7626953125, 14.833984375, 16.9052734375, 18.9765625, 21.0478515625, 23.119140625, 25.1904296875, 27.26171875, 29.3330078125, 31.404296875, 33.4755859375, 35.546875, 37.6181640625, 39.689453125, 41.7607421875, 43.83203125, 45.9033203125, 47.974609375, 50.0458984375, 52.1171875, 54.1884765625, 56.259765625, 58.3310546875, 60.40234375, 62.4736328125, 64.544921875, 66.6162109375, 68.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 62.0, 550.0, 379.0, 22.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.54374694824219, -113.67644500732422, -104.80913543701172, -95.94183349609375, -87.07452392578125, -78.20722198486328, -69.33992004394531, -60.47261428833008, -51.605308532714844, -42.73800277709961, -33.870697021484375, -25.003395080566406, -16.136089324951172, -7.2687835693359375, 1.5985183715820312, 10.465824127197266, 19.3331298828125, 28.200435638427734, 37.06774139404297, 45.93504333496094, 54.80234909057617, 63.669654846191406, 72.53695678710938, 81.40426635742188, 90.27156829833984, 99.13887023925781, 108.00617980957031, 116.87348175048828, 125.74078369140625, 134.60809326171875, 143.47540283203125, 152.3426971435547, 161.21002197265625, 170.07733154296875, 178.9446258544922, 187.8119354248047, 196.6792449951172, 205.54653930664062, 214.41384887695312, 223.28115844726562, 232.14846801757812, 241.01577758789062, 249.88307189941406, 258.7503662109375, 267.61767578125, 276.4849853515625, 285.352294921875, 294.2196044921875, 303.0869140625, 311.9542236328125, 320.821533203125, 329.6888427734375, 338.5561218261719, 347.4234313964844, 356.2907409667969, 365.1580505371094, 374.02532958984375, 382.89263916015625, 391.75994873046875, 400.62725830078125, 409.4945373535156, 418.3618469238281, 427.2291564941406, 436.0964660644531, 444.9637756347656]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 9.0, 16.0, 11.0, 16.0, 12.0, 26.0, 21.0, 32.0, 39.0, 35.0, 36.0, 45.0, 32.0, 38.0, 40.0, 38.0, 58.0, 48.0, 56.0, 44.0, 38.0, 29.0, 35.0, 32.0, 33.0, 31.0, 17.0, 29.0, 20.0, 10.0, 9.0, 9.0, 10.0, 9.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.27734375, -44.82401657104492, -43.370689392089844, -41.917362213134766, -40.46403503417969, -39.010711669921875, -37.5573844909668, -36.10405731201172, -34.65073013305664, -33.19740295410156, -31.744075775146484, -30.29075050354004, -28.83742332458496, -27.384096145629883, -25.930770874023438, -24.47744369506836, -23.02411651611328, -21.570789337158203, -20.117462158203125, -18.66413688659668, -17.2108097076416, -15.757482528686523, -14.304156303405762, -12.850830078125, -11.397502899169922, -9.944175720214844, -8.490849494934082, -7.037522792816162, -5.584196090698242, -4.130869388580322, -2.6775426864624023, -1.2242164611816406, 0.2291107177734375, 1.6824374198913574, 3.1357641220092773, 4.589090824127197, 6.042417526245117, 7.495744228363037, 8.949070930480957, 10.402397155761719, 11.855724334716797, 13.309051513671875, 14.762377738952637, 16.2157039642334, 17.669031143188477, 19.122358322143555, 20.57568359375, 22.029010772705078, 23.482337951660156, 24.935665130615234, 26.388992309570312, 27.842317581176758, 29.295644760131836, 30.748971939086914, 32.20229721069336, 33.65562438964844, 35.108951568603516, 36.562278747558594, 38.01560592651367, 39.46893310546875, 40.92225646972656, 42.37558364868164, 43.82891082763672, 45.2822380065918, 46.735565185546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 24.0, 30.0, 33.0, 76.0, 90.0, 157.0, 233.0, 338.0, 539.0, 821.0, 1303.0, 2094.0, 3360.0, 5206.0, 8046.0, 13163.0, 20698.0, 34112.0, 57358.0, 101977.0, 196468.0, 267024.0, 141850.0, 77084.0, 44286.0, 26736.0, 16659.0, 10733.0, 6523.0, 4103.0, 2656.0, 1748.0, 1058.0, 701.0, 490.0, 277.0, 179.0, 117.0, 55.0, 48.0, 37.0, 16.0, 15.0, 12.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.17578125, -1.1414642333984375, -1.107147216796875, -1.0728302001953125, -1.03851318359375, -1.0041961669921875, -0.969879150390625, -0.9355621337890625, -0.9012451171875, -0.8669281005859375, -0.832611083984375, -0.7982940673828125, -0.76397705078125, -0.7296600341796875, -0.695343017578125, -0.6610260009765625, -0.626708984375, -0.5923919677734375, -0.558074951171875, -0.5237579345703125, -0.48944091796875, -0.4551239013671875, -0.420806884765625, -0.3864898681640625, -0.3521728515625, -0.3178558349609375, -0.283538818359375, -0.2492218017578125, -0.21490478515625, -0.1805877685546875, -0.146270751953125, -0.1119537353515625, -0.07763671875, -0.0433197021484375, -0.009002685546875, 0.0253143310546875, 0.05963134765625, 0.0939483642578125, 0.128265380859375, 0.1625823974609375, 0.1968994140625, 0.2312164306640625, 0.265533447265625, 0.2998504638671875, 0.33416748046875, 0.3684844970703125, 0.402801513671875, 0.4371185302734375, 0.471435546875, 0.5057525634765625, 0.540069580078125, 0.5743865966796875, 0.60870361328125, 0.6430206298828125, 0.677337646484375, 0.7116546630859375, 0.7459716796875, 0.7802886962890625, 0.814605712890625, 0.8489227294921875, 0.88323974609375, 0.9175567626953125, 0.951873779296875, 0.9861907958984375, 1.0205078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 8.0, 3.0, 7.0, 13.0, 13.0, 9.0, 12.0, 21.0, 12.0, 23.0, 16.0, 24.0, 32.0, 18.0, 32.0, 38.0, 44.0, 35.0, 38.0, 37.0, 37.0, 1048.0, 30.0, 51.0, 29.0, 48.0, 43.0, 29.0, 34.0, 30.0, 28.0, 24.0, 22.0, 17.0, 10.0, 20.0, 13.0, 16.0, 12.0, 6.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.68359375, -3.56640625, -3.44921875, -3.33203125, -3.21484375, -3.09765625, -2.98046875, -2.86328125, -2.74609375, -2.62890625, -2.51171875, -2.39453125, -2.27734375, -2.16015625, -2.04296875, -1.92578125, -1.80859375, -1.69140625, -1.57421875, -1.45703125, -1.33984375, -1.22265625, -1.10546875, -0.98828125, -0.87109375, -0.75390625, -0.63671875, -0.51953125, -0.40234375, -0.28515625, -0.16796875, -0.05078125, 0.06640625, 0.18359375, 0.30078125, 0.41796875, 0.53515625, 0.65234375, 0.76953125, 0.88671875, 1.00390625, 1.12109375, 1.23828125, 1.35546875, 1.47265625, 1.58984375, 1.70703125, 1.82421875, 1.94140625, 2.05859375, 2.17578125, 2.29296875, 2.41015625, 2.52734375, 2.64453125, 2.76171875, 2.87890625, 2.99609375, 3.11328125, 3.23046875, 3.34765625, 3.46484375, 3.58203125, 3.69921875, 3.81640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 13.0, 16.0, 21.0, 23.0, 47.0, 70.0, 105.0, 142.0, 218.0, 322.0, 465.0, 670.0, 951.0, 1319.0, 1787.0, 2746.0, 4008.0, 5913.0, 8744.0, 13147.0, 20511.0, 32149.0, 51895.0, 85973.0, 148626.0, 1289126.0, 169847.0, 96840.0, 58146.0, 36081.0, 22562.0, 14548.0, 9400.0, 6615.0, 4325.0, 2935.0, 2102.0, 1411.0, 1005.0, 724.0, 489.0, 356.0, 246.0, 151.0, 116.0, 70.0, 48.0, 40.0, 29.0, 15.0, 8.0, 7.0, 7.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.90478515625, -0.877044677734375, -0.84930419921875, -0.821563720703125, -0.7938232421875, -0.766082763671875, -0.73834228515625, -0.710601806640625, -0.682861328125, -0.655120849609375, -0.62738037109375, -0.599639892578125, -0.5718994140625, -0.544158935546875, -0.51641845703125, -0.488677978515625, -0.4609375, -0.433197021484375, -0.40545654296875, -0.377716064453125, -0.3499755859375, -0.322235107421875, -0.29449462890625, -0.266754150390625, -0.239013671875, -0.211273193359375, -0.18353271484375, -0.155792236328125, -0.1280517578125, -0.100311279296875, -0.07257080078125, -0.044830322265625, -0.01708984375, 0.010650634765625, 0.03839111328125, 0.066131591796875, 0.0938720703125, 0.121612548828125, 0.14935302734375, 0.177093505859375, 0.204833984375, 0.232574462890625, 0.26031494140625, 0.288055419921875, 0.3157958984375, 0.343536376953125, 0.37127685546875, 0.399017333984375, 0.4267578125, 0.454498291015625, 0.48223876953125, 0.509979248046875, 0.5377197265625, 0.565460205078125, 0.59320068359375, 0.620941162109375, 0.648681640625, 0.676422119140625, 0.70416259765625, 0.731903076171875, 0.7596435546875, 0.787384033203125, 0.81512451171875, 0.842864990234375, 0.87060546875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 13.0, 19.0, 27.0, 38.0, 45.0, 72.0, 76.0, 104.0, 124.0, 101.0, 91.0, 77.0, 49.0, 42.0, 30.0, 16.0, 26.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009589195251464844, -0.0009312108159065247, -0.0009035021066665649, -0.0008757933974266052, -0.0008480846881866455, -0.0008203759789466858, -0.0007926672697067261, -0.0007649585604667664, -0.0007372498512268066, -0.0007095411419868469, -0.0006818324327468872, -0.0006541237235069275, -0.0006264150142669678, -0.0005987063050270081, -0.0005709975957870483, -0.0005432888865470886, -0.0005155801773071289, -0.0004878714680671692, -0.00046016275882720947, -0.00043245404958724976, -0.00040474534034729004, -0.0003770366311073303, -0.0003493279218673706, -0.0003216192126274109, -0.00029391050338745117, -0.00026620179414749146, -0.00023849308490753174, -0.00021078437566757202, -0.0001830756664276123, -0.0001553669571876526, -0.00012765824794769287, -9.994953870773315e-05, -7.224082946777344e-05, -4.453212022781372e-05, -1.6823410987854004e-05, 1.0885298252105713e-05, 3.859400749206543e-05, 6.630271673202515e-05, 9.401142597198486e-05, 0.00012172013521194458, 0.0001494288444519043, 0.00017713755369186401, 0.00020484626293182373, 0.00023255497217178345, 0.00026026368141174316, 0.0002879723906517029, 0.0003156810998916626, 0.0003433898091316223, 0.00037109851837158203, 0.00039880722761154175, 0.00042651593685150146, 0.0004542246460914612, 0.0004819333553314209, 0.0005096420645713806, 0.0005373507738113403, 0.0005650594830513, 0.0005927681922912598, 0.0006204769015312195, 0.0006481856107711792, 0.0006758943200111389, 0.0007036030292510986, 0.0007313117384910583, 0.0007590204477310181, 0.0007867291569709778, 0.0008144378662109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 10.0, 7.0, 15.0, 14.0, 18.0, 38.0, 54.0, 85.0, 136.0, 224.0, 812.0, 788461.0, 257434.0, 661.0, 223.0, 120.0, 64.0, 52.0, 29.0, 26.0, 21.0, 12.0, 8.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019439697265625, -0.018790721893310547, -0.018141746520996094, -0.01749277114868164, -0.016843795776367188, -0.016194820404052734, -0.015545845031738281, -0.014896869659423828, -0.014247894287109375, -0.013598918914794922, -0.012949943542480469, -0.012300968170166016, -0.011651992797851562, -0.01100301742553711, -0.010354042053222656, -0.009705066680908203, -0.00905609130859375, -0.008407115936279297, -0.007758140563964844, -0.007109165191650391, -0.0064601898193359375, -0.005811214447021484, -0.005162239074707031, -0.004513263702392578, -0.003864288330078125, -0.003215312957763672, -0.0025663375854492188, -0.0019173622131347656, -0.0012683868408203125, -0.0006194114685058594, 2.956390380859375e-05, 0.0006785392761230469, 0.0013275146484375, 0.001976490020751953, 0.0026254653930664062, 0.0032744407653808594, 0.0039234161376953125, 0.004572391510009766, 0.005221366882324219, 0.005870342254638672, 0.006519317626953125, 0.007168292999267578, 0.007817268371582031, 0.008466243743896484, 0.009115219116210938, 0.00976419448852539, 0.010413169860839844, 0.011062145233154297, 0.01171112060546875, 0.012360095977783203, 0.013009071350097656, 0.01365804672241211, 0.014307022094726562, 0.014955997467041016, 0.015604972839355469, 0.016253948211669922, 0.016902923583984375, 0.017551898956298828, 0.01820087432861328, 0.018849849700927734, 0.019498825073242188, 0.02014780044555664, 0.020796775817871094, 0.021445751190185547, 0.0220947265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 295.0, 711.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005777199403382838, -0.00046610942808911204, -0.0003544989158399403, -0.00024288837448693812, -0.00013127786223776639, -1.9667320884764194e-05, 9.194319136440754e-05, 0.00020355370361357927, 0.000315164215862751, 0.00042677472811192274, 0.0005383852403610945, 0.0006499957526102662, 0.0007616062648594379, 0.0008732168353162706, 0.0009848272893577814, 0.001096437918022275, 0.0012080483138561249, 0.0013196588261052966, 0.0014312693383544683, 0.00154287985060364, 0.0016544903628528118, 0.0017661009915173054, 0.0018777113873511553, 0.001989322016015649, 0.0021009324118494987, 0.0022125430405139923, 0.002324153436347842, 0.0024357640650123358, 0.0025473744608461857, 0.0026589850895106792, 0.002770595485344529, 0.0028822061140090227, 0.0029938167426735163, 0.00310542737133801, 0.0032170377671718597, 0.0033286483958363533, 0.003440258791670203, 0.0035518694203346968, 0.0036634798161685467, 0.0037750904448330402, 0.00388670084066689, 0.00399831123650074, 0.004109921865165234, 0.004221532493829727, 0.004333143122494221, 0.004444753285497427, 0.0045563639141619205, 0.004667974542826414, 0.004779585171490908, 0.004891195800155401, 0.005002806428819895, 0.005114416591823101, 0.005226027220487595, 0.005337637849152088, 0.005449248477816582, 0.005560858640819788, 0.0056724692694842815, 0.005784079898148775, 0.005895690526813269, 0.006007300689816475, 0.0061189113184809685, 0.006230521947145462, 0.006342132575809956, 0.006453742738813162, 0.006565353367477655]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 11.0, 10.0, 11.0, 16.0, 19.0, 19.0, 20.0, 10.0, 25.0, 28.0, 27.0, 35.0, 32.0, 33.0, 24.0, 34.0, 53.0, 38.0, 40.0, 42.0, 43.0, 37.0, 47.0, 35.0, 34.0, 33.0, 30.0, 28.0, 24.0, 18.0, 20.0, 15.0, 14.0, 11.0, 15.0, 10.0, 17.0, 6.0, 6.0, 3.0, 4.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026416778564453125, -0.0002552289515733719, -0.0002462901175022125, -0.00023735128343105316, -0.0002284124493598938, -0.00021947361528873444, -0.00021053478121757507, -0.0002015959471464157, -0.00019265711307525635, -0.00018371827900409698, -0.00017477944493293762, -0.00016584061086177826, -0.0001569017767906189, -0.00014796294271945953, -0.00013902410864830017, -0.0001300852745771408, -0.00012114644050598145, -0.00011220760643482208, -0.00010326877236366272, -9.432993829250336e-05, -8.5391104221344e-05, -7.645227015018463e-05, -6.751343607902527e-05, -5.8574602007865906e-05, -4.963576793670654e-05, -4.069693386554718e-05, -3.175809979438782e-05, -2.2819265723228455e-05, -1.3880431652069092e-05, -4.941597580909729e-06, 3.997236490249634e-06, 1.2936070561408997e-05, 2.187490463256836e-05, 3.081373870372772e-05, 3.9752572774887085e-05, 4.869140684604645e-05, 5.763024091720581e-05, 6.656907498836517e-05, 7.550790905952454e-05, 8.44467431306839e-05, 9.338557720184326e-05, 0.00010232441127300262, 0.00011126324534416199, 0.00012020207941532135, 0.0001291409134864807, 0.00013807974755764008, 0.00014701858162879944, 0.0001559574156999588, 0.00016489624977111816, 0.00017383508384227753, 0.0001827739179134369, 0.00019171275198459625, 0.00020065158605575562, 0.00020959042012691498, 0.00021852925419807434, 0.0002274680882692337, 0.00023640692234039307, 0.00024534575641155243, 0.0002542845904827118, 0.00026322342455387115, 0.0002721622586250305, 0.0002811010926961899, 0.00029003992676734924, 0.0002989787608385086, 0.00030791759490966797]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 8.0, 16.0, 11.0, 17.0, 25.0, 28.0, 32.0, 40.0, 22.0, 34.0, 34.0, 40.0, 36.0, 49.0, 30.0, 51.0, 47.0, 48.0, 42.0, 43.0, 34.0, 33.0, 34.0, 36.0, 28.0, 23.0, 23.0, 27.0, 18.0, 17.0, 9.0, 16.0, 15.0, 8.0, 7.0, 2.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.515625, -6.2955322265625, -6.075439453125, -5.8553466796875, -5.63525390625, -5.4151611328125, -5.195068359375, -4.9749755859375, -4.7548828125, -4.5347900390625, -4.314697265625, -4.0946044921875, -3.87451171875, -3.6544189453125, -3.434326171875, -3.2142333984375, -2.994140625, -2.7740478515625, -2.553955078125, -2.3338623046875, -2.11376953125, -1.8936767578125, -1.673583984375, -1.4534912109375, -1.2333984375, -1.0133056640625, -0.793212890625, -0.5731201171875, -0.35302734375, -0.1329345703125, 0.087158203125, 0.3072509765625, 0.52734375, 0.7474365234375, 0.967529296875, 1.1876220703125, 1.40771484375, 1.6278076171875, 1.847900390625, 2.0679931640625, 2.2880859375, 2.5081787109375, 2.728271484375, 2.9483642578125, 3.16845703125, 3.3885498046875, 3.608642578125, 3.8287353515625, 4.048828125, 4.2689208984375, 4.489013671875, 4.7091064453125, 4.92919921875, 5.1492919921875, 5.369384765625, 5.5894775390625, 5.8095703125, 6.0296630859375, 6.249755859375, 6.4698486328125, 6.68994140625, 6.9100341796875, 7.130126953125, 7.3502197265625, 7.5703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 10.0, 6.0, 14.0, 11.0, 14.0, 26.0, 36.0, 44.0, 69.0, 138.0, 243.0, 410.0, 855.0, 1628.0, 3221.0, 6738.0, 14392.0, 32769.0, 82577.0, 225869.0, 405137.0, 165105.0, 61806.0, 25324.0, 11166.0, 5352.0, 2615.0, 1345.0, 681.0, 389.0, 210.0, 118.0, 57.0, 52.0, 32.0, 12.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.955078125, -3.8203125, -3.685546875, -3.55078125, -3.416015625, -3.28125, -3.146484375, -3.01171875, -2.876953125, -2.7421875, -2.607421875, -2.47265625, -2.337890625, -2.203125, -2.068359375, -1.93359375, -1.798828125, -1.6640625, -1.529296875, -1.39453125, -1.259765625, -1.125, -0.990234375, -0.85546875, -0.720703125, -0.5859375, -0.451171875, -0.31640625, -0.181640625, -0.046875, 0.087890625, 0.22265625, 0.357421875, 0.4921875, 0.626953125, 0.76171875, 0.896484375, 1.03125, 1.166015625, 1.30078125, 1.435546875, 1.5703125, 1.705078125, 1.83984375, 1.974609375, 2.109375, 2.244140625, 2.37890625, 2.513671875, 2.6484375, 2.783203125, 2.91796875, 3.052734375, 3.1875, 3.322265625, 3.45703125, 3.591796875, 3.7265625, 3.861328125, 3.99609375, 4.130859375, 4.265625, 4.400390625, 4.53515625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 11.0, 7.0, 8.0, 7.0, 11.0, 10.0, 13.0, 21.0, 15.0, 17.0, 25.0, 31.0, 31.0, 42.0, 39.0, 50.0, 54.0, 87.0, 179.0, 1693.0, 186.0, 85.0, 58.0, 41.0, 38.0, 33.0, 33.0, 33.0, 29.0, 31.0, 20.0, 25.0, 10.0, 19.0, 10.0, 6.0, 4.0, 8.0, 8.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-21.3125, -20.634765625, -19.95703125, -19.279296875, -18.6015625, -17.923828125, -17.24609375, -16.568359375, -15.890625, -15.212890625, -14.53515625, -13.857421875, -13.1796875, -12.501953125, -11.82421875, -11.146484375, -10.46875, -9.791015625, -9.11328125, -8.435546875, -7.7578125, -7.080078125, -6.40234375, -5.724609375, -5.046875, -4.369140625, -3.69140625, -3.013671875, -2.3359375, -1.658203125, -0.98046875, -0.302734375, 0.375, 1.052734375, 1.73046875, 2.408203125, 3.0859375, 3.763671875, 4.44140625, 5.119140625, 5.796875, 6.474609375, 7.15234375, 7.830078125, 8.5078125, 9.185546875, 9.86328125, 10.541015625, 11.21875, 11.896484375, 12.57421875, 13.251953125, 13.9296875, 14.607421875, 15.28515625, 15.962890625, 16.640625, 17.318359375, 17.99609375, 18.673828125, 19.3515625, 20.029296875, 20.70703125, 21.384765625, 22.0625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 10.0, 12.0, 9.0, 9.0, 24.0, 21.0, 24.0, 32.0, 49.0, 61.0, 71.0, 105.0, 110.0, 139.0, 205.0, 332.0, 601.0, 2288.0, 419133.0, 2717268.0, 3339.0, 652.0, 296.0, 221.0, 148.0, 135.0, 73.0, 70.0, 54.0, 39.0, 40.0, 25.0, 19.0, 13.0, 11.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.53125, -51.9130859375, -50.294921875, -48.6767578125, -47.05859375, -45.4404296875, -43.822265625, -42.2041015625, -40.5859375, -38.9677734375, -37.349609375, -35.7314453125, -34.11328125, -32.4951171875, -30.876953125, -29.2587890625, -27.640625, -26.0224609375, -24.404296875, -22.7861328125, -21.16796875, -19.5498046875, -17.931640625, -16.3134765625, -14.6953125, -13.0771484375, -11.458984375, -9.8408203125, -8.22265625, -6.6044921875, -4.986328125, -3.3681640625, -1.75, -0.1318359375, 1.486328125, 3.1044921875, 4.72265625, 6.3408203125, 7.958984375, 9.5771484375, 11.1953125, 12.8134765625, 14.431640625, 16.0498046875, 17.66796875, 19.2861328125, 20.904296875, 22.5224609375, 24.140625, 25.7587890625, 27.376953125, 28.9951171875, 30.61328125, 32.2314453125, 33.849609375, 35.4677734375, 37.0859375, 38.7041015625, 40.322265625, 41.9404296875, 43.55859375, 45.1767578125, 46.794921875, 48.4130859375, 50.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 9.0, 220.0, 652.0, 125.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.327392578125, -16.333105087280273, -13.338817596435547, -10.34453010559082, -7.350242614746094, -4.355955123901367, -1.3616676330566406, 1.632619857788086, 4.6269073486328125, 7.621194839477539, 10.615482330322266, 13.609769821166992, 16.60405731201172, 19.598344802856445, 22.592632293701172, 25.5869197845459, 28.581207275390625, 31.57549476623535, 34.56978225708008, 37.56407165527344, 40.55835723876953, 43.552642822265625, 46.546932220458984, 49.541221618652344, 52.53550720214844, 55.52979278564453, 58.52408218383789, 61.51837158203125, 64.51265716552734, 67.50694274902344, 70.50123596191406, 73.49552154541016, 76.48980712890625, 79.48409271240234, 82.47837829589844, 85.47267150878906, 88.46695709228516, 91.46124267578125, 94.45553588867188, 97.44982147216797, 100.44410705566406, 103.43839263916016, 106.43267822265625, 109.42697143554688, 112.42125701904297, 115.41554260253906, 118.40983581542969, 121.40412139892578, 124.39840698242188, 127.39269256591797, 130.38697814941406, 133.3812713623047, 136.37554931640625, 139.36984252929688, 142.3641357421875, 145.35841369628906, 148.3527069091797, 151.3470001220703, 154.34127807617188, 157.3355712890625, 160.32986450195312, 163.3241424560547, 166.3184356689453, 169.31271362304688, 172.3070068359375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 7.0, 7.0, 6.0, 11.0, 13.0, 20.0, 21.0, 11.0, 22.0, 29.0, 26.0, 27.0, 27.0, 28.0, 30.0, 37.0, 42.0, 38.0, 40.0, 37.0, 46.0, 48.0, 32.0, 46.0, 27.0, 39.0, 29.0, 28.0, 19.0, 28.0, 32.0, 18.0, 23.0, 20.0, 18.0, 14.0, 11.0, 9.0, 5.0, 8.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.3079833984375, -46.60369110107422, -44.89939880371094, -43.195106506347656, -41.490814208984375, -39.786521911621094, -38.08222961425781, -36.37793731689453, -34.67364501953125, -32.96935272216797, -31.265060424804688, -29.560768127441406, -27.856475830078125, -26.152183532714844, -24.44788932800293, -22.74359703063965, -21.039302825927734, -19.335010528564453, -17.630718231201172, -15.926424980163574, -14.222132682800293, -12.517840385437012, -10.813547134399414, -9.109254837036133, -7.404962539672852, -5.70067024230957, -3.996377468109131, -2.2920846939086914, -0.5877923965454102, 1.116499900817871, 2.8207931518554688, 4.52508544921875, 6.229377746582031, 7.9336700439453125, 9.637962341308594, 11.342255592346191, 13.046547889709473, 14.750840187072754, 16.45513343811035, 18.159425735473633, 19.863718032836914, 21.568010330200195, 23.272302627563477, 24.97659683227539, 26.680889129638672, 28.385181427001953, 30.089473724365234, 31.793766021728516, 33.4980583190918, 35.20235061645508, 36.90664291381836, 38.61093521118164, 40.31522750854492, 42.0195198059082, 43.72381591796875, 45.42810821533203, 47.13240051269531, 48.836692810058594, 50.540985107421875, 52.245277404785156, 53.94956970214844, 55.65386199951172, 57.358154296875, 59.06244659423828, 60.76673889160156]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 3.0, 8.0, 11.0, 11.0, 14.0, 18.0, 16.0, 27.0, 34.0, 32.0, 33.0, 21.0, 48.0, 36.0, 47.0, 38.0, 41.0, 45.0, 42.0, 33.0, 51.0, 41.0, 35.0, 39.0, 42.0, 36.0, 26.0, 23.0, 18.0, 24.0, 15.0, 19.0, 16.0, 16.0, 8.0, 10.0, 8.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.2794189453125, -6.051025390625, -5.8226318359375, -5.59423828125, -5.3658447265625, -5.137451171875, -4.9090576171875, -4.6806640625, -4.4522705078125, -4.223876953125, -3.9954833984375, -3.76708984375, -3.5386962890625, -3.310302734375, -3.0819091796875, -2.853515625, -2.6251220703125, -2.396728515625, -2.1683349609375, -1.93994140625, -1.7115478515625, -1.483154296875, -1.2547607421875, -1.0263671875, -0.7979736328125, -0.569580078125, -0.3411865234375, -0.11279296875, 0.1156005859375, 0.343994140625, 0.5723876953125, 0.80078125, 1.0291748046875, 1.257568359375, 1.4859619140625, 1.71435546875, 1.9427490234375, 2.171142578125, 2.3995361328125, 2.6279296875, 2.8563232421875, 3.084716796875, 3.3131103515625, 3.54150390625, 3.7698974609375, 3.998291015625, 4.2266845703125, 4.455078125, 4.6834716796875, 4.911865234375, 5.1402587890625, 5.36865234375, 5.5970458984375, 5.825439453125, 6.0538330078125, 6.2822265625, 6.5106201171875, 6.739013671875, 6.9674072265625, 7.19580078125, 7.4241943359375, 7.652587890625, 7.8809814453125, 8.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 13.0, 6.0, 13.0, 10.0, 22.0, 24.0, 33.0, 17.0, 48.0, 42.0, 66.0, 110.0, 220.0, 603.0, 2116.0, 20680.0, 1442369.0, 2674540.0, 48384.0, 3341.0, 813.0, 309.0, 159.0, 80.0, 39.0, 40.0, 33.0, 18.0, 17.0, 19.0, 17.0, 18.0, 11.0, 10.0, 10.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.63671875, -20.8671875, -20.09765625, -19.328125, -18.55859375, -17.7890625, -17.01953125, -16.25, -15.48046875, -14.7109375, -13.94140625, -13.171875, -12.40234375, -11.6328125, -10.86328125, -10.09375, -9.32421875, -8.5546875, -7.78515625, -7.015625, -6.24609375, -5.4765625, -4.70703125, -3.9375, -3.16796875, -2.3984375, -1.62890625, -0.859375, -0.08984375, 0.6796875, 1.44921875, 2.21875, 2.98828125, 3.7578125, 4.52734375, 5.296875, 6.06640625, 6.8359375, 7.60546875, 8.375, 9.14453125, 9.9140625, 10.68359375, 11.453125, 12.22265625, 12.9921875, 13.76171875, 14.53125, 15.30078125, 16.0703125, 16.83984375, 17.609375, 18.37890625, 19.1484375, 19.91796875, 20.6875, 21.45703125, 22.2265625, 22.99609375, 23.765625, 24.53515625, 25.3046875, 26.07421875, 26.84375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 6.0, 14.0, 12.0, 13.0, 14.0, 36.0, 42.0, 46.0, 81.0, 99.0, 139.0, 214.0, 319.0, 456.0, 557.0, 570.0, 392.0, 316.0, 222.0, 149.0, 108.0, 85.0, 58.0, 37.0, 29.0, 25.0, 10.0, 11.0, 6.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.828125, -17.3585205078125, -16.888916015625, -16.4193115234375, -15.94970703125, -15.4801025390625, -15.010498046875, -14.5408935546875, -14.0712890625, -13.6016845703125, -13.132080078125, -12.6624755859375, -12.19287109375, -11.7232666015625, -11.253662109375, -10.7840576171875, -10.314453125, -9.8448486328125, -9.375244140625, -8.9056396484375, -8.43603515625, -7.9664306640625, -7.496826171875, -7.0272216796875, -6.5576171875, -6.0880126953125, -5.618408203125, -5.1488037109375, -4.67919921875, -4.2095947265625, -3.739990234375, -3.2703857421875, -2.80078125, -2.3311767578125, -1.861572265625, -1.3919677734375, -0.92236328125, -0.4527587890625, 0.016845703125, 0.4864501953125, 0.9560546875, 1.4256591796875, 1.895263671875, 2.3648681640625, 2.83447265625, 3.3040771484375, 3.773681640625, 4.2432861328125, 4.712890625, 5.1824951171875, 5.652099609375, 6.1217041015625, 6.59130859375, 7.0609130859375, 7.530517578125, 8.0001220703125, 8.4697265625, 8.9393310546875, 9.408935546875, 9.8785400390625, 10.34814453125, 10.8177490234375, 11.287353515625, 11.7569580078125, 12.2265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 19.0, 22.0, 36.0, 44.0, 67.0, 86.0, 124.0, 165.0, 232.0, 322.0, 523.0, 1701.0, 4063190.0, 125500.0, 856.0, 397.0, 269.0, 176.0, 137.0, 104.0, 80.0, 67.0, 49.0, 29.0, 29.0, 20.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.875, -107.8623046875, -104.849609375, -101.8369140625, -98.82421875, -95.8115234375, -92.798828125, -89.7861328125, -86.7734375, -83.7607421875, -80.748046875, -77.7353515625, -74.72265625, -71.7099609375, -68.697265625, -65.6845703125, -62.671875, -59.6591796875, -56.646484375, -53.6337890625, -50.62109375, -47.6083984375, -44.595703125, -41.5830078125, -38.5703125, -35.5576171875, -32.544921875, -29.5322265625, -26.51953125, -23.5068359375, -20.494140625, -17.4814453125, -14.46875, -11.4560546875, -8.443359375, -5.4306640625, -2.41796875, 0.5947265625, 3.607421875, 6.6201171875, 9.6328125, 12.6455078125, 15.658203125, 18.6708984375, 21.68359375, 24.6962890625, 27.708984375, 30.7216796875, 33.734375, 36.7470703125, 39.759765625, 42.7724609375, 45.78515625, 48.7978515625, 51.810546875, 54.8232421875, 57.8359375, 60.8486328125, 63.861328125, 66.8740234375, 69.88671875, 72.8994140625, 75.912109375, 78.9248046875, 81.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 164.0, 574.0, 249.0, 22.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-285.2158508300781, -278.1891784667969, -271.1625061035156, -264.1358337402344, -257.1091613769531, -250.0824737548828, -243.05580139160156, -236.0291290283203, -229.00245666503906, -221.9757843017578, -214.94911193847656, -207.92242431640625, -200.895751953125, -193.86907958984375, -186.8424072265625, -179.81573486328125, -172.7890625, -165.76239013671875, -158.7357177734375, -151.70904541015625, -144.68235778808594, -137.6556854248047, -130.62901306152344, -123.60234069824219, -116.57565307617188, -109.54898071289062, -102.52230072021484, -95.4956283569336, -88.46895599365234, -81.44227600097656, -74.41560363769531, -67.38893127441406, -60.36225891113281, -53.3355827331543, -46.30891036987305, -39.28223419189453, -32.25556182861328, -25.228885650634766, -18.20220947265625, -11.175537109375, -4.148860931396484, 2.8778138160705566, 9.904488563537598, 16.931163787841797, 23.95783805847168, 30.984512329101562, 38.01118850708008, 45.03786087036133, 52.064537048339844, 59.09121322631836, 66.11788940429688, 73.14456176757812, 80.17123413085938, 87.19790649414062, 94.2245864868164, 101.25125885009766, 108.27793884277344, 115.30461120605469, 122.33129119873047, 129.35797119140625, 136.3846435546875, 143.41131591796875, 150.43798828125, 157.46466064453125, 164.4913330078125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 15.0, 10.0, 15.0, 15.0, 11.0, 24.0, 17.0, 27.0, 32.0, 25.0, 21.0, 43.0, 36.0, 26.0, 37.0, 33.0, 35.0, 36.0, 48.0, 38.0, 36.0, 54.0, 47.0, 40.0, 30.0, 28.0, 28.0, 23.0, 21.0, 25.0, 17.0, 8.0, 16.0, 15.0, 14.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.587913513183594, -39.29560470581055, -38.003292083740234, -36.71098327636719, -35.41867446899414, -34.12636184692383, -32.83405303955078, -31.5417423248291, -30.249431610107422, -28.957120895385742, -27.664812088012695, -26.372501373291016, -25.080190658569336, -23.787879943847656, -22.49557113647461, -21.20326042175293, -19.910951614379883, -18.618640899658203, -17.326332092285156, -16.034021377563477, -14.741710662841797, -13.449400901794434, -12.15709114074707, -10.86478042602539, -9.572470664978027, -8.280160903930664, -6.987850189208984, -5.695540428161621, -4.4032301902771, -3.110919952392578, -1.8186101913452148, -0.5262994766235352, 0.7660102844238281, 2.0583205223083496, 3.350630521774292, 4.642940521240234, 5.935250759124756, 7.227560997009277, 8.51987075805664, 9.81218147277832, 11.104491233825684, 12.396800994873047, 13.689111709594727, 14.98142147064209, 16.273731231689453, 17.566041946411133, 18.858352661132812, 20.15066146850586, 21.44297218322754, 22.73528289794922, 24.027591705322266, 25.319902420043945, 26.612213134765625, 27.904521942138672, 29.19683265686035, 30.48914337158203, 31.781452178955078, 33.073760986328125, 34.36607360839844, 35.658382415771484, 36.95069122314453, 38.243003845214844, 39.53531265258789, 40.82762145996094, 42.11993408203125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 5.0, 11.0, 14.0, 15.0, 37.0, 42.0, 55.0, 103.0, 116.0, 186.0, 268.0, 370.0, 499.0, 701.0, 995.0, 1431.0, 2021.0, 2871.0, 4241.0, 6083.0, 8718.0, 12652.0, 18859.0, 29384.0, 45377.0, 72180.0, 115096.0, 191436.0, 198293.0, 121336.0, 75060.0, 47404.0, 29989.0, 20092.0, 13219.0, 8885.0, 6005.0, 4349.0, 2995.0, 2126.0, 1541.0, 1089.0, 713.0, 547.0, 353.0, 240.0, 177.0, 107.0, 79.0, 59.0, 49.0, 24.0, 18.0, 16.0, 17.0, 5.0, 8.0, 3.0, 2.0, 2.0], "bins": [-0.89111328125, -0.8633041381835938, -0.8354949951171875, -0.8076858520507812, -0.779876708984375, -0.7520675659179688, -0.7242584228515625, -0.6964492797851562, -0.66864013671875, -0.6408309936523438, -0.6130218505859375, -0.5852127075195312, -0.557403564453125, -0.5295944213867188, -0.5017852783203125, -0.47397613525390625, -0.4461669921875, -0.41835784912109375, -0.3905487060546875, -0.36273956298828125, -0.334930419921875, -0.30712127685546875, -0.2793121337890625, -0.25150299072265625, -0.22369384765625, -0.19588470458984375, -0.1680755615234375, -0.14026641845703125, -0.112457275390625, -0.08464813232421875, -0.0568389892578125, -0.02902984619140625, -0.001220703125, 0.02658843994140625, 0.0543975830078125, 0.08220672607421875, 0.110015869140625, 0.13782501220703125, 0.1656341552734375, 0.19344329833984375, 0.22125244140625, 0.24906158447265625, 0.2768707275390625, 0.30467987060546875, 0.332489013671875, 0.36029815673828125, 0.3881072998046875, 0.41591644287109375, 0.4437255859375, 0.47153472900390625, 0.4993438720703125, 0.5271530151367188, 0.554962158203125, 0.5827713012695312, 0.6105804443359375, 0.6383895874023438, 0.66619873046875, 0.6940078735351562, 0.7218170166015625, 0.7496261596679688, 0.777435302734375, 0.8052444458007812, 0.8330535888671875, 0.8608627319335938, 0.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 9.0, 4.0, 7.0, 4.0, 4.0, 8.0, 10.0, 9.0, 10.0, 19.0, 19.0, 20.0, 13.0, 28.0, 20.0, 23.0, 20.0, 24.0, 21.0, 26.0, 28.0, 28.0, 32.0, 38.0, 27.0, 1052.0, 27.0, 29.0, 38.0, 36.0, 22.0, 31.0, 41.0, 32.0, 23.0, 28.0, 26.0, 23.0, 25.0, 18.0, 28.0, 21.0, 6.0, 18.0, 11.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.123046875, -3.01348876953125, -2.9039306640625, -2.79437255859375, -2.684814453125, -2.57525634765625, -2.4656982421875, -2.35614013671875, -2.24658203125, -2.13702392578125, -2.0274658203125, -1.91790771484375, -1.808349609375, -1.69879150390625, -1.5892333984375, -1.47967529296875, -1.3701171875, -1.26055908203125, -1.1510009765625, -1.04144287109375, -0.931884765625, -0.82232666015625, -0.7127685546875, -0.60321044921875, -0.49365234375, -0.38409423828125, -0.2745361328125, -0.16497802734375, -0.055419921875, 0.05413818359375, 0.1636962890625, 0.27325439453125, 0.3828125, 0.49237060546875, 0.6019287109375, 0.71148681640625, 0.821044921875, 0.93060302734375, 1.0401611328125, 1.14971923828125, 1.25927734375, 1.36883544921875, 1.4783935546875, 1.58795166015625, 1.697509765625, 1.80706787109375, 1.9166259765625, 2.02618408203125, 2.1357421875, 2.24530029296875, 2.3548583984375, 2.46441650390625, 2.573974609375, 2.68353271484375, 2.7930908203125, 2.90264892578125, 3.01220703125, 3.12176513671875, 3.2313232421875, 3.34088134765625, 3.450439453125, 3.55999755859375, 3.6695556640625, 3.77911376953125, 3.888671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 7.0, 15.0, 13.0, 23.0, 33.0, 43.0, 76.0, 86.0, 165.0, 213.0, 314.0, 485.0, 682.0, 918.0, 1274.0, 1900.0, 2636.0, 3690.0, 5464.0, 7725.0, 11066.0, 15582.0, 23066.0, 34593.0, 51036.0, 79182.0, 126756.0, 1258390.0, 169149.0, 100755.0, 65098.0, 42784.0, 28927.0, 19746.0, 13450.0, 9479.0, 6679.0, 4618.0, 3335.0, 2235.0, 1643.0, 1184.0, 770.0, 597.0, 385.0, 272.0, 197.0, 134.0, 91.0, 55.0, 38.0, 37.0, 23.0, 6.0, 10.0, 4.0, 2.0, 2.0], "bins": [-0.8681640625, -0.8424606323242188, -0.8167572021484375, -0.7910537719726562, -0.765350341796875, -0.7396469116210938, -0.7139434814453125, -0.6882400512695312, -0.66253662109375, -0.6368331909179688, -0.6111297607421875, -0.5854263305664062, -0.559722900390625, -0.5340194702148438, -0.5083160400390625, -0.48261260986328125, -0.4569091796875, -0.43120574951171875, -0.4055023193359375, -0.37979888916015625, -0.354095458984375, -0.32839202880859375, -0.3026885986328125, -0.27698516845703125, -0.25128173828125, -0.22557830810546875, -0.1998748779296875, -0.17417144775390625, -0.148468017578125, -0.12276458740234375, -0.0970611572265625, -0.07135772705078125, -0.045654296875, -0.01995086669921875, 0.0057525634765625, 0.03145599365234375, 0.057159423828125, 0.08286285400390625, 0.1085662841796875, 0.13426971435546875, 0.15997314453125, 0.18567657470703125, 0.2113800048828125, 0.23708343505859375, 0.262786865234375, 0.28849029541015625, 0.3141937255859375, 0.33989715576171875, 0.3656005859375, 0.39130401611328125, 0.4170074462890625, 0.44271087646484375, 0.468414306640625, 0.49411773681640625, 0.5198211669921875, 0.5455245971679688, 0.57122802734375, 0.5969314575195312, 0.6226348876953125, 0.6483383178710938, 0.674041748046875, 0.6997451782226562, 0.7254486083984375, 0.7511520385742188, 0.77685546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 10.0, 14.0, 19.0, 24.0, 26.0, 20.0, 37.0, 38.0, 26.0, 45.0, 64.0, 52.0, 74.0, 63.0, 65.0, 58.0, 54.0, 50.0, 39.0, 30.0, 33.0, 24.0, 28.0, 25.0, 8.0, 16.0, 5.0, 8.0, 7.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0006403923034667969, -0.0006232447922229767, -0.0006060972809791565, -0.0005889497697353363, -0.0005718022584915161, -0.0005546547472476959, -0.0005375072360038757, -0.0005203597247600555, -0.0005032122135162354, -0.00048606470227241516, -0.00046891719102859497, -0.0004517696797847748, -0.0004346221685409546, -0.0004174746572971344, -0.0004003271460533142, -0.000383179634809494, -0.00036603212356567383, -0.00034888461232185364, -0.00033173710107803345, -0.00031458958983421326, -0.00029744207859039307, -0.0002802945673465729, -0.0002631470561027527, -0.0002459995448589325, -0.0002288520336151123, -0.00021170452237129211, -0.00019455701112747192, -0.00017740949988365173, -0.00016026198863983154, -0.00014311447739601135, -0.00012596696615219116, -0.00010881945490837097, -9.167194366455078e-05, -7.452443242073059e-05, -5.73769211769104e-05, -4.022940993309021e-05, -2.308189868927002e-05, -5.934387445449829e-06, 1.1213123798370361e-05, 2.8360635042190552e-05, 4.550814628601074e-05, 6.265565752983093e-05, 7.980316877365112e-05, 9.695068001747131e-05, 0.0001140981912612915, 0.0001312457025051117, 0.00014839321374893188, 0.00016554072499275208, 0.00018268823623657227, 0.00019983574748039246, 0.00021698325872421265, 0.00023413076996803284, 0.00025127828121185303, 0.0002684257924556732, 0.0002855733036994934, 0.0003027208149433136, 0.0003198683261871338, 0.000337015837430954, 0.00035416334867477417, 0.00037131085991859436, 0.00038845837116241455, 0.00040560588240623474, 0.00042275339365005493, 0.0004399009048938751, 0.0004570484161376953]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 3.0, 11.0, 3.0, 7.0, 11.0, 16.0, 17.0, 24.0, 22.0, 35.0, 26.0, 43.0, 44.0, 63.0, 92.0, 149.0, 243.0, 594.0, 4455.0, 1032496.0, 8656.0, 703.0, 259.0, 140.0, 94.0, 75.0, 51.0, 47.0, 31.0, 28.0, 23.0, 23.0, 14.0, 8.0, 15.0, 8.0, 4.0, 7.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010380744934082031, -0.010004043579101562, -0.009627342224121094, -0.009250640869140625, -0.008873939514160156, -0.008497238159179688, -0.008120536804199219, -0.00774383544921875, -0.007367134094238281, -0.0069904327392578125, -0.006613731384277344, -0.006237030029296875, -0.005860328674316406, -0.0054836273193359375, -0.005106925964355469, -0.004730224609375, -0.004353523254394531, -0.0039768218994140625, -0.0036001205444335938, -0.003223419189453125, -0.0028467178344726562, -0.0024700164794921875, -0.0020933151245117188, -0.00171661376953125, -0.0013399124145507812, -0.0009632110595703125, -0.0005865097045898438, -0.000209808349609375, 0.00016689300537109375, 0.0005435943603515625, 0.0009202957153320312, 0.0012969970703125, 0.0016736984252929688, 0.0020503997802734375, 0.0024271011352539062, 0.002803802490234375, 0.0031805038452148438, 0.0035572052001953125, 0.003933906555175781, 0.00431060791015625, 0.004687309265136719, 0.0050640106201171875, 0.005440711975097656, 0.005817413330078125, 0.006194114685058594, 0.0065708160400390625, 0.006947517395019531, 0.00732421875, 0.007700920104980469, 0.008077621459960938, 0.008454322814941406, 0.008831024169921875, 0.009207725524902344, 0.009584426879882812, 0.009961128234863281, 0.01033782958984375, 0.010714530944824219, 0.011091232299804688, 0.011467933654785156, 0.011844635009765625, 0.012221336364746094, 0.012598037719726562, 0.012974739074707031, 0.0133514404296875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 37.0, 287.0, 506.0, 162.0, 16.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024123857729136944, -0.0023662885650992393, -0.0023201913572847843, -0.0022740941494703293, -0.0022279969416558743, -0.0021818997338414192, -0.002135802526026964, -0.002089705318212509, -0.002043608110398054, -0.001997510902583599, -0.001951413694769144, -0.001905316486954689, -0.001859219279140234, -0.001813122071325779, -0.001767024863511324, -0.001720927655696869, -0.0016748305642977357, -0.0016287333564832807, -0.0015826361486688256, -0.0015365389408543706, -0.0014904417330399156, -0.0014443445252254605, -0.0013982474338263273, -0.0013521502260118723, -0.0013060530181974173, -0.0012599558103829622, -0.0012138586025685072, -0.0011677613947540522, -0.0011216641869395971, -0.001075566979125142, -0.001029469771310687, -0.000983372563496232, -0.0009372754138894379, -0.0008911782060749829, -0.0008450809982605278, -0.0007989838486537337, -0.0007528866408392787, -0.0007067894330248237, -0.0006606922252103686, -0.0006145950173959136, -0.0005684978095814586, -0.0005224006017670035, -0.0004763033939525485, -0.00043020621524192393, -0.0003841090074274689, -0.00033801179961301386, -0.0002919146209023893, -0.00024581741308793426, -0.00019972020527347922, -0.0001536229974590242, -0.00010752580419648439, -6.142861093394458e-05, -1.533140311948955e-05, 3.076580469496548e-05, 7.686298340559006e-05, 0.0001229601912200451, 0.00016905739903450012, 0.00021515460684895515, 0.0002612518146634102, 0.00030734899337403476, 0.0003534462011884898, 0.0003995434090029448, 0.0004456405877135694, 0.0004917377955280244, 0.0005378350033424795]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 5.0, 11.0, 8.0, 13.0, 12.0, 18.0, 17.0, 15.0, 20.0, 27.0, 23.0, 29.0, 30.0, 25.0, 36.0, 36.0, 36.0, 33.0, 58.0, 35.0, 36.0, 43.0, 44.0, 33.0, 42.0, 45.0, 27.0, 28.0, 20.0, 30.0, 20.0, 19.0, 14.0, 17.0, 15.0, 10.0, 11.0, 13.0, 6.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00025594234466552734, -0.0002481583505868912, -0.000240374356508255, -0.00023259036242961884, -0.00022480636835098267, -0.0002170223742723465, -0.00020923838019371033, -0.00020145438611507416, -0.000193670392036438, -0.00018588639795780182, -0.00017810240387916565, -0.00017031840980052948, -0.0001625344157218933, -0.00015475042164325714, -0.00014696642756462097, -0.0001391824334859848, -0.00013139843940734863, -0.00012361444532871246, -0.0001158304512500763, -0.00010804645717144012, -0.00010026246309280396, -9.247846901416779e-05, -8.469447493553162e-05, -7.691048085689545e-05, -6.912648677825928e-05, -6.134249269962311e-05, -5.355849862098694e-05, -4.577450454235077e-05, -3.79905104637146e-05, -3.020651638507843e-05, -2.242252230644226e-05, -1.4638528227806091e-05, -6.854534149169922e-06, 9.294599294662476e-07, 8.713454008102417e-06, 1.6497448086738586e-05, 2.4281442165374756e-05, 3.2065436244010925e-05, 3.9849430322647095e-05, 4.7633424401283264e-05, 5.5417418479919434e-05, 6.32014125585556e-05, 7.098540663719177e-05, 7.876940071582794e-05, 8.655339479446411e-05, 9.433738887310028e-05, 0.00010212138295173645, 0.00010990537703037262, 0.00011768937110900879, 0.00012547336518764496, 0.00013325735926628113, 0.0001410413533449173, 0.00014882534742355347, 0.00015660934150218964, 0.0001643933355808258, 0.00017217732965946198, 0.00017996132373809814, 0.00018774531781673431, 0.00019552931189537048, 0.00020331330597400665, 0.00021109730005264282, 0.000218881294131279, 0.00022666528820991516, 0.00023444928228855133, 0.0002422332763671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 8.0, 15.0, 13.0, 12.0, 15.0, 11.0, 23.0, 28.0, 33.0, 32.0, 31.0, 39.0, 42.0, 30.0, 48.0, 35.0, 37.0, 36.0, 35.0, 42.0, 56.0, 41.0, 35.0, 26.0, 24.0, 21.0, 32.0, 26.0, 27.0, 20.0, 29.0, 11.0, 18.0, 12.0, 10.0, 6.0, 7.0, 5.0, 4.0, 7.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.68359375, -6.473876953125, -6.26416015625, -6.054443359375, -5.8447265625, -5.635009765625, -5.42529296875, -5.215576171875, -5.005859375, -4.796142578125, -4.58642578125, -4.376708984375, -4.1669921875, -3.957275390625, -3.74755859375, -3.537841796875, -3.328125, -3.118408203125, -2.90869140625, -2.698974609375, -2.4892578125, -2.279541015625, -2.06982421875, -1.860107421875, -1.650390625, -1.440673828125, -1.23095703125, -1.021240234375, -0.8115234375, -0.601806640625, -0.39208984375, -0.182373046875, 0.02734375, 0.237060546875, 0.44677734375, 0.656494140625, 0.8662109375, 1.075927734375, 1.28564453125, 1.495361328125, 1.705078125, 1.914794921875, 2.12451171875, 2.334228515625, 2.5439453125, 2.753662109375, 2.96337890625, 3.173095703125, 3.3828125, 3.592529296875, 3.80224609375, 4.011962890625, 4.2216796875, 4.431396484375, 4.64111328125, 4.850830078125, 5.060546875, 5.270263671875, 5.47998046875, 5.689697265625, 5.8994140625, 6.109130859375, 6.31884765625, 6.528564453125, 6.73828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 10.0, 7.0, 10.0, 18.0, 14.0, 28.0, 41.0, 50.0, 64.0, 87.0, 103.0, 133.0, 176.0, 316.0, 546.0, 1190.0, 2891.0, 8457.0, 27007.0, 87651.0, 316758.0, 432949.0, 116460.0, 35437.0, 11276.0, 3724.0, 1384.0, 636.0, 300.0, 221.0, 142.0, 120.0, 82.0, 59.0, 51.0, 29.0, 38.0, 27.0, 12.0, 7.0, 9.0, 5.0, 10.0, 6.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.9609375, -6.74420166015625, -6.5274658203125, -6.31072998046875, -6.093994140625, -5.87725830078125, -5.6605224609375, -5.44378662109375, -5.22705078125, -5.01031494140625, -4.7935791015625, -4.57684326171875, -4.360107421875, -4.14337158203125, -3.9266357421875, -3.70989990234375, -3.4931640625, -3.27642822265625, -3.0596923828125, -2.84295654296875, -2.626220703125, -2.40948486328125, -2.1927490234375, -1.97601318359375, -1.75927734375, -1.54254150390625, -1.3258056640625, -1.10906982421875, -0.892333984375, -0.67559814453125, -0.4588623046875, -0.24212646484375, -0.025390625, 0.19134521484375, 0.4080810546875, 0.62481689453125, 0.841552734375, 1.05828857421875, 1.2750244140625, 1.49176025390625, 1.70849609375, 1.92523193359375, 2.1419677734375, 2.35870361328125, 2.575439453125, 2.79217529296875, 3.0089111328125, 3.22564697265625, 3.4423828125, 3.65911865234375, 3.8758544921875, 4.09259033203125, 4.309326171875, 4.52606201171875, 4.7427978515625, 4.95953369140625, 5.17626953125, 5.39300537109375, 5.6097412109375, 5.82647705078125, 6.043212890625, 6.25994873046875, 6.4766845703125, 6.69342041015625, 6.91015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 7.0, 9.0, 11.0, 17.0, 23.0, 26.0, 30.0, 30.0, 31.0, 46.0, 45.0, 32.0, 50.0, 74.0, 119.0, 1814.0, 237.0, 68.0, 49.0, 49.0, 43.0, 36.0, 35.0, 24.0, 26.0, 30.0, 21.0, 15.0, 22.0, 14.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.25, -28.43115234375, -27.6123046875, -26.79345703125, -25.974609375, -25.15576171875, -24.3369140625, -23.51806640625, -22.69921875, -21.88037109375, -21.0615234375, -20.24267578125, -19.423828125, -18.60498046875, -17.7861328125, -16.96728515625, -16.1484375, -15.32958984375, -14.5107421875, -13.69189453125, -12.873046875, -12.05419921875, -11.2353515625, -10.41650390625, -9.59765625, -8.77880859375, -7.9599609375, -7.14111328125, -6.322265625, -5.50341796875, -4.6845703125, -3.86572265625, -3.046875, -2.22802734375, -1.4091796875, -0.59033203125, 0.228515625, 1.04736328125, 1.8662109375, 2.68505859375, 3.50390625, 4.32275390625, 5.1416015625, 5.96044921875, 6.779296875, 7.59814453125, 8.4169921875, 9.23583984375, 10.0546875, 10.87353515625, 11.6923828125, 12.51123046875, 13.330078125, 14.14892578125, 14.9677734375, 15.78662109375, 16.60546875, 17.42431640625, 18.2431640625, 19.06201171875, 19.880859375, 20.69970703125, 21.5185546875, 22.33740234375, 23.15625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 10.0, 6.0, 8.0, 20.0, 23.0, 62.0, 61.0, 81.0, 121.0, 179.0, 297.0, 606.0, 3398.0, 3129633.0, 9421.0, 817.0, 349.0, 201.0, 119.0, 98.0, 61.0, 44.0, 29.0, 23.0, 13.0, 10.0, 8.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.2763671875, -65.802734375, -63.3291015625, -60.85546875, -58.3818359375, -55.908203125, -53.4345703125, -50.9609375, -48.4873046875, -46.013671875, -43.5400390625, -41.06640625, -38.5927734375, -36.119140625, -33.6455078125, -31.171875, -28.6982421875, -26.224609375, -23.7509765625, -21.27734375, -18.8037109375, -16.330078125, -13.8564453125, -11.3828125, -8.9091796875, -6.435546875, -3.9619140625, -1.48828125, 0.9853515625, 3.458984375, 5.9326171875, 8.40625, 10.8798828125, 13.353515625, 15.8271484375, 18.30078125, 20.7744140625, 23.248046875, 25.7216796875, 28.1953125, 30.6689453125, 33.142578125, 35.6162109375, 38.08984375, 40.5634765625, 43.037109375, 45.5107421875, 47.984375, 50.4580078125, 52.931640625, 55.4052734375, 57.87890625, 60.3525390625, 62.826171875, 65.2998046875, 67.7734375, 70.2470703125, 72.720703125, 75.1943359375, 77.66796875, 80.1416015625, 82.615234375, 85.0888671875, 87.5625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 41.0, 667.0, 294.0, 11.0, 1.0, 0.0, 1.0], "bins": [-240.0944366455078, -236.007080078125, -231.91973876953125, -227.83238220214844, -223.74502563476562, -219.65768432617188, -215.57032775878906, -211.48297119140625, -207.3956298828125, -203.3082733154297, -199.22093200683594, -195.13357543945312, -191.0462188720703, -186.9588623046875, -182.87152099609375, -178.78416442871094, -174.69680786132812, -170.6094512939453, -166.52210998535156, -162.43475341796875, -158.34739685058594, -154.26004028320312, -150.17269897460938, -146.08534240722656, -141.99798583984375, -137.91062927246094, -133.8232879638672, -129.73593139648438, -125.64857482910156, -121.56122589111328, -117.473876953125, -113.38652038574219, -109.29917907714844, -105.21183013916016, -101.12447357177734, -97.03712463378906, -92.94976806640625, -88.86241912841797, -84.77507019042969, -80.68771362304688, -76.6003646850586, -72.51301574707031, -68.4256591796875, -64.33831024169922, -60.25095748901367, -56.163604736328125, -52.076255798339844, -47.9889030456543, -43.90155029296875, -39.8141975402832, -35.726844787597656, -31.639495849609375, -27.552143096923828, -23.46479034423828, -19.377439498901367, -15.290088653564453, -11.202737808227539, -7.115386009216309, -3.028034210205078, 1.0593175888061523, 5.146669387817383, 9.23402214050293, 13.321372985839844, 17.408723831176758, 21.496076583862305]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 6.0, 9.0, 11.0, 15.0, 12.0, 6.0, 23.0, 20.0, 26.0, 25.0, 21.0, 24.0, 41.0, 27.0, 35.0, 36.0, 46.0, 38.0, 40.0, 50.0, 42.0, 41.0, 41.0, 38.0, 37.0, 34.0, 27.0, 39.0, 17.0, 23.0, 23.0, 23.0, 15.0, 9.0, 13.0, 13.0, 11.0, 5.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-59.17918395996094, -57.40391540527344, -55.62864685058594, -53.8533821105957, -52.0781135559082, -50.3028450012207, -48.52758026123047, -46.75231170654297, -44.97704315185547, -43.20177459716797, -41.42650604248047, -39.651241302490234, -37.875972747802734, -36.100704193115234, -34.325439453125, -32.5501708984375, -30.77490234375, -28.9996337890625, -27.224367141723633, -25.449100494384766, -23.673831939697266, -21.898563385009766, -20.1232967376709, -18.34803009033203, -16.57276153564453, -14.797493934631348, -13.022226333618164, -11.24695873260498, -9.471691131591797, -7.696423530578613, -5.92115592956543, -4.145888328552246, -2.370624542236328, -0.5953569412231445, 1.179910659790039, 2.9551782608032227, 4.730445861816406, 6.50571346282959, 8.280981063842773, 10.056248664855957, 11.83151626586914, 13.606783866882324, 15.382051467895508, 17.157318115234375, 18.932586669921875, 20.707855224609375, 22.483121871948242, 24.25838851928711, 26.03365707397461, 27.80892562866211, 29.584192276000977, 31.359458923339844, 33.134727478027344, 34.909996032714844, 36.685264587402344, 38.46052932739258, 40.23579788208008, 42.01106643676758, 43.78633117675781, 45.56159973144531, 47.33686828613281, 49.11213684082031, 50.88740539550781, 52.66267013549805, 54.43793869018555]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 6.0, 7.0, 8.0, 9.0, 12.0, 17.0, 19.0, 14.0, 12.0, 26.0, 28.0, 33.0, 37.0, 39.0, 27.0, 39.0, 39.0, 33.0, 39.0, 30.0, 34.0, 43.0, 36.0, 45.0, 37.0, 42.0, 26.0, 21.0, 29.0, 28.0, 21.0, 25.0, 20.0, 21.0, 17.0, 16.0, 12.0, 6.0, 10.0, 7.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.7109375, -6.50421142578125, -6.2974853515625, -6.09075927734375, -5.884033203125, -5.67730712890625, -5.4705810546875, -5.26385498046875, -5.05712890625, -4.85040283203125, -4.6436767578125, -4.43695068359375, -4.230224609375, -4.02349853515625, -3.8167724609375, -3.61004638671875, -3.4033203125, -3.19659423828125, -2.9898681640625, -2.78314208984375, -2.576416015625, -2.36968994140625, -2.1629638671875, -1.95623779296875, -1.74951171875, -1.54278564453125, -1.3360595703125, -1.12933349609375, -0.922607421875, -0.71588134765625, -0.5091552734375, -0.30242919921875, -0.095703125, 0.11102294921875, 0.3177490234375, 0.52447509765625, 0.731201171875, 0.93792724609375, 1.1446533203125, 1.35137939453125, 1.55810546875, 1.76483154296875, 1.9715576171875, 2.17828369140625, 2.385009765625, 2.59173583984375, 2.7984619140625, 3.00518798828125, 3.2119140625, 3.41864013671875, 3.6253662109375, 3.83209228515625, 4.038818359375, 4.24554443359375, 4.4522705078125, 4.65899658203125, 4.86572265625, 5.07244873046875, 5.2791748046875, 5.48590087890625, 5.692626953125, 5.89935302734375, 6.1060791015625, 6.31280517578125, 6.51953125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 6.0, 5.0, 9.0, 6.0, 9.0, 18.0, 12.0, 19.0, 19.0, 31.0, 48.0, 60.0, 75.0, 91.0, 156.0, 202.0, 415.0, 1106.0, 6842.0, 290235.0, 3570370.0, 314713.0, 7392.0, 1223.0, 417.0, 229.0, 126.0, 97.0, 71.0, 63.0, 42.0, 48.0, 23.0, 20.0, 16.0, 8.0, 13.0, 8.0, 7.0, 8.0, 6.0, 7.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.015625, -24.290771484375, -23.56591796875, -22.841064453125, -22.1162109375, -21.391357421875, -20.66650390625, -19.941650390625, -19.216796875, -18.491943359375, -17.76708984375, -17.042236328125, -16.3173828125, -15.592529296875, -14.86767578125, -14.142822265625, -13.41796875, -12.693115234375, -11.96826171875, -11.243408203125, -10.5185546875, -9.793701171875, -9.06884765625, -8.343994140625, -7.619140625, -6.894287109375, -6.16943359375, -5.444580078125, -4.7197265625, -3.994873046875, -3.27001953125, -2.545166015625, -1.8203125, -1.095458984375, -0.37060546875, 0.354248046875, 1.0791015625, 1.803955078125, 2.52880859375, 3.253662109375, 3.978515625, 4.703369140625, 5.42822265625, 6.153076171875, 6.8779296875, 7.602783203125, 8.32763671875, 9.052490234375, 9.77734375, 10.502197265625, 11.22705078125, 11.951904296875, 12.6767578125, 13.401611328125, 14.12646484375, 14.851318359375, 15.576171875, 16.301025390625, 17.02587890625, 17.750732421875, 18.4755859375, 19.200439453125, 19.92529296875, 20.650146484375, 21.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 18.0, 26.0, 38.0, 51.0, 75.0, 77.0, 101.0, 156.0, 230.0, 349.0, 528.0, 580.0, 580.0, 411.0, 252.0, 180.0, 127.0, 86.0, 49.0, 51.0, 30.0, 16.0, 9.0, 13.0, 9.0, 0.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7109375, -14.244873046875, -13.77880859375, -13.312744140625, -12.8466796875, -12.380615234375, -11.91455078125, -11.448486328125, -10.982421875, -10.516357421875, -10.05029296875, -9.584228515625, -9.1181640625, -8.652099609375, -8.18603515625, -7.719970703125, -7.25390625, -6.787841796875, -6.32177734375, -5.855712890625, -5.3896484375, -4.923583984375, -4.45751953125, -3.991455078125, -3.525390625, -3.059326171875, -2.59326171875, -2.127197265625, -1.6611328125, -1.195068359375, -0.72900390625, -0.262939453125, 0.203125, 0.669189453125, 1.13525390625, 1.601318359375, 2.0673828125, 2.533447265625, 2.99951171875, 3.465576171875, 3.931640625, 4.397705078125, 4.86376953125, 5.329833984375, 5.7958984375, 6.261962890625, 6.72802734375, 7.194091796875, 7.66015625, 8.126220703125, 8.59228515625, 9.058349609375, 9.5244140625, 9.990478515625, 10.45654296875, 10.922607421875, 11.388671875, 11.854736328125, 12.32080078125, 12.786865234375, 13.2529296875, 13.718994140625, 14.18505859375, 14.651123046875, 15.1171875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 13.0, 12.0, 16.0, 30.0, 32.0, 53.0, 49.0, 103.0, 104.0, 124.0, 182.0, 255.0, 347.0, 610.0, 3026.0, 4030765.0, 155985.0, 974.0, 373.0, 279.0, 213.0, 135.0, 113.0, 98.0, 85.0, 64.0, 54.0, 50.0, 29.0, 38.0, 14.0, 12.0, 11.0, 13.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-78.4375, -75.8896484375, -73.341796875, -70.7939453125, -68.24609375, -65.6982421875, -63.150390625, -60.6025390625, -58.0546875, -55.5068359375, -52.958984375, -50.4111328125, -47.86328125, -45.3154296875, -42.767578125, -40.2197265625, -37.671875, -35.1240234375, -32.576171875, -30.0283203125, -27.48046875, -24.9326171875, -22.384765625, -19.8369140625, -17.2890625, -14.7412109375, -12.193359375, -9.6455078125, -7.09765625, -4.5498046875, -2.001953125, 0.5458984375, 3.09375, 5.6416015625, 8.189453125, 10.7373046875, 13.28515625, 15.8330078125, 18.380859375, 20.9287109375, 23.4765625, 26.0244140625, 28.572265625, 31.1201171875, 33.66796875, 36.2158203125, 38.763671875, 41.3115234375, 43.859375, 46.4072265625, 48.955078125, 51.5029296875, 54.05078125, 56.5986328125, 59.146484375, 61.6943359375, 64.2421875, 66.7900390625, 69.337890625, 71.8857421875, 74.43359375, 76.9814453125, 79.529296875, 82.0771484375, 84.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 43.0, 274.0, 447.0, 204.0, 34.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.85195922851562, -217.94973754882812, -213.04751586914062, -208.14529418945312, -203.24307250976562, -198.3408660888672, -193.4386444091797, -188.5364227294922, -183.6342010498047, -178.7319793701172, -173.8297576904297, -168.9275360107422, -164.02532958984375, -159.12310791015625, -154.22088623046875, -149.31866455078125, -144.41644287109375, -139.51422119140625, -134.61199951171875, -129.70977783203125, -124.80756378173828, -119.90534210205078, -115.00312805175781, -110.10090637207031, -105.19868469238281, -100.29646301269531, -95.39424133300781, -90.49202728271484, -85.58980560302734, -80.68758392333984, -75.78536987304688, -70.88314819335938, -65.9809341430664, -61.078712463378906, -56.17649459838867, -51.27427673339844, -46.37205505371094, -41.46983337402344, -36.5676155090332, -31.66539764404297, -26.76317596435547, -21.8609561920166, -16.958736419677734, -12.056516647338867, -7.154296875, -2.252077102661133, 2.6501426696777344, 7.552360534667969, 12.454582214355469, 17.356801986694336, 22.259021759033203, 27.16124153137207, 32.06346130371094, 36.96568298339844, 41.86790084838867, 46.770118713378906, 51.672340393066406, 56.574562072753906, 61.47677993774414, 66.37899780273438, 71.28121948242188, 76.18344116210938, 81.08566284179688, 85.98787689208984, 90.89009857177734]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 7.0, 10.0, 10.0, 20.0, 13.0, 22.0, 10.0, 40.0, 25.0, 38.0, 32.0, 29.0, 40.0, 36.0, 40.0, 42.0, 34.0, 38.0, 32.0, 37.0, 44.0, 33.0, 39.0, 34.0, 30.0, 25.0, 37.0, 20.0, 16.0, 21.0, 16.0, 21.0, 13.0, 10.0, 8.0, 13.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-39.63624572753906, -38.40560531616211, -37.17496871948242, -35.94432830810547, -34.71369171142578, -33.48305130004883, -32.252410888671875, -31.021772384643555, -29.791133880615234, -28.560495376586914, -27.329856872558594, -26.09921646118164, -24.86857795715332, -23.637939453125, -22.407299041748047, -21.176660537719727, -19.946022033691406, -18.715383529663086, -17.484745025634766, -16.254104614257812, -15.023466110229492, -13.792827606201172, -12.562188148498535, -11.331548690795898, -10.100910186767578, -8.870271682739258, -7.639632225036621, -6.408993244171143, -5.178354263305664, -3.9477152824401855, -2.717076301574707, -1.4864368438720703, -0.2557945251464844, 0.9748444557189941, 2.2054834365844727, 3.436122417449951, 4.66676139831543, 5.897400379180908, 7.128039360046387, 8.358678817749023, 9.589317321777344, 10.819955825805664, 12.0505952835083, 13.281234741210938, 14.511873245239258, 15.742511749267578, 16.97315216064453, 18.20379066467285, 19.434429168701172, 20.665067672729492, 21.895706176757812, 23.126346588134766, 24.356985092163086, 25.587623596191406, 26.81826400756836, 28.04890251159668, 29.279541015625, 30.51017951965332, 31.74081802368164, 32.971458435058594, 34.20209503173828, 35.432735443115234, 36.66337585449219, 37.894012451171875, 39.12465286254883]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 5.0, 12.0, 10.0, 17.0, 27.0, 42.0, 56.0, 73.0, 99.0, 175.0, 248.0, 360.0, 491.0, 790.0, 1167.0, 1654.0, 2565.0, 3856.0, 5926.0, 9279.0, 14653.0, 23762.0, 38019.0, 63856.0, 108400.0, 192852.0, 236447.0, 137716.0, 79264.0, 47644.0, 28962.0, 17869.0, 11261.0, 7100.0, 4692.0, 3045.0, 1999.0, 1291.0, 941.0, 569.0, 443.0, 284.0, 200.0, 140.0, 95.0, 60.0, 40.0, 24.0, 29.0, 25.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0], "bins": [-1.150390625, -1.115753173828125, -1.08111572265625, -1.046478271484375, -1.0118408203125, -0.977203369140625, -0.94256591796875, -0.907928466796875, -0.873291015625, -0.838653564453125, -0.80401611328125, -0.769378662109375, -0.7347412109375, -0.700103759765625, -0.66546630859375, -0.630828857421875, -0.59619140625, -0.561553955078125, -0.52691650390625, -0.492279052734375, -0.4576416015625, -0.423004150390625, -0.38836669921875, -0.353729248046875, -0.319091796875, -0.284454345703125, -0.24981689453125, -0.215179443359375, -0.1805419921875, -0.145904541015625, -0.11126708984375, -0.076629638671875, -0.0419921875, -0.007354736328125, 0.02728271484375, 0.061920166015625, 0.0965576171875, 0.131195068359375, 0.16583251953125, 0.200469970703125, 0.235107421875, 0.269744873046875, 0.30438232421875, 0.339019775390625, 0.3736572265625, 0.408294677734375, 0.44293212890625, 0.477569580078125, 0.51220703125, 0.546844482421875, 0.58148193359375, 0.616119384765625, 0.6507568359375, 0.685394287109375, 0.72003173828125, 0.754669189453125, 0.789306640625, 0.823944091796875, 0.85858154296875, 0.893218994140625, 0.9278564453125, 0.962493896484375, 0.99713134765625, 1.031768798828125, 1.06640625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 12.0, 14.0, 22.0, 13.0, 16.0, 19.0, 20.0, 27.0, 30.0, 33.0, 38.0, 45.0, 42.0, 50.0, 35.0, 69.0, 1063.0, 56.0, 36.0, 39.0, 41.0, 43.0, 32.0, 44.0, 27.0, 25.0, 17.0, 23.0, 15.0, 23.0, 16.0, 4.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.83648681640625, -4.6807861328125, -4.52508544921875, -4.369384765625, -4.21368408203125, -4.0579833984375, -3.90228271484375, -3.74658203125, -3.59088134765625, -3.4351806640625, -3.27947998046875, -3.123779296875, -2.96807861328125, -2.8123779296875, -2.65667724609375, -2.5009765625, -2.34527587890625, -2.1895751953125, -2.03387451171875, -1.878173828125, -1.72247314453125, -1.5667724609375, -1.41107177734375, -1.25537109375, -1.09967041015625, -0.9439697265625, -0.78826904296875, -0.632568359375, -0.47686767578125, -0.3211669921875, -0.16546630859375, -0.009765625, 0.14593505859375, 0.3016357421875, 0.45733642578125, 0.613037109375, 0.76873779296875, 0.9244384765625, 1.08013916015625, 1.23583984375, 1.39154052734375, 1.5472412109375, 1.70294189453125, 1.858642578125, 2.01434326171875, 2.1700439453125, 2.32574462890625, 2.4814453125, 2.63714599609375, 2.7928466796875, 2.94854736328125, 3.104248046875, 3.25994873046875, 3.4156494140625, 3.57135009765625, 3.72705078125, 3.88275146484375, 4.0384521484375, 4.19415283203125, 4.349853515625, 4.50555419921875, 4.6612548828125, 4.81695556640625, 4.97265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 8.0, 17.0, 25.0, 25.0, 43.0, 72.0, 84.0, 167.0, 222.0, 351.0, 571.0, 829.0, 1403.0, 2175.0, 3327.0, 5270.0, 8255.0, 13209.0, 22526.0, 38718.0, 68479.0, 123478.0, 1290857.0, 235396.0, 119917.0, 66549.0, 37954.0, 21848.0, 12909.0, 8115.0, 5102.0, 3317.0, 2125.0, 1331.0, 902.0, 520.0, 351.0, 223.0, 155.0, 102.0, 64.0, 45.0, 37.0, 17.0, 18.0, 6.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.0279998779296875, -0.992523193359375, -0.9570465087890625, -0.92156982421875, -0.8860931396484375, -0.850616455078125, -0.8151397705078125, -0.7796630859375, -0.7441864013671875, -0.708709716796875, -0.6732330322265625, -0.63775634765625, -0.6022796630859375, -0.566802978515625, -0.5313262939453125, -0.495849609375, -0.4603729248046875, -0.424896240234375, -0.3894195556640625, -0.35394287109375, -0.3184661865234375, -0.282989501953125, -0.2475128173828125, -0.2120361328125, -0.1765594482421875, -0.141082763671875, -0.1056060791015625, -0.07012939453125, -0.0346527099609375, 0.000823974609375, 0.0363006591796875, 0.07177734375, 0.1072540283203125, 0.142730712890625, 0.1782073974609375, 0.21368408203125, 0.2491607666015625, 0.284637451171875, 0.3201141357421875, 0.3555908203125, 0.3910675048828125, 0.426544189453125, 0.4620208740234375, 0.49749755859375, 0.5329742431640625, 0.568450927734375, 0.6039276123046875, 0.639404296875, 0.6748809814453125, 0.710357666015625, 0.7458343505859375, 0.78131103515625, 0.8167877197265625, 0.852264404296875, 0.8877410888671875, 0.9232177734375, 0.9586944580078125, 0.994171142578125, 1.0296478271484375, 1.06512451171875, 1.1006011962890625, 1.136077880859375, 1.1715545654296875, 1.20703125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 3.0, 0.0, 5.0, 4.0, 5.0, 4.0, 10.0, 10.0, 10.0, 18.0, 11.0, 16.0, 25.0, 19.0, 33.0, 36.0, 29.0, 42.0, 49.0, 58.0, 60.0, 49.0, 56.0, 44.0, 46.0, 51.0, 48.0, 45.0, 34.0, 33.0, 23.0, 17.0, 22.0, 16.0, 17.0, 9.0, 13.0, 5.0, 8.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00040340423583984375, -0.00038740038871765137, -0.000371396541595459, -0.0003553926944732666, -0.0003393888473510742, -0.00032338500022888184, -0.00030738115310668945, -0.00029137730598449707, -0.0002753734588623047, -0.0002593696117401123, -0.00024336576461791992, -0.00022736191749572754, -0.00021135807037353516, -0.00019535422325134277, -0.0001793503761291504, -0.000163346529006958, -0.00014734268188476562, -0.00013133883476257324, -0.00011533498764038086, -9.933114051818848e-05, -8.33272933959961e-05, -6.732344627380371e-05, -5.131959915161133e-05, -3.5315752029418945e-05, -1.9311904907226562e-05, -3.3080577850341797e-06, 1.2695789337158203e-05, 2.8699636459350586e-05, 4.470348358154297e-05, 6.070733070373535e-05, 7.671117782592773e-05, 9.271502494812012e-05, 0.0001087188720703125, 0.00012472271919250488, 0.00014072656631469727, 0.00015673041343688965, 0.00017273426055908203, 0.00018873810768127441, 0.0002047419548034668, 0.00022074580192565918, 0.00023674964904785156, 0.00025275349617004395, 0.00026875734329223633, 0.0002847611904144287, 0.0003007650375366211, 0.0003167688846588135, 0.00033277273178100586, 0.00034877657890319824, 0.0003647804260253906, 0.000380784273147583, 0.0003967881202697754, 0.0004127919673919678, 0.00042879581451416016, 0.00044479966163635254, 0.0004608035087585449, 0.0004768073558807373, 0.0004928112030029297, 0.0005088150501251221, 0.0005248188972473145, 0.0005408227443695068, 0.0005568265914916992, 0.0005728304386138916, 0.000588834285736084, 0.0006048381328582764, 0.0006208419799804688]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 7.0, 6.0, 5.0, 19.0, 14.0, 13.0, 27.0, 34.0, 46.0, 56.0, 76.0, 98.0, 146.0, 270.0, 736.0, 43407.0, 1001008.0, 1531.0, 414.0, 197.0, 108.0, 81.0, 59.0, 42.0, 39.0, 29.0, 21.0, 16.0, 11.0, 11.0, 9.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0182037353515625, -0.017739534378051758, -0.017275333404541016, -0.016811132431030273, -0.01634693145751953, -0.01588273048400879, -0.015418529510498047, -0.014954328536987305, -0.014490127563476562, -0.01402592658996582, -0.013561725616455078, -0.013097524642944336, -0.012633323669433594, -0.012169122695922852, -0.01170492172241211, -0.011240720748901367, -0.010776519775390625, -0.010312318801879883, -0.00984811782836914, -0.009383916854858398, -0.008919715881347656, -0.008455514907836914, -0.007991313934326172, -0.00752711296081543, -0.0070629119873046875, -0.006598711013793945, -0.006134510040283203, -0.005670309066772461, -0.005206108093261719, -0.0047419071197509766, -0.004277706146240234, -0.003813505172729492, -0.00334930419921875, -0.002885103225708008, -0.0024209022521972656, -0.0019567012786865234, -0.0014925003051757812, -0.001028299331665039, -0.0005640983581542969, -9.989738464355469e-05, 0.0003643035888671875, 0.0008285045623779297, 0.0012927055358886719, 0.001756906509399414, 0.0022211074829101562, 0.0026853084564208984, 0.0031495094299316406, 0.003613710403442383, 0.004077911376953125, 0.004542112350463867, 0.005006313323974609, 0.0054705142974853516, 0.005934715270996094, 0.006398916244506836, 0.006863117218017578, 0.00732731819152832, 0.0077915191650390625, 0.008255720138549805, 0.008719921112060547, 0.009184122085571289, 0.009648323059082031, 0.010112524032592773, 0.010576725006103516, 0.011040925979614258, 0.011505126953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 16.0, 26.0, 74.0, 132.0, 192.0, 230.0, 164.0, 102.0, 44.0, 17.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005026980652473867, -0.00048484522267244756, -0.0004669924092013389, -0.00044913956662639976, -0.0004312867531552911, -0.00041343391058035195, -0.0003955810680054128, -0.00037772825453430414, -0.00035987544106319547, -0.00034202259848825634, -0.00032416978501714766, -0.00030631694244220853, -0.00028846412897109985, -0.0002706112863961607, -0.0002527584438212216, -0.00023490563035011292, -0.00021705278777517378, -0.00019919995975214988, -0.00018134713172912598, -0.00016349428915418684, -0.00014564147568307817, -0.00012778863310813904, -0.00010993580508511513, -9.208297706209123e-05, -7.423014903906733e-05, -5.6377321016043425e-05, -3.8524489355040714e-05, -2.0671657694038004e-05, -2.8188296710141003e-06, 1.5033998352009803e-05, 3.288683365099132e-05, 5.0739661674015224e-05, 6.859248969703913e-05, 8.644531772006303e-05, 0.00010429814574308693, 0.00012215098831802607, 0.00014000380178913474, 0.00015785664436407387, 0.00017570947238709778, 0.00019356230041012168, 0.00021141512843314558, 0.00022926795645616949, 0.0002471207990311086, 0.0002649736125022173, 0.0002828264550771564, 0.0003006792685482651, 0.00031853211112320423, 0.0003363849245943129, 0.00035423776716925204, 0.00037209060974419117, 0.00038994342321529984, 0.000407796265790239, 0.00042564907926134765, 0.0004435019218362868, 0.00046135473530739546, 0.0004792075778823346, 0.0004970604204572737, 0.0005149132339283824, 0.000532766105607152, 0.0005506189190782607, 0.0005684717325493693, 0.000586324546020478, 0.0006041774176992476, 0.0006220302311703563, 0.000639883044641465]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 12.0, 14.0, 14.0, 26.0, 16.0, 20.0, 32.0, 31.0, 42.0, 23.0, 28.0, 38.0, 41.0, 34.0, 43.0, 50.0, 49.0, 42.0, 35.0, 42.0, 34.0, 31.0, 43.0, 35.0, 27.0, 32.0, 29.0, 21.0, 21.0, 16.0, 14.0, 17.0, 8.0, 8.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00031960010528564453, -0.00031033530831336975, -0.00030107051134109497, -0.0002918057143688202, -0.0002825409173965454, -0.00027327612042427063, -0.00026401132345199585, -0.00025474652647972107, -0.0002454817295074463, -0.0002362169325351715, -0.00022695213556289673, -0.00021768733859062195, -0.00020842254161834717, -0.0001991577446460724, -0.0001898929476737976, -0.00018062815070152283, -0.00017136335372924805, -0.00016209855675697327, -0.00015283375978469849, -0.0001435689628124237, -0.00013430416584014893, -0.00012503936886787415, -0.00011577457189559937, -0.00010650977492332458, -9.72449779510498e-05, -8.798018097877502e-05, -7.871538400650024e-05, -6.945058703422546e-05, -6.0185790061950684e-05, -5.09209930896759e-05, -4.165619611740112e-05, -3.239139914512634e-05, -2.3126602172851562e-05, -1.3861805200576782e-05, -4.597008228302002e-06, 4.667788743972778e-06, 1.3932585716247559e-05, 2.319738268852234e-05, 3.246217966079712e-05, 4.17269766330719e-05, 5.099177360534668e-05, 6.025657057762146e-05, 6.952136754989624e-05, 7.878616452217102e-05, 8.80509614944458e-05, 9.731575846672058e-05, 0.00010658055543899536, 0.00011584535241127014, 0.00012511014938354492, 0.0001343749463558197, 0.00014363974332809448, 0.00015290454030036926, 0.00016216933727264404, 0.00017143413424491882, 0.0001806989312171936, 0.00018996372818946838, 0.00019922852516174316, 0.00020849332213401794, 0.00021775811910629272, 0.0002270229160785675, 0.00023628771305084229, 0.00024555251002311707, 0.00025481730699539185, 0.0002640821039676666, 0.0002733469009399414]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 12.0, 15.0, 18.0, 12.0, 23.0, 28.0, 19.0, 28.0, 27.0, 36.0, 35.0, 44.0, 33.0, 47.0, 46.0, 50.0, 33.0, 39.0, 39.0, 37.0, 33.0, 28.0, 36.0, 39.0, 26.0, 26.0, 26.0, 23.0, 24.0, 14.0, 19.0, 10.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3212890625, -6.099609375, -5.8779296875, -5.65625, -5.4345703125, -5.212890625, -4.9912109375, -4.76953125, -4.5478515625, -4.326171875, -4.1044921875, -3.8828125, -3.6611328125, -3.439453125, -3.2177734375, -2.99609375, -2.7744140625, -2.552734375, -2.3310546875, -2.109375, -1.8876953125, -1.666015625, -1.4443359375, -1.22265625, -1.0009765625, -0.779296875, -0.5576171875, -0.3359375, -0.1142578125, 0.107421875, 0.3291015625, 0.55078125, 0.7724609375, 0.994140625, 1.2158203125, 1.4375, 1.6591796875, 1.880859375, 2.1025390625, 2.32421875, 2.5458984375, 2.767578125, 2.9892578125, 3.2109375, 3.4326171875, 3.654296875, 3.8759765625, 4.09765625, 4.3193359375, 4.541015625, 4.7626953125, 4.984375, 5.2060546875, 5.427734375, 5.6494140625, 5.87109375, 6.0927734375, 6.314453125, 6.5361328125, 6.7578125, 6.9794921875, 7.201171875, 7.4228515625, 7.64453125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 9.0, 6.0, 17.0, 23.0, 21.0, 28.0, 28.0, 50.0, 62.0, 84.0, 101.0, 170.0, 216.0, 370.0, 573.0, 1073.0, 3416.0, 25175.0, 364112.0, 609130.0, 36368.0, 4442.0, 1187.0, 633.0, 373.0, 257.0, 155.0, 107.0, 88.0, 64.0, 58.0, 31.0, 22.0, 28.0, 10.0, 19.0, 16.0, 7.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.1070556640625, -11.690673828125, -11.2742919921875, -10.85791015625, -10.4415283203125, -10.025146484375, -9.6087646484375, -9.1923828125, -8.7760009765625, -8.359619140625, -7.9432373046875, -7.52685546875, -7.1104736328125, -6.694091796875, -6.2777099609375, -5.861328125, -5.4449462890625, -5.028564453125, -4.6121826171875, -4.19580078125, -3.7794189453125, -3.363037109375, -2.9466552734375, -2.5302734375, -2.1138916015625, -1.697509765625, -1.2811279296875, -0.86474609375, -0.4483642578125, -0.031982421875, 0.3843994140625, 0.80078125, 1.2171630859375, 1.633544921875, 2.0499267578125, 2.46630859375, 2.8826904296875, 3.299072265625, 3.7154541015625, 4.1318359375, 4.5482177734375, 4.964599609375, 5.3809814453125, 5.79736328125, 6.2137451171875, 6.630126953125, 7.0465087890625, 7.462890625, 7.8792724609375, 8.295654296875, 8.7120361328125, 9.12841796875, 9.5447998046875, 9.961181640625, 10.3775634765625, 10.7939453125, 11.2103271484375, 11.626708984375, 12.0430908203125, 12.45947265625, 12.8758544921875, 13.292236328125, 13.7086181640625, 14.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 3.0, 10.0, 7.0, 8.0, 9.0, 18.0, 15.0, 10.0, 21.0, 34.0, 23.0, 24.0, 38.0, 41.0, 49.0, 37.0, 58.0, 70.0, 175.0, 1748.0, 157.0, 60.0, 42.0, 49.0, 35.0, 41.0, 43.0, 24.0, 16.0, 29.0, 30.0, 22.0, 13.0, 13.0, 9.0, 10.0, 11.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-22.28125, -21.615234375, -20.94921875, -20.283203125, -19.6171875, -18.951171875, -18.28515625, -17.619140625, -16.953125, -16.287109375, -15.62109375, -14.955078125, -14.2890625, -13.623046875, -12.95703125, -12.291015625, -11.625, -10.958984375, -10.29296875, -9.626953125, -8.9609375, -8.294921875, -7.62890625, -6.962890625, -6.296875, -5.630859375, -4.96484375, -4.298828125, -3.6328125, -2.966796875, -2.30078125, -1.634765625, -0.96875, -0.302734375, 0.36328125, 1.029296875, 1.6953125, 2.361328125, 3.02734375, 3.693359375, 4.359375, 5.025390625, 5.69140625, 6.357421875, 7.0234375, 7.689453125, 8.35546875, 9.021484375, 9.6875, 10.353515625, 11.01953125, 11.685546875, 12.3515625, 13.017578125, 13.68359375, 14.349609375, 15.015625, 15.681640625, 16.34765625, 17.013671875, 17.6796875, 18.345703125, 19.01171875, 19.677734375, 20.34375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 1.0, 3.0, 4.0, 8.0, 5.0, 9.0, 14.0, 14.0, 12.0, 11.0, 17.0, 29.0, 40.0, 26.0, 37.0, 41.0, 71.0, 79.0, 120.0, 186.0, 359.0, 863.0, 14169.0, 3122304.0, 5640.0, 678.0, 293.0, 171.0, 121.0, 74.0, 62.0, 47.0, 31.0, 35.0, 21.0, 19.0, 13.0, 16.0, 11.0, 10.0, 11.0, 8.0, 3.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-61.375, -59.3564453125, -57.337890625, -55.3193359375, -53.30078125, -51.2822265625, -49.263671875, -47.2451171875, -45.2265625, -43.2080078125, -41.189453125, -39.1708984375, -37.15234375, -35.1337890625, -33.115234375, -31.0966796875, -29.078125, -27.0595703125, -25.041015625, -23.0224609375, -21.00390625, -18.9853515625, -16.966796875, -14.9482421875, -12.9296875, -10.9111328125, -8.892578125, -6.8740234375, -4.85546875, -2.8369140625, -0.818359375, 1.2001953125, 3.21875, 5.2373046875, 7.255859375, 9.2744140625, 11.29296875, 13.3115234375, 15.330078125, 17.3486328125, 19.3671875, 21.3857421875, 23.404296875, 25.4228515625, 27.44140625, 29.4599609375, 31.478515625, 33.4970703125, 35.515625, 37.5341796875, 39.552734375, 41.5712890625, 43.58984375, 45.6083984375, 47.626953125, 49.6455078125, 51.6640625, 53.6826171875, 55.701171875, 57.7197265625, 59.73828125, 61.7568359375, 63.775390625, 65.7939453125, 67.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 18.0, 22.0, 37.0, 63.0, 90.0, 118.0, 123.0, 129.0, 132.0, 99.0, 76.0, 49.0, 27.0, 14.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-26.973709106445312, -26.45728874206543, -25.940868377685547, -25.424448013305664, -24.90802764892578, -24.391605377197266, -23.875186920166016, -23.3587646484375, -22.842344284057617, -22.325923919677734, -21.80950355529785, -21.29308319091797, -20.776662826538086, -20.260242462158203, -19.743820190429688, -19.227399826049805, -18.710979461669922, -18.19455909729004, -17.678138732910156, -17.161718368530273, -16.64529800415039, -16.128875732421875, -15.612456321716309, -15.096035957336426, -14.57961654663086, -14.063196182250977, -13.546775817871094, -13.030355453491211, -12.513934135437012, -11.997513771057129, -11.481093406677246, -10.964673042297363, -10.448253631591797, -9.931833267211914, -9.415412902832031, -8.898992538452148, -8.38257122039795, -7.866150856018066, -7.349730491638184, -6.833310127258301, -6.316888809204102, -5.800468444824219, -5.284047603607178, -4.767627239227295, -4.251206398010254, -3.734786033630371, -3.2183656692504883, -2.7019450664520264, -2.1855244636535645, -1.6691038608551025, -1.1526833772659302, -0.6362628936767578, -0.1198422908782959, 0.396578311920166, 0.9129986763000488, 1.4294192790985107, 1.9458398818969727, 2.4622604846954346, 2.9786810874938965, 3.4951014518737793, 4.01152229309082, 4.527942657470703, 5.044363021850586, 5.560783386230469, 6.07720422744751]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 9.0, 7.0, 9.0, 8.0, 9.0, 10.0, 21.0, 11.0, 19.0, 19.0, 25.0, 22.0, 36.0, 31.0, 27.0, 31.0, 31.0, 32.0, 33.0, 40.0, 31.0, 39.0, 38.0, 38.0, 38.0, 36.0, 28.0, 32.0, 29.0, 27.0, 27.0, 27.0, 20.0, 22.0, 18.0, 23.0, 20.0, 13.0, 10.0, 7.0, 6.0, 7.0, 6.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-58.09512710571289, -56.42301559448242, -54.75090789794922, -53.07879638671875, -51.40668487548828, -49.73457717895508, -48.06246566772461, -46.390357971191406, -44.71824645996094, -43.04613494873047, -41.374027252197266, -39.7019157409668, -38.029808044433594, -36.357696533203125, -34.685585021972656, -33.01347351074219, -31.341365814208984, -29.66925621032715, -27.997146606445312, -26.325035095214844, -24.652925491333008, -22.980815887451172, -21.308704376220703, -19.636594772338867, -17.96448516845703, -16.292375564575195, -14.620265007019043, -12.94815444946289, -11.276044845581055, -9.603935241699219, -7.931824684143066, -6.259714126586914, -4.587608337402344, -2.9154982566833496, -1.2433881759643555, 0.42872190475463867, 2.100831985473633, 3.7729415893554688, 5.445052146911621, 7.117162704467773, 8.78927230834961, 10.461381912231445, 12.133492469787598, 13.80560302734375, 15.477712631225586, 17.149822235107422, 18.82193374633789, 20.494043350219727, 22.166152954101562, 23.8382625579834, 25.510372161865234, 27.182483673095703, 28.85459327697754, 30.526702880859375, 32.198814392089844, 33.87092590332031, 35.543033599853516, 37.215145111083984, 38.88725280761719, 40.559364318847656, 42.231475830078125, 43.90358352661133, 45.5756950378418, 47.247802734375, 48.91991424560547]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 3.0, 7.0, 8.0, 15.0, 12.0, 11.0, 26.0, 25.0, 29.0, 19.0, 28.0, 33.0, 29.0, 41.0, 37.0, 47.0, 43.0, 43.0, 53.0, 49.0, 33.0, 37.0, 38.0, 42.0, 29.0, 37.0, 26.0, 27.0, 27.0, 35.0, 20.0, 12.0, 19.0, 16.0, 11.0, 8.0, 8.0, 4.0, 7.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5859375, -7.341552734375, -7.09716796875, -6.852783203125, -6.6083984375, -6.364013671875, -6.11962890625, -5.875244140625, -5.630859375, -5.386474609375, -5.14208984375, -4.897705078125, -4.6533203125, -4.408935546875, -4.16455078125, -3.920166015625, -3.67578125, -3.431396484375, -3.18701171875, -2.942626953125, -2.6982421875, -2.453857421875, -2.20947265625, -1.965087890625, -1.720703125, -1.476318359375, -1.23193359375, -0.987548828125, -0.7431640625, -0.498779296875, -0.25439453125, -0.010009765625, 0.234375, 0.478759765625, 0.72314453125, 0.967529296875, 1.2119140625, 1.456298828125, 1.70068359375, 1.945068359375, 2.189453125, 2.433837890625, 2.67822265625, 2.922607421875, 3.1669921875, 3.411376953125, 3.65576171875, 3.900146484375, 4.14453125, 4.388916015625, 4.63330078125, 4.877685546875, 5.1220703125, 5.366455078125, 5.61083984375, 5.855224609375, 6.099609375, 6.343994140625, 6.58837890625, 6.832763671875, 7.0771484375, 7.321533203125, 7.56591796875, 7.810302734375, 8.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 17.0, 15.0, 22.0, 24.0, 32.0, 57.0, 68.0, 103.0, 139.0, 246.0, 441.0, 781.0, 1879.0, 5200.0, 18019.0, 81141.0, 416757.0, 1360626.0, 1578434.0, 578609.0, 115101.0, 24645.0, 7009.0, 2524.0, 1030.0, 500.0, 256.0, 159.0, 132.0, 72.0, 61.0, 38.0, 46.0, 21.0, 19.0, 11.0, 8.0, 14.0, 2.0, 5.0, 9.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.53125, -10.2396240234375, -9.947998046875, -9.6563720703125, -9.36474609375, -9.0731201171875, -8.781494140625, -8.4898681640625, -8.1982421875, -7.9066162109375, -7.614990234375, -7.3233642578125, -7.03173828125, -6.7401123046875, -6.448486328125, -6.1568603515625, -5.865234375, -5.5736083984375, -5.281982421875, -4.9903564453125, -4.69873046875, -4.4071044921875, -4.115478515625, -3.8238525390625, -3.5322265625, -3.2406005859375, -2.948974609375, -2.6573486328125, -2.36572265625, -2.0740966796875, -1.782470703125, -1.4908447265625, -1.19921875, -0.9075927734375, -0.615966796875, -0.3243408203125, -0.03271484375, 0.2589111328125, 0.550537109375, 0.8421630859375, 1.1337890625, 1.4254150390625, 1.717041015625, 2.0086669921875, 2.30029296875, 2.5919189453125, 2.883544921875, 3.1751708984375, 3.466796875, 3.7584228515625, 4.050048828125, 4.3416748046875, 4.63330078125, 4.9249267578125, 5.216552734375, 5.5081787109375, 5.7998046875, 6.0914306640625, 6.383056640625, 6.6746826171875, 6.96630859375, 7.2579345703125, 7.549560546875, 7.8411865234375, 8.1328125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 5.0, 12.0, 5.0, 4.0, 18.0, 27.0, 29.0, 39.0, 42.0, 45.0, 62.0, 78.0, 93.0, 133.0, 140.0, 206.0, 234.0, 297.0, 304.0, 372.0, 352.0, 298.0, 254.0, 188.0, 175.0, 124.0, 106.0, 84.0, 74.0, 61.0, 41.0, 38.0, 32.0, 24.0, 15.0, 15.0, 10.0, 9.0, 10.0, 5.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.390625, -12.0433349609375, -11.696044921875, -11.3487548828125, -11.00146484375, -10.6541748046875, -10.306884765625, -9.9595947265625, -9.6123046875, -9.2650146484375, -8.917724609375, -8.5704345703125, -8.22314453125, -7.8758544921875, -7.528564453125, -7.1812744140625, -6.833984375, -6.4866943359375, -6.139404296875, -5.7921142578125, -5.44482421875, -5.0975341796875, -4.750244140625, -4.4029541015625, -4.0556640625, -3.7083740234375, -3.361083984375, -3.0137939453125, -2.66650390625, -2.3192138671875, -1.971923828125, -1.6246337890625, -1.27734375, -0.9300537109375, -0.582763671875, -0.2354736328125, 0.11181640625, 0.4591064453125, 0.806396484375, 1.1536865234375, 1.5009765625, 1.8482666015625, 2.195556640625, 2.5428466796875, 2.89013671875, 3.2374267578125, 3.584716796875, 3.9320068359375, 4.279296875, 4.6265869140625, 4.973876953125, 5.3211669921875, 5.66845703125, 6.0157470703125, 6.363037109375, 6.7103271484375, 7.0576171875, 7.4049072265625, 7.752197265625, 8.0994873046875, 8.44677734375, 8.7940673828125, 9.141357421875, 9.4886474609375, 9.8359375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 7.0, 7.0, 13.0, 14.0, 22.0, 29.0, 26.0, 46.0, 60.0, 86.0, 87.0, 108.0, 138.0, 188.0, 218.0, 280.0, 404.0, 700.0, 2289.0, 155133.0, 4018232.0, 12902.0, 1253.0, 500.0, 344.0, 228.0, 181.0, 154.0, 135.0, 100.0, 87.0, 63.0, 54.0, 45.0, 35.0, 33.0, 15.0, 15.0, 21.0, 9.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.5625, -62.68017578125, -60.7978515625, -58.91552734375, -57.033203125, -55.15087890625, -53.2685546875, -51.38623046875, -49.50390625, -47.62158203125, -45.7392578125, -43.85693359375, -41.974609375, -40.09228515625, -38.2099609375, -36.32763671875, -34.4453125, -32.56298828125, -30.6806640625, -28.79833984375, -26.916015625, -25.03369140625, -23.1513671875, -21.26904296875, -19.38671875, -17.50439453125, -15.6220703125, -13.73974609375, -11.857421875, -9.97509765625, -8.0927734375, -6.21044921875, -4.328125, -2.44580078125, -0.5634765625, 1.31884765625, 3.201171875, 5.08349609375, 6.9658203125, 8.84814453125, 10.73046875, 12.61279296875, 14.4951171875, 16.37744140625, 18.259765625, 20.14208984375, 22.0244140625, 23.90673828125, 25.7890625, 27.67138671875, 29.5537109375, 31.43603515625, 33.318359375, 35.20068359375, 37.0830078125, 38.96533203125, 40.84765625, 42.72998046875, 44.6123046875, 46.49462890625, 48.376953125, 50.25927734375, 52.1416015625, 54.02392578125, 55.90625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 55.0, 113.0, 245.0, 274.0, 191.0, 87.0, 30.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.8114242553711, -97.7901382446289, -94.76885986328125, -91.74757385253906, -88.72628784179688, -85.70500183105469, -82.68372344970703, -79.66243743896484, -76.64115142822266, -73.61986541748047, -70.59858703613281, -67.57730102539062, -64.55601501464844, -61.534732818603516, -58.513450622558594, -55.492164611816406, -52.470882415771484, -49.44960021972656, -46.428314208984375, -43.40703201293945, -40.385746002197266, -37.364463806152344, -34.343177795410156, -31.321895599365234, -28.30061149597168, -25.279327392578125, -22.25804328918457, -19.236759185791016, -16.215476989746094, -13.194191932678223, -10.172908782958984, -7.15162467956543, -4.130340576171875, -1.1090567111968994, 1.9122271537780762, 4.933510780334473, 7.954794883728027, 10.976078987121582, 13.99736213684082, 17.018646240234375, 20.03993034362793, 23.061214447021484, 26.08249855041504, 29.103782653808594, 32.125064849853516, 35.1463508605957, 38.167633056640625, 41.18891906738281, 44.210201263427734, 47.231483459472656, 50.252769470214844, 53.274051666259766, 56.29533767700195, 59.316619873046875, 62.33790588378906, 65.35919189453125, 68.3804702758789, 71.4017562866211, 74.42303466796875, 77.44432067871094, 80.46560668945312, 83.48689270019531, 86.50817108154297, 89.52945709228516, 92.55074310302734]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 9.0, 9.0, 19.0, 10.0, 23.0, 13.0, 19.0, 21.0, 23.0, 27.0, 30.0, 30.0, 35.0, 31.0, 36.0, 36.0, 42.0, 41.0, 40.0, 42.0, 40.0, 35.0, 34.0, 36.0, 30.0, 23.0, 21.0, 34.0, 14.0, 24.0, 27.0, 19.0, 16.0, 17.0, 9.0, 6.0, 15.0, 10.0, 6.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-42.974578857421875, -41.634178161621094, -40.29378128051758, -38.95338439941406, -37.61298370361328, -36.2725830078125, -34.932186126708984, -33.59178924560547, -32.25138854980469, -30.91098976135254, -29.57059097290039, -28.230192184448242, -26.889793395996094, -25.549394607543945, -24.208995819091797, -22.86859703063965, -21.5281982421875, -20.18779945373535, -18.847400665283203, -17.507001876831055, -16.166603088378906, -14.826204299926758, -13.48580551147461, -12.145406723022461, -10.805007934570312, -9.464609146118164, -8.124210357666016, -6.783811569213867, -5.443412780761719, -4.10301399230957, -2.762615203857422, -1.4222164154052734, -0.081817626953125, 1.2585811614990234, 2.598979949951172, 3.9393787384033203, 5.279777526855469, 6.620176315307617, 7.960575103759766, 9.300973892211914, 10.641372680664062, 11.981771469116211, 13.32217025756836, 14.662569046020508, 16.002967834472656, 17.343366622924805, 18.683765411376953, 20.0241641998291, 21.36456298828125, 22.7049617767334, 24.045360565185547, 25.385759353637695, 26.726158142089844, 28.066556930541992, 29.40695571899414, 30.74735450744629, 32.08775329589844, 33.42815399169922, 34.768550872802734, 36.10894775390625, 37.44934844970703, 38.78974914550781, 40.13014602661133, 41.470542907714844, 42.810943603515625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 38.0, 29.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 14.0, 11.0, 19.0, 21.0, 38.0, 50.0, 91.0, 96.0, 179.0, 260.0, 397.0, 595.0, 921.0, 1399.0, 2105.0, 3267.0, 5011.0, 7685.0, 11946.0, 18854.0, 30442.0, 49725.0, 83379.0, 140386.0, 236192.0, 181602.0, 106525.0, 63446.0, 38736.0, 23339.0, 14738.0, 9397.0, 5954.0, 4087.0, 2549.0, 1739.0, 1120.0, 776.0, 476.0, 316.0, 214.0, 155.0, 105.0, 61.0, 55.0, 25.0, 25.0, 15.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0], "bins": [-1.177734375, -1.143829345703125, -1.10992431640625, -1.076019287109375, -1.0421142578125, -1.008209228515625, -0.97430419921875, -0.940399169921875, -0.906494140625, -0.872589111328125, -0.83868408203125, -0.804779052734375, -0.7708740234375, -0.736968994140625, -0.70306396484375, -0.669158935546875, -0.63525390625, -0.601348876953125, -0.56744384765625, -0.533538818359375, -0.4996337890625, -0.465728759765625, -0.43182373046875, -0.397918701171875, -0.364013671875, -0.330108642578125, -0.29620361328125, -0.262298583984375, -0.2283935546875, -0.194488525390625, -0.16058349609375, -0.126678466796875, -0.0927734375, -0.058868408203125, -0.02496337890625, 0.008941650390625, 0.0428466796875, 0.076751708984375, 0.11065673828125, 0.144561767578125, 0.178466796875, 0.212371826171875, 0.24627685546875, 0.280181884765625, 0.3140869140625, 0.347991943359375, 0.38189697265625, 0.415802001953125, 0.44970703125, 0.483612060546875, 0.51751708984375, 0.551422119140625, 0.5853271484375, 0.619232177734375, 0.65313720703125, 0.687042236328125, 0.720947265625, 0.754852294921875, 0.78875732421875, 0.822662353515625, 0.8565673828125, 0.890472412109375, 0.92437744140625, 0.958282470703125, 0.9921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 4.0, 10.0, 12.0, 14.0, 10.0, 12.0, 17.0, 20.0, 22.0, 17.0, 33.0, 26.0, 28.0, 28.0, 20.0, 34.0, 27.0, 31.0, 35.0, 32.0, 1058.0, 34.0, 43.0, 34.0, 47.0, 37.0, 39.0, 26.0, 26.0, 23.0, 29.0, 27.0, 25.0, 20.0, 20.0, 15.0, 18.0, 13.0, 10.0, 8.0, 3.0, 7.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-4.2265625, -4.101776123046875, -3.97698974609375, -3.852203369140625, -3.7274169921875, -3.602630615234375, -3.47784423828125, -3.353057861328125, -3.228271484375, -3.103485107421875, -2.97869873046875, -2.853912353515625, -2.7291259765625, -2.604339599609375, -2.47955322265625, -2.354766845703125, -2.22998046875, -2.105194091796875, -1.98040771484375, -1.855621337890625, -1.7308349609375, -1.606048583984375, -1.48126220703125, -1.356475830078125, -1.231689453125, -1.106903076171875, -0.98211669921875, -0.857330322265625, -0.7325439453125, -0.607757568359375, -0.48297119140625, -0.358184814453125, -0.2333984375, -0.108612060546875, 0.01617431640625, 0.140960693359375, 0.2657470703125, 0.390533447265625, 0.51531982421875, 0.640106201171875, 0.764892578125, 0.889678955078125, 1.01446533203125, 1.139251708984375, 1.2640380859375, 1.388824462890625, 1.51361083984375, 1.638397216796875, 1.76318359375, 1.887969970703125, 2.01275634765625, 2.137542724609375, 2.2623291015625, 2.387115478515625, 2.51190185546875, 2.636688232421875, 2.761474609375, 2.886260986328125, 3.01104736328125, 3.135833740234375, 3.2606201171875, 3.385406494140625, 3.51019287109375, 3.634979248046875, 3.759765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 8.0, 8.0, 22.0, 37.0, 48.0, 64.0, 110.0, 152.0, 225.0, 346.0, 506.0, 697.0, 1035.0, 1610.0, 2275.0, 3166.0, 4654.0, 6856.0, 10163.0, 14832.0, 21779.0, 33249.0, 50151.0, 77952.0, 127717.0, 1267885.0, 176097.0, 102730.0, 64591.0, 42067.0, 27772.0, 18826.0, 12480.0, 8484.0, 5906.0, 3951.0, 2748.0, 1874.0, 1280.0, 904.0, 621.0, 390.0, 320.0, 178.0, 117.0, 80.0, 59.0, 39.0, 23.0, 15.0, 14.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.923828125, -0.8956527709960938, -0.8674774169921875, -0.8393020629882812, -0.811126708984375, -0.7829513549804688, -0.7547760009765625, -0.7266006469726562, -0.69842529296875, -0.6702499389648438, -0.6420745849609375, -0.6138992309570312, -0.585723876953125, -0.5575485229492188, -0.5293731689453125, -0.5011978149414062, -0.4730224609375, -0.44484710693359375, -0.4166717529296875, -0.38849639892578125, -0.360321044921875, -0.33214569091796875, -0.3039703369140625, -0.27579498291015625, -0.24761962890625, -0.21944427490234375, -0.1912689208984375, -0.16309356689453125, -0.134918212890625, -0.10674285888671875, -0.0785675048828125, -0.05039215087890625, -0.022216796875, 0.00595855712890625, 0.0341339111328125, 0.06230926513671875, 0.090484619140625, 0.11865997314453125, 0.1468353271484375, 0.17501068115234375, 0.20318603515625, 0.23136138916015625, 0.2595367431640625, 0.28771209716796875, 0.315887451171875, 0.34406280517578125, 0.3722381591796875, 0.40041351318359375, 0.4285888671875, 0.45676422119140625, 0.4849395751953125, 0.5131149291992188, 0.541290283203125, 0.5694656372070312, 0.5976409912109375, 0.6258163452148438, 0.65399169921875, 0.6821670532226562, 0.7103424072265625, 0.7385177612304688, 0.766693115234375, 0.7948684692382812, 0.8230438232421875, 0.8512191772460938, 0.87939453125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 10.0, 11.0, 19.0, 21.0, 28.0, 26.0, 30.0, 24.0, 45.0, 53.0, 52.0, 44.0, 64.0, 51.0, 53.0, 39.0, 55.0, 48.0, 44.0, 28.0, 27.0, 28.0, 36.0, 24.0, 23.0, 14.0, 13.0, 13.0, 9.0, 9.0, 5.0, 8.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004916191101074219, -0.00047466158866882324, -0.0004577040672302246, -0.000440746545791626, -0.00042378902435302734, -0.0004068315029144287, -0.0003898739814758301, -0.00037291646003723145, -0.0003559589385986328, -0.0003390014171600342, -0.00032204389572143555, -0.0003050863742828369, -0.0002881288528442383, -0.00027117133140563965, -0.000254213809967041, -0.00023725628852844238, -0.00022029876708984375, -0.00020334124565124512, -0.00018638372421264648, -0.00016942620277404785, -0.00015246868133544922, -0.00013551115989685059, -0.00011855363845825195, -0.00010159611701965332, -8.463859558105469e-05, -6.768107414245605e-05, -5.072355270385742e-05, -3.376603126525879e-05, -1.6808509826660156e-05, 1.4901161193847656e-07, 1.710653305053711e-05, 3.406405448913574e-05, 5.1021575927734375e-05, 6.797909736633301e-05, 8.493661880493164e-05, 0.00010189414024353027, 0.0001188516616821289, 0.00013580918312072754, 0.00015276670455932617, 0.0001697242259979248, 0.00018668174743652344, 0.00020363926887512207, 0.0002205967903137207, 0.00023755431175231934, 0.00025451183319091797, 0.0002714693546295166, 0.00028842687606811523, 0.00030538439750671387, 0.0003223419189453125, 0.00033929944038391113, 0.00035625696182250977, 0.0003732144832611084, 0.00039017200469970703, 0.00040712952613830566, 0.0004240870475769043, 0.00044104456901550293, 0.00045800209045410156, 0.0004749596118927002, 0.0004919171333312988, 0.0005088746547698975, 0.0005258321762084961, 0.0005427896976470947, 0.0005597472190856934, 0.000576704740524292, 0.0005936622619628906]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 5.0, 9.0, 8.0, 7.0, 16.0, 8.0, 23.0, 14.0, 25.0, 27.0, 38.0, 40.0, 57.0, 68.0, 95.0, 142.0, 245.0, 496.0, 1596.0, 903343.0, 140159.0, 1022.0, 412.0, 167.0, 125.0, 84.0, 59.0, 45.0, 41.0, 35.0, 27.0, 22.0, 17.0, 13.0, 15.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012794256210327148, -0.012404918670654297, -0.012015581130981445, -0.011626243591308594, -0.011236906051635742, -0.01084756851196289, -0.010458230972290039, -0.010068893432617188, -0.009679555892944336, -0.009290218353271484, -0.008900880813598633, -0.008511543273925781, -0.00812220573425293, -0.007732868194580078, -0.0073435306549072266, -0.006954193115234375, -0.0065648555755615234, -0.006175518035888672, -0.00578618049621582, -0.005396842956542969, -0.005007505416870117, -0.004618167877197266, -0.004228830337524414, -0.0038394927978515625, -0.003450155258178711, -0.0030608177185058594, -0.002671480178833008, -0.0022821426391601562, -0.0018928050994873047, -0.0015034675598144531, -0.0011141300201416016, -0.00072479248046875, -0.00033545494079589844, 5.3882598876953125e-05, 0.0004432201385498047, 0.0008325576782226562, 0.0012218952178955078, 0.0016112327575683594, 0.002000570297241211, 0.0023899078369140625, 0.002779245376586914, 0.0031685829162597656, 0.003557920455932617, 0.003947257995605469, 0.00433659553527832, 0.004725933074951172, 0.0051152706146240234, 0.005504608154296875, 0.0058939456939697266, 0.006283283233642578, 0.00667262077331543, 0.007061958312988281, 0.007451295852661133, 0.007840633392333984, 0.008229970932006836, 0.008619308471679688, 0.009008646011352539, 0.00939798355102539, 0.009787321090698242, 0.010176658630371094, 0.010565996170043945, 0.010955333709716797, 0.011344671249389648, 0.0117340087890625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 75.0, 728.0, 208.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004281291738152504, -0.004202988464385271, -0.004124685190618038, -0.004046381916850805, -0.003968078643083572, -0.003889775602146983, -0.003811472561210394, -0.003733169287443161, -0.003654866013675928, -0.0035765627399086952, -0.0034982594661414623, -0.003419956425204873, -0.00334165315143764, -0.0032633498776704073, -0.003185046836733818, -0.003106743562966585, -0.0030284402891993523, -0.0029501370154321194, -0.0028718337416648865, -0.0027935307007282972, -0.0027152274269610643, -0.0026369241531938314, -0.002558621112257242, -0.0024803178384900093, -0.0024020145647227764, -0.0023237112909555435, -0.0022454080171883106, -0.0021671049762517214, -0.0020888017024844885, -0.0020104984287172556, -0.0019321952713653445, -0.0018538921140134335, -0.0017755888402462006, -0.0016972855664789677, -0.0016189824091270566, -0.0015406792517751455, -0.0014623759780079126, -0.0013840727042406797, -0.0013057695468887687, -0.0012274663895368576, -0.0011491631157696247, -0.0010708598420023918, -0.0009925566846504807, -0.0009142534690909088, -0.0008359502535313368, -0.0007576470379717648, -0.0006793438224121928, -0.0006010406068526208, -0.0005227374495007098, -0.0004444342339411378, -0.0003661310183815658, -0.00028782780282199383, -0.00020952458726242185, -0.00013122137170284986, -5.2918156143277884e-05, 2.5385059416294098e-05, 0.00010368827497586608, 0.00018199149053543806, 0.00026029470609501004, 0.000338597921654582, 0.000416901137214154, 0.000495204352773726, 0.000573507568333298, 0.00065181078389287, 0.0007301139994524419]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 4.0, 9.0, 13.0, 19.0, 14.0, 16.0, 20.0, 20.0, 27.0, 32.0, 32.0, 33.0, 39.0, 28.0, 34.0, 38.0, 38.0, 50.0, 27.0, 42.0, 41.0, 24.0, 33.0, 45.0, 41.0, 32.0, 36.0, 36.0, 28.0, 16.0, 16.0, 15.0, 15.0, 13.0, 6.0, 14.0, 16.0, 12.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026291608810424805, -0.000253492034971714, -0.00024406798183918, -0.00023464392870664597, -0.00022521987557411194, -0.0002157958224415779, -0.00020637176930904388, -0.00019694771617650986, -0.00018752366304397583, -0.0001780996099114418, -0.00016867555677890778, -0.00015925150364637375, -0.00014982745051383972, -0.0001404033973813057, -0.00013097934424877167, -0.00012155529111623764, -0.00011213123798370361, -0.00010270718485116959, -9.328313171863556e-05, -8.385907858610153e-05, -7.44350254535675e-05, -6.501097232103348e-05, -5.558691918849945e-05, -4.6162866055965424e-05, -3.6738812923431396e-05, -2.731475979089737e-05, -1.7890706658363342e-05, -8.466653525829315e-06, 9.57399606704712e-07, 1.0381452739238739e-05, 1.9805505871772766e-05, 2.9229559004306793e-05, 3.865361213684082e-05, 4.807766526937485e-05, 5.7501718401908875e-05, 6.69257715344429e-05, 7.634982466697693e-05, 8.577387779951096e-05, 9.519793093204498e-05, 0.00010462198406457901, 0.00011404603719711304, 0.00012347009032964706, 0.0001328941434621811, 0.00014231819659471512, 0.00015174224972724915, 0.00016116630285978317, 0.0001705903559923172, 0.00018001440912485123, 0.00018943846225738525, 0.00019886251538991928, 0.0002082865685224533, 0.00021771062165498734, 0.00022713467478752136, 0.0002365587279200554, 0.0002459827810525894, 0.00025540683418512344, 0.00026483088731765747, 0.0002742549404501915, 0.0002836789935827255, 0.00029310304671525955, 0.0003025270998477936, 0.0003119511529803276, 0.00032137520611286163, 0.00033079925924539566, 0.0003402233123779297]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 10.0, 11.0, 17.0, 13.0, 16.0, 15.0, 18.0, 19.0, 29.0, 26.0, 39.0, 28.0, 24.0, 37.0, 31.0, 28.0, 41.0, 38.0, 47.0, 35.0, 46.0, 33.0, 35.0, 27.0, 29.0, 26.0, 28.0, 21.0, 34.0, 18.0, 30.0, 12.0, 25.0, 13.0, 10.0, 11.0, 11.0, 14.0, 5.0, 6.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703125, -5.50262451171875, -5.3021240234375, -5.10162353515625, -4.901123046875, -4.70062255859375, -4.5001220703125, -4.29962158203125, -4.09912109375, -3.89862060546875, -3.6981201171875, -3.49761962890625, -3.297119140625, -3.09661865234375, -2.8961181640625, -2.69561767578125, -2.4951171875, -2.29461669921875, -2.0941162109375, -1.89361572265625, -1.693115234375, -1.49261474609375, -1.2921142578125, -1.09161376953125, -0.89111328125, -0.69061279296875, -0.4901123046875, -0.28961181640625, -0.089111328125, 0.11138916015625, 0.3118896484375, 0.51239013671875, 0.712890625, 0.91339111328125, 1.1138916015625, 1.31439208984375, 1.514892578125, 1.71539306640625, 1.9158935546875, 2.11639404296875, 2.31689453125, 2.51739501953125, 2.7178955078125, 2.91839599609375, 3.118896484375, 3.31939697265625, 3.5198974609375, 3.72039794921875, 3.9208984375, 4.12139892578125, 4.3218994140625, 4.52239990234375, 4.722900390625, 4.92340087890625, 5.1239013671875, 5.32440185546875, 5.52490234375, 5.72540283203125, 5.9259033203125, 6.12640380859375, 6.326904296875, 6.52740478515625, 6.7279052734375, 6.92840576171875, 7.12890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 6.0, 12.0, 10.0, 20.0, 24.0, 26.0, 32.0, 27.0, 39.0, 72.0, 110.0, 150.0, 310.0, 567.0, 1153.0, 2482.0, 5271.0, 11522.0, 25285.0, 56511.0, 135683.0, 335220.0, 280620.0, 108054.0, 46079.0, 21153.0, 9485.0, 4291.0, 2007.0, 1025.0, 472.0, 252.0, 167.0, 95.0, 68.0, 39.0, 37.0, 28.0, 30.0, 15.0, 19.0, 16.0, 13.0, 9.0, 5.0, 3.0, 5.0, 3.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.10546875, -4.94012451171875, -4.7747802734375, -4.60943603515625, -4.444091796875, -4.27874755859375, -4.1134033203125, -3.94805908203125, -3.78271484375, -3.61737060546875, -3.4520263671875, -3.28668212890625, -3.121337890625, -2.95599365234375, -2.7906494140625, -2.62530517578125, -2.4599609375, -2.29461669921875, -2.1292724609375, -1.96392822265625, -1.798583984375, -1.63323974609375, -1.4678955078125, -1.30255126953125, -1.13720703125, -0.97186279296875, -0.8065185546875, -0.64117431640625, -0.475830078125, -0.31048583984375, -0.1451416015625, 0.02020263671875, 0.185546875, 0.35089111328125, 0.5162353515625, 0.68157958984375, 0.846923828125, 1.01226806640625, 1.1776123046875, 1.34295654296875, 1.50830078125, 1.67364501953125, 1.8389892578125, 2.00433349609375, 2.169677734375, 2.33502197265625, 2.5003662109375, 2.66571044921875, 2.8310546875, 2.99639892578125, 3.1617431640625, 3.32708740234375, 3.492431640625, 3.65777587890625, 3.8231201171875, 3.98846435546875, 4.15380859375, 4.31915283203125, 4.4844970703125, 4.64984130859375, 4.815185546875, 4.98052978515625, 5.1458740234375, 5.31121826171875, 5.4765625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 6.0, 4.0, 14.0, 14.0, 10.0, 16.0, 25.0, 22.0, 18.0, 28.0, 33.0, 38.0, 35.0, 29.0, 50.0, 50.0, 72.0, 176.0, 1561.0, 287.0, 87.0, 51.0, 53.0, 44.0, 41.0, 36.0, 21.0, 24.0, 31.0, 16.0, 29.0, 21.0, 15.0, 14.0, 13.0, 14.0, 15.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.328125, -19.666015625, -19.00390625, -18.341796875, -17.6796875, -17.017578125, -16.35546875, -15.693359375, -15.03125, -14.369140625, -13.70703125, -13.044921875, -12.3828125, -11.720703125, -11.05859375, -10.396484375, -9.734375, -9.072265625, -8.41015625, -7.748046875, -7.0859375, -6.423828125, -5.76171875, -5.099609375, -4.4375, -3.775390625, -3.11328125, -2.451171875, -1.7890625, -1.126953125, -0.46484375, 0.197265625, 0.859375, 1.521484375, 2.18359375, 2.845703125, 3.5078125, 4.169921875, 4.83203125, 5.494140625, 6.15625, 6.818359375, 7.48046875, 8.142578125, 8.8046875, 9.466796875, 10.12890625, 10.791015625, 11.453125, 12.115234375, 12.77734375, 13.439453125, 14.1015625, 14.763671875, 15.42578125, 16.087890625, 16.75, 17.412109375, 18.07421875, 18.736328125, 19.3984375, 20.060546875, 20.72265625, 21.384765625, 22.046875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 8.0, 8.0, 12.0, 14.0, 18.0, 29.0, 24.0, 33.0, 29.0, 55.0, 62.0, 74.0, 97.0, 121.0, 151.0, 227.0, 371.0, 610.0, 1595.0, 44790.0, 3042972.0, 50818.0, 1687.0, 632.0, 341.0, 228.0, 180.0, 120.0, 86.0, 54.0, 48.0, 51.0, 29.0, 29.0, 18.0, 10.0, 12.0, 12.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.16015625, -34.0078125, -32.85546875, -31.703125, -30.55078125, -29.3984375, -28.24609375, -27.09375, -25.94140625, -24.7890625, -23.63671875, -22.484375, -21.33203125, -20.1796875, -19.02734375, -17.875, -16.72265625, -15.5703125, -14.41796875, -13.265625, -12.11328125, -10.9609375, -9.80859375, -8.65625, -7.50390625, -6.3515625, -5.19921875, -4.046875, -2.89453125, -1.7421875, -0.58984375, 0.5625, 1.71484375, 2.8671875, 4.01953125, 5.171875, 6.32421875, 7.4765625, 8.62890625, 9.78125, 10.93359375, 12.0859375, 13.23828125, 14.390625, 15.54296875, 16.6953125, 17.84765625, 19.0, 20.15234375, 21.3046875, 22.45703125, 23.609375, 24.76171875, 25.9140625, 27.06640625, 28.21875, 29.37109375, 30.5234375, 31.67578125, 32.828125, 33.98046875, 35.1328125, 36.28515625, 37.4375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 29.0, 123.0, 348.0, 343.0, 125.0, 28.0, 13.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.078289031982422, -22.232301712036133, -20.386314392089844, -18.540327072143555, -16.694339752197266, -14.848352432250977, -13.002365112304688, -11.156377792358398, -9.31039047241211, -7.46440315246582, -5.618415832519531, -3.772428512573242, -1.9264411926269531, -0.08045387268066406, 1.765533447265625, 3.611520767211914, 5.457508087158203, 7.303495407104492, 9.149482727050781, 10.99547004699707, 12.84145736694336, 14.687444686889648, 16.533432006835938, 18.379419326782227, 20.225406646728516, 22.071393966674805, 23.917381286621094, 25.763368606567383, 27.609355926513672, 29.45534324645996, 31.30133056640625, 33.147315979003906, 34.99330139160156, 36.83928680419922, 38.68527603149414, 40.53126525878906, 42.37725067138672, 44.223236083984375, 46.0692253112793, 47.91521453857422, 49.761199951171875, 51.60718536376953, 53.45317459106445, 55.299163818359375, 57.14514923095703, 58.99113464355469, 60.83712387084961, 62.68311309814453, 64.52909851074219, 66.37508392333984, 68.2210693359375, 70.06706237792969, 71.91304779052734, 73.759033203125, 75.60502624511719, 77.45101165771484, 79.2969970703125, 81.14298248291016, 82.98896789550781, 84.8349609375, 86.68094635009766, 88.52693176269531, 90.3729248046875, 92.21891021728516, 94.06489562988281]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 1.0, 5.0, 4.0, 8.0, 10.0, 10.0, 9.0, 11.0, 10.0, 12.0, 26.0, 15.0, 18.0, 25.0, 22.0, 26.0, 42.0, 27.0, 41.0, 42.0, 40.0, 35.0, 44.0, 37.0, 53.0, 35.0, 40.0, 34.0, 37.0, 26.0, 34.0, 31.0, 23.0, 24.0, 16.0, 19.0, 21.0, 16.0, 13.0, 12.0, 11.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-51.13607406616211, -49.5098762512207, -47.8836784362793, -46.25748062133789, -44.631282806396484, -43.00508499145508, -41.37888717651367, -39.752689361572266, -38.12649154663086, -36.50029373168945, -34.87409591674805, -33.24789810180664, -31.621700286865234, -29.995502471923828, -28.369304656982422, -26.743106842041016, -25.11690902709961, -23.490711212158203, -21.864513397216797, -20.23831558227539, -18.612117767333984, -16.985919952392578, -15.359722137451172, -13.733524322509766, -12.10732650756836, -10.481128692626953, -8.854930877685547, -7.228733062744141, -5.602535247802734, -3.976337432861328, -2.350139617919922, -0.7239418029785156, 0.9022598266601562, 2.5284576416015625, 4.154655456542969, 5.780853271484375, 7.407051086425781, 9.033248901367188, 10.659446716308594, 12.28564453125, 13.911842346191406, 15.538040161132812, 17.16423797607422, 18.790435791015625, 20.41663360595703, 22.042831420898438, 23.669029235839844, 25.29522705078125, 26.921424865722656, 28.547622680664062, 30.17382049560547, 31.800018310546875, 33.42621612548828, 35.05241394042969, 36.678611755371094, 38.3048095703125, 39.931007385253906, 41.55720520019531, 43.18340301513672, 44.809600830078125, 46.43579864501953, 48.06199645996094, 49.688194274902344, 51.31439208984375, 52.940589904785156]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 7.0, 4.0, 1.0, 13.0, 8.0, 10.0, 13.0, 15.0, 17.0, 19.0, 14.0, 25.0, 25.0, 30.0, 26.0, 26.0, 38.0, 35.0, 43.0, 32.0, 42.0, 45.0, 41.0, 33.0, 36.0, 46.0, 33.0, 36.0, 37.0, 29.0, 32.0, 26.0, 19.0, 19.0, 27.0, 15.0, 18.0, 11.0, 12.0, 11.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.0191650390625, -5.800048828125, -5.5809326171875, -5.36181640625, -5.1427001953125, -4.923583984375, -4.7044677734375, -4.4853515625, -4.2662353515625, -4.047119140625, -3.8280029296875, -3.60888671875, -3.3897705078125, -3.170654296875, -2.9515380859375, -2.732421875, -2.5133056640625, -2.294189453125, -2.0750732421875, -1.85595703125, -1.6368408203125, -1.417724609375, -1.1986083984375, -0.9794921875, -0.7603759765625, -0.541259765625, -0.3221435546875, -0.10302734375, 0.1160888671875, 0.335205078125, 0.5543212890625, 0.7734375, 0.9925537109375, 1.211669921875, 1.4307861328125, 1.64990234375, 1.8690185546875, 2.088134765625, 2.3072509765625, 2.5263671875, 2.7454833984375, 2.964599609375, 3.1837158203125, 3.40283203125, 3.6219482421875, 3.841064453125, 4.0601806640625, 4.279296875, 4.4984130859375, 4.717529296875, 4.9366455078125, 5.15576171875, 5.3748779296875, 5.593994140625, 5.8131103515625, 6.0322265625, 6.2513427734375, 6.470458984375, 6.6895751953125, 6.90869140625, 7.1278076171875, 7.346923828125, 7.5660400390625, 7.78515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 6.0, 17.0, 16.0, 13.0, 21.0, 16.0, 30.0, 24.0, 45.0, 47.0, 51.0, 79.0, 112.0, 178.0, 382.0, 1490.0, 15290.0, 571202.0, 3377851.0, 217059.0, 8317.0, 1083.0, 292.0, 180.0, 96.0, 56.0, 63.0, 31.0, 33.0, 37.0, 22.0, 24.0, 18.0, 13.0, 9.0, 14.0, 11.0, 8.0, 5.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.203125, -21.49560546875, -20.7880859375, -20.08056640625, -19.373046875, -18.66552734375, -17.9580078125, -17.25048828125, -16.54296875, -15.83544921875, -15.1279296875, -14.42041015625, -13.712890625, -13.00537109375, -12.2978515625, -11.59033203125, -10.8828125, -10.17529296875, -9.4677734375, -8.76025390625, -8.052734375, -7.34521484375, -6.6376953125, -5.93017578125, -5.22265625, -4.51513671875, -3.8076171875, -3.10009765625, -2.392578125, -1.68505859375, -0.9775390625, -0.27001953125, 0.4375, 1.14501953125, 1.8525390625, 2.56005859375, 3.267578125, 3.97509765625, 4.6826171875, 5.39013671875, 6.09765625, 6.80517578125, 7.5126953125, 8.22021484375, 8.927734375, 9.63525390625, 10.3427734375, 11.05029296875, 11.7578125, 12.46533203125, 13.1728515625, 13.88037109375, 14.587890625, 15.29541015625, 16.0029296875, 16.71044921875, 17.41796875, 18.12548828125, 18.8330078125, 19.54052734375, 20.248046875, 20.95556640625, 21.6630859375, 22.37060546875, 23.078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 6.0, 4.0, 8.0, 6.0, 17.0, 19.0, 24.0, 25.0, 41.0, 58.0, 60.0, 92.0, 95.0, 135.0, 146.0, 236.0, 310.0, 363.0, 416.0, 431.0, 330.0, 289.0, 198.0, 146.0, 140.0, 96.0, 82.0, 72.0, 54.0, 39.0, 29.0, 26.0, 19.0, 13.0, 9.0, 8.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3587646484375, -9.022216796875, -8.6856689453125, -8.34912109375, -8.0125732421875, -7.676025390625, -7.3394775390625, -7.0029296875, -6.6663818359375, -6.329833984375, -5.9932861328125, -5.65673828125, -5.3201904296875, -4.983642578125, -4.6470947265625, -4.310546875, -3.9739990234375, -3.637451171875, -3.3009033203125, -2.96435546875, -2.6278076171875, -2.291259765625, -1.9547119140625, -1.6181640625, -1.2816162109375, -0.945068359375, -0.6085205078125, -0.27197265625, 0.0645751953125, 0.401123046875, 0.7376708984375, 1.07421875, 1.4107666015625, 1.747314453125, 2.0838623046875, 2.42041015625, 2.7569580078125, 3.093505859375, 3.4300537109375, 3.7666015625, 4.1031494140625, 4.439697265625, 4.7762451171875, 5.11279296875, 5.4493408203125, 5.785888671875, 6.1224365234375, 6.458984375, 6.7955322265625, 7.132080078125, 7.4686279296875, 7.80517578125, 8.1417236328125, 8.478271484375, 8.8148193359375, 9.1513671875, 9.4879150390625, 9.824462890625, 10.1610107421875, 10.49755859375, 10.8341064453125, 11.170654296875, 11.5072021484375, 11.84375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 7.0, 11.0, 9.0, 9.0, 17.0, 12.0, 29.0, 32.0, 58.0, 50.0, 71.0, 80.0, 107.0, 135.0, 230.0, 273.0, 366.0, 867.0, 11938.0, 4132243.0, 45128.0, 1049.0, 440.0, 280.0, 172.0, 136.0, 118.0, 85.0, 71.0, 56.0, 50.0, 34.0, 26.0, 30.0, 16.0, 15.0, 13.0, 11.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.625, -76.3525390625, -74.080078125, -71.8076171875, -69.53515625, -67.2626953125, -64.990234375, -62.7177734375, -60.4453125, -58.1728515625, -55.900390625, -53.6279296875, -51.35546875, -49.0830078125, -46.810546875, -44.5380859375, -42.265625, -39.9931640625, -37.720703125, -35.4482421875, -33.17578125, -30.9033203125, -28.630859375, -26.3583984375, -24.0859375, -21.8134765625, -19.541015625, -17.2685546875, -14.99609375, -12.7236328125, -10.451171875, -8.1787109375, -5.90625, -3.6337890625, -1.361328125, 0.9111328125, 3.18359375, 5.4560546875, 7.728515625, 10.0009765625, 12.2734375, 14.5458984375, 16.818359375, 19.0908203125, 21.36328125, 23.6357421875, 25.908203125, 28.1806640625, 30.453125, 32.7255859375, 34.998046875, 37.2705078125, 39.54296875, 41.8154296875, 44.087890625, 46.3603515625, 48.6328125, 50.9052734375, 53.177734375, 55.4501953125, 57.72265625, 59.9951171875, 62.267578125, 64.5400390625, 66.8125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 47.0, 296.0, 471.0, 181.0, 18.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-288.2147216796875, -282.9056701660156, -277.5966491699219, -272.28759765625, -266.9785461425781, -261.66949462890625, -256.3604736328125, -251.05142211914062, -245.74237060546875, -240.43333435058594, -235.12428283691406, -229.81524658203125, -224.50619506835938, -219.19715881347656, -213.8881072998047, -208.57907104492188, -203.27001953125, -197.9609832763672, -192.6519317626953, -187.3428955078125, -182.03384399414062, -176.7248077392578, -171.41575622558594, -166.10671997070312, -160.7976837158203, -155.4886474609375, -150.17959594726562, -144.8705596923828, -139.56150817871094, -134.25247192382812, -128.94342041015625, -123.63438415527344, -118.3253173828125, -113.01627349853516, -107.70722961425781, -102.39818572998047, -97.08914184570312, -91.78009796142578, -86.47105407714844, -81.16201782226562, -75.85297393798828, -70.54393005371094, -65.2348861694336, -59.92584228515625, -54.616798400878906, -49.30775451660156, -43.998714447021484, -38.68967056274414, -33.3806266784668, -28.071582794189453, -22.76253890991211, -17.4534969329834, -12.144453048706055, -6.835409164428711, -1.5263671875, 3.7826766967773438, 9.091720581054688, 14.400764465332031, 19.709808349609375, 25.018850326538086, 30.32789421081543, 35.636940002441406, 40.945980072021484, 46.25502395629883, 51.56406784057617]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 7.0, 2.0, 8.0, 16.0, 9.0, 14.0, 15.0, 22.0, 20.0, 13.0, 24.0, 18.0, 22.0, 33.0, 34.0, 32.0, 30.0, 28.0, 53.0, 42.0, 29.0, 35.0, 42.0, 37.0, 26.0, 40.0, 30.0, 27.0, 35.0, 32.0, 27.0, 27.0, 29.0, 24.0, 20.0, 21.0, 8.0, 13.0, 14.0, 6.0, 8.0, 3.0, 11.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.510982513427734, -35.232784271240234, -33.95458984375, -32.6763916015625, -31.398197174072266, -30.119998931884766, -28.8418025970459, -27.56360626220703, -26.285409927368164, -25.007213592529297, -23.72901725769043, -22.450820922851562, -21.172622680664062, -19.894428253173828, -18.616230010986328, -17.33803367614746, -16.059837341308594, -14.781641006469727, -13.50344467163086, -12.225247383117676, -10.947051048278809, -9.668854713439941, -8.390657424926758, -7.112461090087891, -5.834264755249023, -4.556068420410156, -3.277871608734131, -1.9996750354766846, -0.7214784622192383, 0.5567178726196289, 1.8349146842956543, 3.1131114959716797, 4.391304016113281, 5.669500350952148, 6.947697162628174, 8.2258939743042, 9.504090309143066, 10.782286643981934, 12.060483932495117, 13.338680267333984, 14.616876602172852, 15.895072937011719, 17.173269271850586, 18.451465606689453, 19.729663848876953, 21.007858276367188, 22.286056518554688, 23.564252853393555, 24.842449188232422, 26.12064552307129, 27.398841857910156, 28.677038192749023, 29.95523452758789, 31.23343276977539, 32.511627197265625, 33.789825439453125, 35.068023681640625, 36.346221923828125, 37.62441635131836, 38.90261459350586, 40.180809020996094, 41.459007263183594, 42.73720169067383, 44.01539993286133, 45.29359436035156]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 4.0, 18.0, 9.0, 21.0, 37.0, 56.0, 89.0, 137.0, 197.0, 273.0, 389.0, 508.0, 835.0, 1161.0, 1809.0, 2614.0, 3555.0, 5347.0, 7661.0, 11707.0, 17198.0, 26013.0, 40268.0, 62867.0, 101520.0, 166013.0, 219074.0, 138209.0, 84316.0, 53444.0, 34393.0, 22360.0, 14777.0, 10096.0, 6778.0, 4682.0, 3170.0, 2118.0, 1504.0, 1055.0, 713.0, 512.0, 333.0, 224.0, 178.0, 106.0, 71.0, 43.0, 30.0, 26.0, 19.0, 6.0, 11.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0478515625, -1.0154266357421875, -0.983001708984375, -0.9505767822265625, -0.91815185546875, -0.8857269287109375, -0.853302001953125, -0.8208770751953125, -0.7884521484375, -0.7560272216796875, -0.723602294921875, -0.6911773681640625, -0.65875244140625, -0.6263275146484375, -0.593902587890625, -0.5614776611328125, -0.529052734375, -0.4966278076171875, -0.464202880859375, -0.4317779541015625, -0.39935302734375, -0.3669281005859375, -0.334503173828125, -0.3020782470703125, -0.2696533203125, -0.2372283935546875, -0.204803466796875, -0.1723785400390625, -0.13995361328125, -0.1075286865234375, -0.075103759765625, -0.0426788330078125, -0.01025390625, 0.0221710205078125, 0.054595947265625, 0.0870208740234375, 0.11944580078125, 0.1518707275390625, 0.184295654296875, 0.2167205810546875, 0.2491455078125, 0.2815704345703125, 0.313995361328125, 0.3464202880859375, 0.37884521484375, 0.4112701416015625, 0.443695068359375, 0.4761199951171875, 0.508544921875, 0.5409698486328125, 0.573394775390625, 0.6058197021484375, 0.63824462890625, 0.6706695556640625, 0.703094482421875, 0.7355194091796875, 0.7679443359375, 0.8003692626953125, 0.832794189453125, 0.8652191162109375, 0.89764404296875, 0.9300689697265625, 0.962493896484375, 0.9949188232421875, 1.02734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 10.0, 14.0, 15.0, 12.0, 25.0, 19.0, 33.0, 17.0, 31.0, 36.0, 29.0, 40.0, 38.0, 37.0, 36.0, 44.0, 1061.0, 44.0, 40.0, 51.0, 44.0, 43.0, 33.0, 29.0, 31.0, 29.0, 28.0, 27.0, 18.0, 26.0, 17.0, 9.0, 14.0, 10.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.5655517578125, -4.416259765625, -4.2669677734375, -4.11767578125, -3.9683837890625, -3.819091796875, -3.6697998046875, -3.5205078125, -3.3712158203125, -3.221923828125, -3.0726318359375, -2.92333984375, -2.7740478515625, -2.624755859375, -2.4754638671875, -2.326171875, -2.1768798828125, -2.027587890625, -1.8782958984375, -1.72900390625, -1.5797119140625, -1.430419921875, -1.2811279296875, -1.1318359375, -0.9825439453125, -0.833251953125, -0.6839599609375, -0.53466796875, -0.3853759765625, -0.236083984375, -0.0867919921875, 0.0625, 0.2117919921875, 0.361083984375, 0.5103759765625, 0.65966796875, 0.8089599609375, 0.958251953125, 1.1075439453125, 1.2568359375, 1.4061279296875, 1.555419921875, 1.7047119140625, 1.85400390625, 2.0032958984375, 2.152587890625, 2.3018798828125, 2.451171875, 2.6004638671875, 2.749755859375, 2.8990478515625, 3.04833984375, 3.1976318359375, 3.346923828125, 3.4962158203125, 3.6455078125, 3.7947998046875, 3.944091796875, 4.0933837890625, 4.24267578125, 4.3919677734375, 4.541259765625, 4.6905517578125, 4.83984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 8.0, 11.0, 18.0, 29.0, 45.0, 64.0, 91.0, 156.0, 195.0, 304.0, 455.0, 685.0, 1131.0, 1801.0, 2766.0, 4228.0, 6660.0, 10720.0, 16682.0, 27192.0, 44273.0, 74358.0, 129473.0, 1284186.0, 205998.0, 113577.0, 66363.0, 39350.0, 24453.0, 15231.0, 9548.0, 6178.0, 3904.0, 2426.0, 1568.0, 1044.0, 685.0, 423.0, 292.0, 167.0, 142.0, 88.0, 52.0, 38.0, 28.0, 12.0, 14.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.063232421875, -1.02880859375, -0.994384765625, -0.9599609375, -0.925537109375, -0.89111328125, -0.856689453125, -0.822265625, -0.787841796875, -0.75341796875, -0.718994140625, -0.6845703125, -0.650146484375, -0.61572265625, -0.581298828125, -0.546875, -0.512451171875, -0.47802734375, -0.443603515625, -0.4091796875, -0.374755859375, -0.34033203125, -0.305908203125, -0.271484375, -0.237060546875, -0.20263671875, -0.168212890625, -0.1337890625, -0.099365234375, -0.06494140625, -0.030517578125, 0.00390625, 0.038330078125, 0.07275390625, 0.107177734375, 0.1416015625, 0.176025390625, 0.21044921875, 0.244873046875, 0.279296875, 0.313720703125, 0.34814453125, 0.382568359375, 0.4169921875, 0.451416015625, 0.48583984375, 0.520263671875, 0.5546875, 0.589111328125, 0.62353515625, 0.657958984375, 0.6923828125, 0.726806640625, 0.76123046875, 0.795654296875, 0.830078125, 0.864501953125, 0.89892578125, 0.933349609375, 0.9677734375, 1.002197265625, 1.03662109375, 1.071044921875, 1.10546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 8.0, 5.0, 8.0, 16.0, 13.0, 16.0, 35.0, 40.0, 40.0, 56.0, 62.0, 69.0, 97.0, 102.0, 69.0, 75.0, 63.0, 50.0, 42.0, 25.0, 20.0, 16.0, 9.0, 17.0, 5.0, 6.0, 7.0, 8.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009007453918457031, -0.0008743852376937866, -0.0008480250835418701, -0.0008216649293899536, -0.0007953047752380371, -0.0007689446210861206, -0.0007425844669342041, -0.0007162243127822876, -0.0006898641586303711, -0.0006635040044784546, -0.0006371438503265381, -0.0006107836961746216, -0.0005844235420227051, -0.0005580633878707886, -0.0005317032337188721, -0.0005053430795669556, -0.00047898292541503906, -0.00045262277126312256, -0.00042626261711120605, -0.00039990246295928955, -0.00037354230880737305, -0.00034718215465545654, -0.00032082200050354004, -0.00029446184635162354, -0.00026810169219970703, -0.00024174153804779053, -0.00021538138389587402, -0.00018902122974395752, -0.00016266107559204102, -0.0001363009214401245, -0.00010994076728820801, -8.35806131362915e-05, -5.7220458984375e-05, -3.0860304832458496e-05, -4.500150680541992e-06, 2.1860003471374512e-05, 4.8220157623291016e-05, 7.458031177520752e-05, 0.00010094046592712402, 0.00012730062007904053, 0.00015366077423095703, 0.00018002092838287354, 0.00020638108253479004, 0.00023274123668670654, 0.00025910139083862305, 0.00028546154499053955, 0.00031182169914245605, 0.00033818185329437256, 0.00036454200744628906, 0.00039090216159820557, 0.00041726231575012207, 0.0004436224699020386, 0.0004699826240539551, 0.0004963427782058716, 0.0005227029323577881, 0.0005490630865097046, 0.0005754232406616211, 0.0006017833948135376, 0.0006281435489654541, 0.0006545037031173706, 0.0006808638572692871, 0.0007072240114212036, 0.0007335841655731201, 0.0007599443197250366, 0.0007863044738769531]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 9.0, 13.0, 9.0, 15.0, 23.0, 27.0, 36.0, 55.0, 76.0, 153.0, 243.0, 423.0, 1709.0, 1037379.0, 6986.0, 645.0, 266.0, 151.0, 98.0, 57.0, 39.0, 40.0, 20.0, 15.0, 13.0, 8.0, 7.0, 4.0, 7.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.017974853515625, -0.017368793487548828, -0.016762733459472656, -0.016156673431396484, -0.015550613403320312, -0.01494455337524414, -0.014338493347167969, -0.013732433319091797, -0.013126373291015625, -0.012520313262939453, -0.011914253234863281, -0.01130819320678711, -0.010702133178710938, -0.010096073150634766, -0.009490013122558594, -0.008883953094482422, -0.00827789306640625, -0.007671833038330078, -0.007065773010253906, -0.006459712982177734, -0.0058536529541015625, -0.005247592926025391, -0.004641532897949219, -0.004035472869873047, -0.003429412841796875, -0.002823352813720703, -0.0022172927856445312, -0.0016112327575683594, -0.0010051727294921875, -0.0003991127014160156, 0.00020694732666015625, 0.0008130073547363281, 0.0014190673828125, 0.002025127410888672, 0.0026311874389648438, 0.0032372474670410156, 0.0038433074951171875, 0.004449367523193359, 0.005055427551269531, 0.005661487579345703, 0.006267547607421875, 0.006873607635498047, 0.007479667663574219, 0.00808572769165039, 0.008691787719726562, 0.009297847747802734, 0.009903907775878906, 0.010509967803955078, 0.01111602783203125, 0.011722087860107422, 0.012328147888183594, 0.012934207916259766, 0.013540267944335938, 0.01414632797241211, 0.014752388000488281, 0.015358448028564453, 0.015964508056640625, 0.016570568084716797, 0.01717662811279297, 0.01778268814086914, 0.018388748168945312, 0.018994808197021484, 0.019600868225097656, 0.020206928253173828, 0.02081298828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 13.0, 31.0, 175.0, 306.0, 311.0, 135.0, 35.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016441349871456623, -0.0016124630346894264, -0.0015807910822331905, -0.0015491191297769547, -0.0015174472937360406, -0.0014857753412798047, -0.0014541033888235688, -0.001422431436367333, -0.001390759483911097, -0.0013590875314548612, -0.0013274155789986253, -0.0012957437429577112, -0.0012640717905014753, -0.0012323998380452394, -0.0012007278855890036, -0.0011690559331327677, -0.0011373839806765318, -0.001105712028220296, -0.00107404007576406, -0.0010423681233078241, -0.00101069628726691, -0.0009790243348106742, -0.0009473523823544383, -0.0009156804298982024, -0.0008840085938572884, -0.0008523366414010525, -0.0008206647471524775, -0.0007889927946962416, -0.0007573208422400057, -0.0007256489479914308, -0.0006939769955351949, -0.000662305043078959, -0.000630633148830384, -0.0005989611963741481, -0.0005672893021255732, -0.0005356173496693373, -0.0005039453972131014, -0.00047227347386069596, -0.00044060155050829053, -0.00040892959805205464, -0.0003772576746996492, -0.0003455857513472438, -0.0003139137988910079, -0.00028224187553860247, -0.00025056995218619704, -0.00021889799972996116, -0.00018722607637755573, -0.00015555413847323507, -0.0001238822005689144, -9.221026266459376e-05, -6.053833203623071e-05, -2.886640140786767e-05, 2.805536496452987e-06, 3.4477474400773644e-05, 6.614939775317907e-05, 9.782133565749973e-05, 0.0001294932735618204, 0.00016116521146614105, 0.0001928371493704617, 0.00022450907272286713, 0.00025618099607527256, 0.00028785294853150845, 0.0003195248718839139, 0.0003511967952363193, 0.0003828687476925552]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 7.0, 3.0, 7.0, 9.0, 10.0, 16.0, 8.0, 15.0, 15.0, 26.0, 21.0, 19.0, 28.0, 36.0, 28.0, 33.0, 26.0, 30.0, 38.0, 34.0, 31.0, 51.0, 38.0, 43.0, 37.0, 42.0, 30.0, 38.0, 42.0, 37.0, 31.0, 22.0, 23.0, 20.0, 13.0, 11.0, 21.0, 14.0, 10.0, 8.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003153681755065918, -0.00030407775193452835, -0.0002927873283624649, -0.00028149690479040146, -0.000270206481218338, -0.00025891605764627457, -0.0002476256340742111, -0.00023633521050214767, -0.00022504478693008423, -0.00021375436335802078, -0.00020246393978595734, -0.0001911735162138939, -0.00017988309264183044, -0.000168592669069767, -0.00015730224549770355, -0.0001460118219256401, -0.00013472139835357666, -0.00012343097478151321, -0.00011214055120944977, -0.00010085012763738632, -8.955970406532288e-05, -7.826928049325943e-05, -6.697885692119598e-05, -5.568843334913254e-05, -4.439800977706909e-05, -3.3107586205005646e-05, -2.18171626329422e-05, -1.0526739060878754e-05, 7.636845111846924e-07, 1.2054108083248138e-05, 2.3344531655311584e-05, 3.463495522737503e-05, 4.5925378799438477e-05, 5.721580237150192e-05, 6.850622594356537e-05, 7.979664951562881e-05, 9.108707308769226e-05, 0.00010237749665975571, 0.00011366792023181915, 0.0001249583438038826, 0.00013624876737594604, 0.0001475391909480095, 0.00015882961452007294, 0.00017012003809213638, 0.00018141046166419983, 0.00019270088523626328, 0.00020399130880832672, 0.00021528173238039017, 0.0002265721559524536, 0.00023786257952451706, 0.0002491530030965805, 0.00026044342666864395, 0.0002717338502407074, 0.00028302427381277084, 0.0002943146973848343, 0.00030560512095689774, 0.0003168955445289612, 0.00032818596810102463, 0.0003394763916730881, 0.0003507668152451515, 0.00036205723881721497, 0.0003733476623892784, 0.00038463808596134186, 0.0003959285095334053, 0.00040721893310546875]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 8.0, 9.0, 7.0, 18.0, 4.0, 21.0, 18.0, 23.0, 18.0, 23.0, 31.0, 32.0, 39.0, 33.0, 44.0, 29.0, 30.0, 36.0, 41.0, 58.0, 33.0, 43.0, 39.0, 35.0, 39.0, 38.0, 37.0, 28.0, 25.0, 24.0, 20.0, 17.0, 16.0, 17.0, 10.0, 14.0, 8.0, 9.0, 8.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.22265625, -6.9989013671875, -6.775146484375, -6.5513916015625, -6.32763671875, -6.1038818359375, -5.880126953125, -5.6563720703125, -5.4326171875, -5.2088623046875, -4.985107421875, -4.7613525390625, -4.53759765625, -4.3138427734375, -4.090087890625, -3.8663330078125, -3.642578125, -3.4188232421875, -3.195068359375, -2.9713134765625, -2.74755859375, -2.5238037109375, -2.300048828125, -2.0762939453125, -1.8525390625, -1.6287841796875, -1.405029296875, -1.1812744140625, -0.95751953125, -0.7337646484375, -0.510009765625, -0.2862548828125, -0.0625, 0.1612548828125, 0.385009765625, 0.6087646484375, 0.83251953125, 1.0562744140625, 1.280029296875, 1.5037841796875, 1.7275390625, 1.9512939453125, 2.175048828125, 2.3988037109375, 2.62255859375, 2.8463134765625, 3.070068359375, 3.2938232421875, 3.517578125, 3.7413330078125, 3.965087890625, 4.1888427734375, 4.41259765625, 4.6363525390625, 4.860107421875, 5.0838623046875, 5.3076171875, 5.5313720703125, 5.755126953125, 5.9788818359375, 6.20263671875, 6.4263916015625, 6.650146484375, 6.8739013671875, 7.09765625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 5.0, 11.0, 10.0, 12.0, 13.0, 20.0, 33.0, 39.0, 43.0, 56.0, 72.0, 105.0, 171.0, 221.0, 362.0, 633.0, 1956.0, 11205.0, 94921.0, 766244.0, 151262.0, 16517.0, 2624.0, 753.0, 382.0, 242.0, 183.0, 115.0, 72.0, 63.0, 41.0, 31.0, 30.0, 28.0, 13.0, 17.0, 11.0, 8.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.9036865234375, -13.463623046875, -13.0235595703125, -12.58349609375, -12.1434326171875, -11.703369140625, -11.2633056640625, -10.8232421875, -10.3831787109375, -9.943115234375, -9.5030517578125, -9.06298828125, -8.6229248046875, -8.182861328125, -7.7427978515625, -7.302734375, -6.8626708984375, -6.422607421875, -5.9825439453125, -5.54248046875, -5.1024169921875, -4.662353515625, -4.2222900390625, -3.7822265625, -3.3421630859375, -2.902099609375, -2.4620361328125, -2.02197265625, -1.5819091796875, -1.141845703125, -0.7017822265625, -0.26171875, 0.1783447265625, 0.618408203125, 1.0584716796875, 1.49853515625, 1.9385986328125, 2.378662109375, 2.8187255859375, 3.2587890625, 3.6988525390625, 4.138916015625, 4.5789794921875, 5.01904296875, 5.4591064453125, 5.899169921875, 6.3392333984375, 6.779296875, 7.2193603515625, 7.659423828125, 8.0994873046875, 8.53955078125, 8.9796142578125, 9.419677734375, 9.8597412109375, 10.2998046875, 10.7398681640625, 11.179931640625, 11.6199951171875, 12.06005859375, 12.5001220703125, 12.940185546875, 13.3802490234375, 13.8203125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 7.0, 12.0, 6.0, 10.0, 12.0, 10.0, 23.0, 21.0, 25.0, 22.0, 34.0, 32.0, 41.0, 36.0, 48.0, 56.0, 74.0, 247.0, 1677.0, 178.0, 57.0, 51.0, 43.0, 36.0, 42.0, 24.0, 35.0, 33.0, 18.0, 14.0, 17.0, 22.0, 16.0, 11.0, 5.0, 14.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.484375, -22.781005859375, -22.07763671875, -21.374267578125, -20.6708984375, -19.967529296875, -19.26416015625, -18.560791015625, -17.857421875, -17.154052734375, -16.45068359375, -15.747314453125, -15.0439453125, -14.340576171875, -13.63720703125, -12.933837890625, -12.23046875, -11.527099609375, -10.82373046875, -10.120361328125, -9.4169921875, -8.713623046875, -8.01025390625, -7.306884765625, -6.603515625, -5.900146484375, -5.19677734375, -4.493408203125, -3.7900390625, -3.086669921875, -2.38330078125, -1.679931640625, -0.9765625, -0.273193359375, 0.43017578125, 1.133544921875, 1.8369140625, 2.540283203125, 3.24365234375, 3.947021484375, 4.650390625, 5.353759765625, 6.05712890625, 6.760498046875, 7.4638671875, 8.167236328125, 8.87060546875, 9.573974609375, 10.27734375, 10.980712890625, 11.68408203125, 12.387451171875, 13.0908203125, 13.794189453125, 14.49755859375, 15.200927734375, 15.904296875, 16.607666015625, 17.31103515625, 18.014404296875, 18.7177734375, 19.421142578125, 20.12451171875, 20.827880859375, 21.53125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 3.0, 11.0, 12.0, 12.0, 16.0, 23.0, 18.0, 17.0, 23.0, 42.0, 40.0, 53.0, 86.0, 88.0, 168.0, 288.0, 557.0, 2357.0, 801157.0, 2336245.0, 2886.0, 636.0, 321.0, 173.0, 103.0, 72.0, 62.0, 42.0, 29.0, 30.0, 29.0, 17.0, 13.0, 15.0, 9.0, 8.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.9375, -48.32861328125, -46.7197265625, -45.11083984375, -43.501953125, -41.89306640625, -40.2841796875, -38.67529296875, -37.06640625, -35.45751953125, -33.8486328125, -32.23974609375, -30.630859375, -29.02197265625, -27.4130859375, -25.80419921875, -24.1953125, -22.58642578125, -20.9775390625, -19.36865234375, -17.759765625, -16.15087890625, -14.5419921875, -12.93310546875, -11.32421875, -9.71533203125, -8.1064453125, -6.49755859375, -4.888671875, -3.27978515625, -1.6708984375, -0.06201171875, 1.546875, 3.15576171875, 4.7646484375, 6.37353515625, 7.982421875, 9.59130859375, 11.2001953125, 12.80908203125, 14.41796875, 16.02685546875, 17.6357421875, 19.24462890625, 20.853515625, 22.46240234375, 24.0712890625, 25.68017578125, 27.2890625, 28.89794921875, 30.5068359375, 32.11572265625, 33.724609375, 35.33349609375, 36.9423828125, 38.55126953125, 40.16015625, 41.76904296875, 43.3779296875, 44.98681640625, 46.595703125, 48.20458984375, 49.8134765625, 51.42236328125, 53.03125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 13.0, 792.0, 206.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.23040008544922, -15.555150985717773, -9.879901885986328, -4.204652786254883, 1.4705963134765625, 7.145845413208008, 12.821094512939453, 18.49634552001953, 24.171592712402344, 29.84684181213379, 35.522090911865234, 41.19734191894531, 46.872589111328125, 52.54783630371094, 58.223087310791016, 63.898338317871094, 69.5735855102539, 75.24883270263672, 80.92408752441406, 86.59933471679688, 92.27458190917969, 97.9498291015625, 103.62507629394531, 109.30033111572266, 114.97557830810547, 120.65082550048828, 126.32608032226562, 132.00132751464844, 137.67657470703125, 143.35182189941406, 149.02706909179688, 154.70233154296875, 160.3775634765625, 166.0528106689453, 171.72805786132812, 177.40330505371094, 183.07855224609375, 188.75381469726562, 194.42906188964844, 200.10430908203125, 205.77955627441406, 211.45480346679688, 217.1300506591797, 222.8052978515625, 228.48056030273438, 234.1558074951172, 239.8310546875, 245.5063018798828, 251.18154907226562, 256.8568115234375, 262.53204345703125, 268.2073059082031, 273.8825378417969, 279.55780029296875, 285.2330322265625, 290.9082946777344, 296.58355712890625, 302.2588195800781, 307.9340515136719, 313.60931396484375, 319.2845458984375, 324.9598083496094, 330.6350402832031, 336.310302734375, 341.98553466796875]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 4.0, 5.0, 11.0, 11.0, 13.0, 13.0, 13.0, 21.0, 26.0, 21.0, 28.0, 30.0, 32.0, 34.0, 51.0, 40.0, 36.0, 38.0, 49.0, 37.0, 44.0, 41.0, 34.0, 38.0, 41.0, 33.0, 30.0, 27.0, 22.0, 22.0, 31.0, 14.0, 12.0, 15.0, 16.0, 8.0, 9.0, 8.0, 12.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0], "bins": [-56.44456481933594, -54.778480529785156, -53.11240005493164, -51.446319580078125, -49.780235290527344, -48.11415100097656, -46.44807052612305, -44.78199005126953, -43.11590576171875, -41.44982147216797, -39.78374099731445, -38.11766052246094, -36.451576232910156, -34.785491943359375, -33.11941146850586, -31.45332908630371, -29.787246704101562, -28.121164321899414, -26.455081939697266, -24.788999557495117, -23.12291717529297, -21.45683479309082, -19.790752410888672, -18.124670028686523, -16.458587646484375, -14.792505264282227, -13.126422882080078, -11.46034049987793, -9.794258117675781, -8.128175735473633, -6.462093353271484, -4.796010971069336, -3.129932403564453, -1.4638500213623047, 0.20223236083984375, 1.8683147430419922, 3.5343971252441406, 5.200479507446289, 6.8665618896484375, 8.532644271850586, 10.198726654052734, 11.864809036254883, 13.530891418457031, 15.19697380065918, 16.863056182861328, 18.529138565063477, 20.195220947265625, 21.861303329467773, 23.527385711669922, 25.19346809387207, 26.85955047607422, 28.525632858276367, 30.191715240478516, 31.857797622680664, 33.52388000488281, 35.189964294433594, 36.85604476928711, 38.522125244140625, 40.188209533691406, 41.85429382324219, 43.5203742980957, 45.18645477294922, 46.8525390625, 48.51862335205078, 50.1847038269043]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 5.0, 10.0, 14.0, 5.0, 17.0, 11.0, 26.0, 19.0, 30.0, 23.0, 37.0, 38.0, 36.0, 26.0, 33.0, 40.0, 41.0, 39.0, 44.0, 46.0, 35.0, 33.0, 38.0, 39.0, 44.0, 37.0, 31.0, 20.0, 25.0, 33.0, 21.0, 17.0, 14.0, 12.0, 9.0, 10.0, 9.0, 5.0, 4.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.2734375, -7.04437255859375, -6.8153076171875, -6.58624267578125, -6.357177734375, -6.12811279296875, -5.8990478515625, -5.66998291015625, -5.44091796875, -5.21185302734375, -4.9827880859375, -4.75372314453125, -4.524658203125, -4.29559326171875, -4.0665283203125, -3.83746337890625, -3.6083984375, -3.37933349609375, -3.1502685546875, -2.92120361328125, -2.692138671875, -2.46307373046875, -2.2340087890625, -2.00494384765625, -1.77587890625, -1.54681396484375, -1.3177490234375, -1.08868408203125, -0.859619140625, -0.63055419921875, -0.4014892578125, -0.17242431640625, 0.056640625, 0.28570556640625, 0.5147705078125, 0.74383544921875, 0.972900390625, 1.20196533203125, 1.4310302734375, 1.66009521484375, 1.88916015625, 2.11822509765625, 2.3472900390625, 2.57635498046875, 2.805419921875, 3.03448486328125, 3.2635498046875, 3.49261474609375, 3.7216796875, 3.95074462890625, 4.1798095703125, 4.40887451171875, 4.637939453125, 4.86700439453125, 5.0960693359375, 5.32513427734375, 5.55419921875, 5.78326416015625, 6.0123291015625, 6.24139404296875, 6.470458984375, 6.69952392578125, 6.9285888671875, 7.15765380859375, 7.38671875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 8.0, 2.0, 8.0, 3.0, 14.0, 14.0, 25.0, 13.0, 24.0, 37.0, 45.0, 51.0, 79.0, 115.0, 257.0, 493.0, 1388.0, 7257.0, 99731.0, 2508775.0, 1521832.0, 47588.0, 4475.0, 1061.0, 371.0, 189.0, 98.0, 79.0, 65.0, 37.0, 31.0, 23.0, 25.0, 16.0, 13.0, 11.0, 5.0, 5.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.03125, -22.3515625, -21.671875, -20.9921875, -20.3125, -19.6328125, -18.953125, -18.2734375, -17.59375, -16.9140625, -16.234375, -15.5546875, -14.875, -14.1953125, -13.515625, -12.8359375, -12.15625, -11.4765625, -10.796875, -10.1171875, -9.4375, -8.7578125, -8.078125, -7.3984375, -6.71875, -6.0390625, -5.359375, -4.6796875, -4.0, -3.3203125, -2.640625, -1.9609375, -1.28125, -0.6015625, 0.078125, 0.7578125, 1.4375, 2.1171875, 2.796875, 3.4765625, 4.15625, 4.8359375, 5.515625, 6.1953125, 6.875, 7.5546875, 8.234375, 8.9140625, 9.59375, 10.2734375, 10.953125, 11.6328125, 12.3125, 12.9921875, 13.671875, 14.3515625, 15.03125, 15.7109375, 16.390625, 17.0703125, 17.75, 18.4296875, 19.109375, 19.7890625, 20.46875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 11.0, 14.0, 17.0, 16.0, 23.0, 39.0, 47.0, 53.0, 86.0, 76.0, 114.0, 146.0, 188.0, 252.0, 330.0, 402.0, 374.0, 345.0, 338.0, 262.0, 192.0, 151.0, 127.0, 110.0, 69.0, 59.0, 41.0, 37.0, 24.0, 21.0, 21.0, 12.0, 16.0, 5.0, 4.0, 8.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6171875, -9.292724609375, -8.96826171875, -8.643798828125, -8.3193359375, -7.994873046875, -7.67041015625, -7.345947265625, -7.021484375, -6.697021484375, -6.37255859375, -6.048095703125, -5.7236328125, -5.399169921875, -5.07470703125, -4.750244140625, -4.42578125, -4.101318359375, -3.77685546875, -3.452392578125, -3.1279296875, -2.803466796875, -2.47900390625, -2.154541015625, -1.830078125, -1.505615234375, -1.18115234375, -0.856689453125, -0.5322265625, -0.207763671875, 0.11669921875, 0.441162109375, 0.765625, 1.090087890625, 1.41455078125, 1.739013671875, 2.0634765625, 2.387939453125, 2.71240234375, 3.036865234375, 3.361328125, 3.685791015625, 4.01025390625, 4.334716796875, 4.6591796875, 4.983642578125, 5.30810546875, 5.632568359375, 5.95703125, 6.281494140625, 6.60595703125, 6.930419921875, 7.2548828125, 7.579345703125, 7.90380859375, 8.228271484375, 8.552734375, 8.877197265625, 9.20166015625, 9.526123046875, 9.8505859375, 10.175048828125, 10.49951171875, 10.823974609375, 11.1484375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 9.0, 16.0, 21.0, 22.0, 38.0, 46.0, 52.0, 72.0, 92.0, 120.0, 161.0, 297.0, 517.0, 1835.0, 298296.0, 3885713.0, 5136.0, 680.0, 360.0, 218.0, 154.0, 93.0, 81.0, 50.0, 43.0, 31.0, 38.0, 20.0, 14.0, 10.0, 10.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.625, -66.3505859375, -64.076171875, -61.8017578125, -59.52734375, -57.2529296875, -54.978515625, -52.7041015625, -50.4296875, -48.1552734375, -45.880859375, -43.6064453125, -41.33203125, -39.0576171875, -36.783203125, -34.5087890625, -32.234375, -29.9599609375, -27.685546875, -25.4111328125, -23.13671875, -20.8623046875, -18.587890625, -16.3134765625, -14.0390625, -11.7646484375, -9.490234375, -7.2158203125, -4.94140625, -2.6669921875, -0.392578125, 1.8818359375, 4.15625, 6.4306640625, 8.705078125, 10.9794921875, 13.25390625, 15.5283203125, 17.802734375, 20.0771484375, 22.3515625, 24.6259765625, 26.900390625, 29.1748046875, 31.44921875, 33.7236328125, 35.998046875, 38.2724609375, 40.546875, 42.8212890625, 45.095703125, 47.3701171875, 49.64453125, 51.9189453125, 54.193359375, 56.4677734375, 58.7421875, 61.0166015625, 63.291015625, 65.5654296875, 67.83984375, 70.1142578125, 72.388671875, 74.6630859375, 76.9375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 19.0, 49.0, 118.0, 135.0, 177.0, 173.0, 136.0, 86.0, 58.0, 29.0, 20.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.96239471435547, -64.2294692993164, -62.49654006958008, -60.763614654541016, -59.03068542480469, -57.297760009765625, -55.56483459472656, -53.831905364990234, -52.098976135253906, -50.366050720214844, -48.633121490478516, -46.90019607543945, -45.167266845703125, -43.43434143066406, -41.701416015625, -39.96848678588867, -38.23556137084961, -36.50263595581055, -34.76970672607422, -33.036781311035156, -31.303852081298828, -29.570926666259766, -27.83799934387207, -26.105072021484375, -24.37214469909668, -22.639217376708984, -20.90629005432129, -19.173362731933594, -17.44043731689453, -15.70750904083252, -13.97458267211914, -12.241655349731445, -10.508731842041016, -8.77580451965332, -7.042877674102783, -5.309950828552246, -3.577023506164551, -1.8440961837768555, -0.11116981506347656, 1.6217575073242188, 3.354684829711914, 5.087612152099609, 6.8205389976501465, 8.553465843200684, 10.286393165588379, 12.019320487976074, 13.752246856689453, 15.485174179077148, 17.218101501464844, 18.95102882385254, 20.683956146240234, 22.416881561279297, 24.149810791015625, 25.882736206054688, 27.615663528442383, 29.348590850830078, 31.081518173217773, 32.81444549560547, 34.54737091064453, 36.28030014038086, 38.01322555541992, 39.74615478515625, 41.47908020019531, 43.212005615234375, 44.9449348449707]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 9.0, 10.0, 22.0, 21.0, 26.0, 32.0, 31.0, 31.0, 33.0, 37.0, 36.0, 41.0, 42.0, 45.0, 44.0, 40.0, 45.0, 42.0, 48.0, 51.0, 27.0, 41.0, 32.0, 29.0, 24.0, 23.0, 25.0, 17.0, 18.0, 11.0, 9.0, 9.0, 9.0, 6.0, 8.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.00720977783203, -34.65553665161133, -33.30386734008789, -31.952194213867188, -30.600522994995117, -29.248851776123047, -27.897178649902344, -26.545507431030273, -25.193836212158203, -23.842164993286133, -22.490493774414062, -21.13882064819336, -19.78714942932129, -18.43547821044922, -17.083805084228516, -15.732133865356445, -14.380462646484375, -13.028791427612305, -11.677119255065918, -10.325447082519531, -8.973775863647461, -7.622104167938232, -6.270432472229004, -4.918760299682617, -3.567089080810547, -2.2154173851013184, -0.8637456893920898, 0.48792600631713867, 1.8395977020263672, 3.1912693977355957, 4.542941093444824, 5.894613265991211, 7.246284484863281, 8.597955703735352, 9.949627876281738, 11.301300048828125, 12.652971267700195, 14.004642486572266, 15.356314659118652, 16.70798683166504, 18.05965805053711, 19.41132926940918, 20.76300048828125, 22.114673614501953, 23.466344833374023, 24.818016052246094, 26.169689178466797, 27.521360397338867, 28.873031616210938, 30.224702835083008, 31.576374053955078, 32.92804718017578, 34.27971649169922, 35.63138961791992, 36.983062744140625, 38.33473205566406, 39.686405181884766, 41.03807830810547, 42.389747619628906, 43.74142074584961, 45.09309387207031, 46.44476318359375, 47.79643630981445, 49.148109436035156, 50.499778747558594]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 10.0, 11.0, 24.0, 32.0, 50.0, 72.0, 115.0, 204.0, 267.0, 425.0, 693.0, 1047.0, 1715.0, 2774.0, 4702.0, 7510.0, 12860.0, 22268.0, 39603.0, 71632.0, 134059.0, 263851.0, 223538.0, 115850.0, 62138.0, 34519.0, 19674.0, 11494.0, 6704.0, 4149.0, 2420.0, 1510.0, 966.0, 608.0, 369.0, 248.0, 121.0, 110.0, 57.0, 43.0, 33.0, 22.0, 18.0, 8.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.3505859375, -1.306854248046875, -1.26312255859375, -1.219390869140625, -1.1756591796875, -1.131927490234375, -1.08819580078125, -1.044464111328125, -1.000732421875, -0.957000732421875, -0.91326904296875, -0.869537353515625, -0.8258056640625, -0.782073974609375, -0.73834228515625, -0.694610595703125, -0.65087890625, -0.607147216796875, -0.56341552734375, -0.519683837890625, -0.4759521484375, -0.432220458984375, -0.38848876953125, -0.344757080078125, -0.301025390625, -0.257293701171875, -0.21356201171875, -0.169830322265625, -0.1260986328125, -0.082366943359375, -0.03863525390625, 0.005096435546875, 0.048828125, 0.092559814453125, 0.13629150390625, 0.180023193359375, 0.2237548828125, 0.267486572265625, 0.31121826171875, 0.354949951171875, 0.398681640625, 0.442413330078125, 0.48614501953125, 0.529876708984375, 0.5736083984375, 0.617340087890625, 0.66107177734375, 0.704803466796875, 0.74853515625, 0.792266845703125, 0.83599853515625, 0.879730224609375, 0.9234619140625, 0.967193603515625, 1.01092529296875, 1.054656982421875, 1.098388671875, 1.142120361328125, 1.18585205078125, 1.229583740234375, 1.2733154296875, 1.317047119140625, 1.36077880859375, 1.404510498046875, 1.4482421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 7.0, 12.0, 9.0, 13.0, 6.0, 20.0, 20.0, 16.0, 18.0, 22.0, 33.0, 24.0, 29.0, 35.0, 31.0, 32.0, 38.0, 42.0, 43.0, 1064.0, 30.0, 29.0, 37.0, 37.0, 37.0, 32.0, 33.0, 24.0, 36.0, 26.0, 29.0, 17.0, 13.0, 15.0, 20.0, 17.0, 14.0, 18.0, 9.0, 5.0, 4.0, 1.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.07470703125, -3.9384765625, -3.80224609375, -3.666015625, -3.52978515625, -3.3935546875, -3.25732421875, -3.12109375, -2.98486328125, -2.8486328125, -2.71240234375, -2.576171875, -2.43994140625, -2.3037109375, -2.16748046875, -2.03125, -1.89501953125, -1.7587890625, -1.62255859375, -1.486328125, -1.35009765625, -1.2138671875, -1.07763671875, -0.94140625, -0.80517578125, -0.6689453125, -0.53271484375, -0.396484375, -0.26025390625, -0.1240234375, 0.01220703125, 0.1484375, 0.28466796875, 0.4208984375, 0.55712890625, 0.693359375, 0.82958984375, 0.9658203125, 1.10205078125, 1.23828125, 1.37451171875, 1.5107421875, 1.64697265625, 1.783203125, 1.91943359375, 2.0556640625, 2.19189453125, 2.328125, 2.46435546875, 2.6005859375, 2.73681640625, 2.873046875, 3.00927734375, 3.1455078125, 3.28173828125, 3.41796875, 3.55419921875, 3.6904296875, 3.82666015625, 3.962890625, 4.09912109375, 4.2353515625, 4.37158203125, 4.5078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 18.0, 30.0, 47.0, 78.0, 88.0, 154.0, 234.0, 327.0, 463.0, 670.0, 995.0, 1450.0, 2050.0, 3068.0, 4617.0, 6708.0, 9916.0, 14897.0, 22525.0, 35266.0, 55791.0, 89944.0, 152458.0, 1286924.0, 155574.0, 91525.0, 56529.0, 35573.0, 22872.0, 15071.0, 10132.0, 6850.0, 4493.0, 3126.0, 2108.0, 1423.0, 975.0, 672.0, 475.0, 329.0, 220.0, 144.0, 103.0, 65.0, 43.0, 31.0, 23.0, 9.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-1.048828125, -1.016571044921875, -0.98431396484375, -0.952056884765625, -0.9197998046875, -0.887542724609375, -0.85528564453125, -0.823028564453125, -0.790771484375, -0.758514404296875, -0.72625732421875, -0.694000244140625, -0.6617431640625, -0.629486083984375, -0.59722900390625, -0.564971923828125, -0.53271484375, -0.500457763671875, -0.46820068359375, -0.435943603515625, -0.4036865234375, -0.371429443359375, -0.33917236328125, -0.306915283203125, -0.274658203125, -0.242401123046875, -0.21014404296875, -0.177886962890625, -0.1456298828125, -0.113372802734375, -0.08111572265625, -0.048858642578125, -0.0166015625, 0.015655517578125, 0.04791259765625, 0.080169677734375, 0.1124267578125, 0.144683837890625, 0.17694091796875, 0.209197998046875, 0.241455078125, 0.273712158203125, 0.30596923828125, 0.338226318359375, 0.3704833984375, 0.402740478515625, 0.43499755859375, 0.467254638671875, 0.49951171875, 0.531768798828125, 0.56402587890625, 0.596282958984375, 0.6285400390625, 0.660797119140625, 0.69305419921875, 0.725311279296875, 0.757568359375, 0.789825439453125, 0.82208251953125, 0.854339599609375, 0.8865966796875, 0.918853759765625, 0.95111083984375, 0.983367919921875, 1.015625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 8.0, 9.0, 15.0, 15.0, 23.0, 21.0, 26.0, 37.0, 39.0, 57.0, 57.0, 53.0, 63.0, 40.0, 71.0, 40.0, 60.0, 39.0, 40.0, 40.0, 35.0, 23.0, 28.0, 23.0, 9.0, 15.0, 13.0, 12.0, 9.0, 15.0, 9.0, 4.0, 2.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006341934204101562, -0.0006148815155029297, -0.0005955696105957031, -0.0005762577056884766, -0.00055694580078125, -0.0005376338958740234, -0.0005183219909667969, -0.0004990100860595703, -0.00047969818115234375, -0.0004603862762451172, -0.0004410743713378906, -0.00042176246643066406, -0.0004024505615234375, -0.00038313865661621094, -0.0003638267517089844, -0.0003445148468017578, -0.00032520294189453125, -0.0003058910369873047, -0.0002865791320800781, -0.00026726722717285156, -0.000247955322265625, -0.00022864341735839844, -0.00020933151245117188, -0.0001900196075439453, -0.00017070770263671875, -0.0001513957977294922, -0.00013208389282226562, -0.00011277198791503906, -9.34600830078125e-05, -7.414817810058594e-05, -5.4836273193359375e-05, -3.552436828613281e-05, -1.621246337890625e-05, 3.0994415283203125e-06, 2.2411346435546875e-05, 4.172325134277344e-05, 6.103515625e-05, 8.034706115722656e-05, 9.965896606445312e-05, 0.00011897087097167969, 0.00013828277587890625, 0.0001575946807861328, 0.00017690658569335938, 0.00019621849060058594, 0.0002155303955078125, 0.00023484230041503906, 0.0002541542053222656, 0.0002734661102294922, 0.00029277801513671875, 0.0003120899200439453, 0.0003314018249511719, 0.00035071372985839844, 0.000370025634765625, 0.00038933753967285156, 0.0004086494445800781, 0.0004279613494873047, 0.00044727325439453125, 0.0004665851593017578, 0.0004858970642089844, 0.0005052089691162109, 0.0005245208740234375, 0.0005438327789306641, 0.0005631446838378906, 0.0005824565887451172, 0.0006017684936523438]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 9.0, 14.0, 13.0, 12.0, 26.0, 24.0, 26.0, 25.0, 52.0, 48.0, 76.0, 95.0, 127.0, 230.0, 482.0, 1099.0, 318087.0, 725454.0, 1328.0, 478.0, 243.0, 138.0, 121.0, 78.0, 49.0, 32.0, 35.0, 32.0, 22.0, 15.0, 18.0, 10.0, 9.0, 8.0, 7.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01404571533203125, -0.013607501983642578, -0.013169288635253906, -0.012731075286865234, -0.012292861938476562, -0.01185464859008789, -0.011416435241699219, -0.010978221893310547, -0.010540008544921875, -0.010101795196533203, -0.009663581848144531, -0.00922536849975586, -0.008787155151367188, -0.008348941802978516, -0.007910728454589844, -0.007472515106201172, -0.0070343017578125, -0.006596088409423828, -0.006157875061035156, -0.005719661712646484, -0.0052814483642578125, -0.004843235015869141, -0.004405021667480469, -0.003966808319091797, -0.003528594970703125, -0.003090381622314453, -0.0026521682739257812, -0.0022139549255371094, -0.0017757415771484375, -0.0013375282287597656, -0.0008993148803710938, -0.0004611015319824219, -2.288818359375e-05, 0.0004153251647949219, 0.0008535385131835938, 0.0012917518615722656, 0.0017299652099609375, 0.0021681785583496094, 0.0026063919067382812, 0.003044605255126953, 0.003482818603515625, 0.003921031951904297, 0.004359245300292969, 0.004797458648681641, 0.0052356719970703125, 0.005673885345458984, 0.006112098693847656, 0.006550312042236328, 0.006988525390625, 0.007426738739013672, 0.007864952087402344, 0.008303165435791016, 0.008741378784179688, 0.00917959213256836, 0.009617805480957031, 0.010056018829345703, 0.010494232177734375, 0.010932445526123047, 0.011370658874511719, 0.01180887222290039, 0.012247085571289062, 0.012685298919677734, 0.013123512268066406, 0.013561725616455078, 0.01399993896484375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 76.0, 304.0, 397.0, 183.0, 33.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001418866217136383, -0.001380834262818098, -0.001342802424915135, -0.00130477047059685, -0.001266738516278565, -0.0012287066783756018, -0.0011906747240573168, -0.0011526427697390318, -0.0011146108154207468, -0.0010765788611024618, -0.0010385470231994987, -0.0010005150688812137, -0.0009624831145629287, -0.0009244512184523046, -0.0008864193223416805, -0.0008483873680233955, -0.0008103555301204324, -0.0007723236340098083, -0.0007342916796915233, -0.0006962597835808992, -0.0006582278292626143, -0.0006201959331519902, -0.0005821640370413661, -0.0005441320827230811, -0.000506100186612457, -0.0004680682613980025, -0.000430036336183548, -0.0003920044400729239, -0.00035397251485846937, -0.00031594058964401484, -0.00027790869353339076, -0.00023987676831893623, -0.00020184495951980352, -0.000163813034305349, -0.0001257811236428097, -8.774920570431277e-05, -4.9717287765815854e-05, -1.1685362551361322e-05, 2.634654811117798e-05, 6.437845877371728e-05, 0.00010241038398817182, 0.00014044230920262635, 0.00017847421986516565, 0.00021650613052770495, 0.0002545380557421595, 0.000292569980956614, 0.0003306018770672381, 0.0003686338022816926, 0.00040666572749614716, 0.0004446976527106017, 0.0004827295779250562, 0.0005207614740356803, 0.0005587934283539653, 0.0005968253244645894, 0.0006348572205752134, 0.0006728891748934984, 0.0007109210710041225, 0.0007489529671147466, 0.0007869849214330316, 0.0008250168175436556, 0.0008630487136542797, 0.0009010806679725647, 0.0009391125640831888, 0.0009771444601938128, 0.0010151764145120978]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 4.0, 10.0, 7.0, 8.0, 9.0, 7.0, 20.0, 20.0, 19.0, 26.0, 24.0, 30.0, 31.0, 44.0, 33.0, 34.0, 23.0, 38.0, 38.0, 46.0, 30.0, 40.0, 56.0, 32.0, 41.0, 44.0, 36.0, 26.0, 31.0, 16.0, 30.0, 28.0, 18.0, 20.0, 14.0, 13.0, 9.0, 11.0, 13.0, 3.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003337860107421875, -0.00032325461506843567, -0.00031272321939468384, -0.000302191823720932, -0.0002916604280471802, -0.00028112903237342834, -0.0002705976366996765, -0.0002600662410259247, -0.00024953484535217285, -0.00023900344967842102, -0.0002284720540046692, -0.00021794065833091736, -0.00020740926265716553, -0.0001968778669834137, -0.00018634647130966187, -0.00017581507563591003, -0.0001652836799621582, -0.00015475228428840637, -0.00014422088861465454, -0.0001336894929409027, -0.00012315809726715088, -0.00011262670159339905, -0.00010209530591964722, -9.156391024589539e-05, -8.103251457214355e-05, -7.050111889839172e-05, -5.996972322463989e-05, -4.943832755088806e-05, -3.890693187713623e-05, -2.83755362033844e-05, -1.784414052963257e-05, -7.312744855880737e-06, 3.2186508178710938e-06, 1.3750046491622925e-05, 2.4281442165374756e-05, 3.481283783912659e-05, 4.534423351287842e-05, 5.587562918663025e-05, 6.640702486038208e-05, 7.693842053413391e-05, 8.746981620788574e-05, 9.800121188163757e-05, 0.0001085326075553894, 0.00011906400322914124, 0.00012959539890289307, 0.0001401267945766449, 0.00015065819025039673, 0.00016118958592414856, 0.0001717209815979004, 0.00018225237727165222, 0.00019278377294540405, 0.00020331516861915588, 0.00021384656429290771, 0.00022437795996665955, 0.00023490935564041138, 0.0002454407513141632, 0.00025597214698791504, 0.00026650354266166687, 0.0002770349383354187, 0.00028756633400917053, 0.00029809772968292236, 0.0003086291253566742, 0.000319160521030426, 0.00032969191670417786, 0.0003402233123779297]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 11.0, 16.0, 19.0, 18.0, 27.0, 18.0, 32.0, 17.0, 30.0, 40.0, 38.0, 27.0, 46.0, 40.0, 35.0, 44.0, 44.0, 41.0, 38.0, 34.0, 30.0, 49.0, 38.0, 34.0, 29.0, 30.0, 30.0, 21.0, 19.0, 11.0, 9.0, 14.0, 7.0, 7.0, 7.0, 8.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.4053955078125, -7.166259765625, -6.9271240234375, -6.68798828125, -6.4488525390625, -6.209716796875, -5.9705810546875, -5.7314453125, -5.4923095703125, -5.253173828125, -5.0140380859375, -4.77490234375, -4.5357666015625, -4.296630859375, -4.0574951171875, -3.818359375, -3.5792236328125, -3.340087890625, -3.1009521484375, -2.86181640625, -2.6226806640625, -2.383544921875, -2.1444091796875, -1.9052734375, -1.6661376953125, -1.427001953125, -1.1878662109375, -0.94873046875, -0.7095947265625, -0.470458984375, -0.2313232421875, 0.0078125, 0.2469482421875, 0.486083984375, 0.7252197265625, 0.96435546875, 1.2034912109375, 1.442626953125, 1.6817626953125, 1.9208984375, 2.1600341796875, 2.399169921875, 2.6383056640625, 2.87744140625, 3.1165771484375, 3.355712890625, 3.5948486328125, 3.833984375, 4.0731201171875, 4.312255859375, 4.5513916015625, 4.79052734375, 5.0296630859375, 5.268798828125, 5.5079345703125, 5.7470703125, 5.9862060546875, 6.225341796875, 6.4644775390625, 6.70361328125, 6.9427490234375, 7.181884765625, 7.4210205078125, 7.66015625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 6.0, 11.0, 15.0, 17.0, 24.0, 28.0, 50.0, 61.0, 88.0, 108.0, 138.0, 180.0, 244.0, 342.0, 497.0, 706.0, 1279.0, 4113.0, 26305.0, 595492.0, 390516.0, 21036.0, 3641.0, 1120.0, 651.0, 488.0, 358.0, 284.0, 192.0, 137.0, 102.0, 77.0, 55.0, 36.0, 22.0, 34.0, 22.0, 16.0, 12.0, 10.0, 7.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.73828125, -18.1328125, -17.52734375, -16.921875, -16.31640625, -15.7109375, -15.10546875, -14.5, -13.89453125, -13.2890625, -12.68359375, -12.078125, -11.47265625, -10.8671875, -10.26171875, -9.65625, -9.05078125, -8.4453125, -7.83984375, -7.234375, -6.62890625, -6.0234375, -5.41796875, -4.8125, -4.20703125, -3.6015625, -2.99609375, -2.390625, -1.78515625, -1.1796875, -0.57421875, 0.03125, 0.63671875, 1.2421875, 1.84765625, 2.453125, 3.05859375, 3.6640625, 4.26953125, 4.875, 5.48046875, 6.0859375, 6.69140625, 7.296875, 7.90234375, 8.5078125, 9.11328125, 9.71875, 10.32421875, 10.9296875, 11.53515625, 12.140625, 12.74609375, 13.3515625, 13.95703125, 14.5625, 15.16796875, 15.7734375, 16.37890625, 16.984375, 17.58984375, 18.1953125, 18.80078125, 19.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 4.0, 7.0, 18.0, 15.0, 16.0, 13.0, 25.0, 29.0, 26.0, 23.0, 39.0, 39.0, 41.0, 56.0, 52.0, 105.0, 1564.0, 428.0, 90.0, 54.0, 45.0, 49.0, 40.0, 38.0, 36.0, 32.0, 18.0, 25.0, 19.0, 16.0, 14.0, 16.0, 13.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.09375, -23.3623046875, -22.630859375, -21.8994140625, -21.16796875, -20.4365234375, -19.705078125, -18.9736328125, -18.2421875, -17.5107421875, -16.779296875, -16.0478515625, -15.31640625, -14.5849609375, -13.853515625, -13.1220703125, -12.390625, -11.6591796875, -10.927734375, -10.1962890625, -9.46484375, -8.7333984375, -8.001953125, -7.2705078125, -6.5390625, -5.8076171875, -5.076171875, -4.3447265625, -3.61328125, -2.8818359375, -2.150390625, -1.4189453125, -0.6875, 0.0439453125, 0.775390625, 1.5068359375, 2.23828125, 2.9697265625, 3.701171875, 4.4326171875, 5.1640625, 5.8955078125, 6.626953125, 7.3583984375, 8.08984375, 8.8212890625, 9.552734375, 10.2841796875, 11.015625, 11.7470703125, 12.478515625, 13.2099609375, 13.94140625, 14.6728515625, 15.404296875, 16.1357421875, 16.8671875, 17.5986328125, 18.330078125, 19.0615234375, 19.79296875, 20.5244140625, 21.255859375, 21.9873046875, 22.71875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 1.0, 3.0, 5.0, 3.0, 13.0, 10.0, 19.0, 14.0, 19.0, 20.0, 27.0, 30.0, 28.0, 37.0, 60.0, 70.0, 103.0, 197.0, 326.0, 959.0, 19838.0, 3113929.0, 8364.0, 758.0, 304.0, 164.0, 99.0, 50.0, 43.0, 31.0, 32.0, 33.0, 26.0, 16.0, 21.0, 16.0, 10.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.625, -62.5673828125, -60.509765625, -58.4521484375, -56.39453125, -54.3369140625, -52.279296875, -50.2216796875, -48.1640625, -46.1064453125, -44.048828125, -41.9912109375, -39.93359375, -37.8759765625, -35.818359375, -33.7607421875, -31.703125, -29.6455078125, -27.587890625, -25.5302734375, -23.47265625, -21.4150390625, -19.357421875, -17.2998046875, -15.2421875, -13.1845703125, -11.126953125, -9.0693359375, -7.01171875, -4.9541015625, -2.896484375, -0.8388671875, 1.21875, 3.2763671875, 5.333984375, 7.3916015625, 9.44921875, 11.5068359375, 13.564453125, 15.6220703125, 17.6796875, 19.7373046875, 21.794921875, 23.8525390625, 25.91015625, 27.9677734375, 30.025390625, 32.0830078125, 34.140625, 36.1982421875, 38.255859375, 40.3134765625, 42.37109375, 44.4287109375, 46.486328125, 48.5439453125, 50.6015625, 52.6591796875, 54.716796875, 56.7744140625, 58.83203125, 60.8896484375, 62.947265625, 65.0048828125, 67.0625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 226.0, 643.0, 131.0, 8.0, 0.0, 0.0, 1.0], "bins": [-178.9009552001953, -175.83958435058594, -172.7781982421875, -169.71682739257812, -166.6554412841797, -163.5940704345703, -160.53268432617188, -157.4713134765625, -154.40992736816406, -151.3485565185547, -148.28717041015625, -145.22579956054688, -142.16441345214844, -139.10304260253906, -136.04165649414062, -132.98028564453125, -129.91891479492188, -126.85753631591797, -123.79615783691406, -120.73477935791016, -117.67340087890625, -114.61203002929688, -111.55064392089844, -108.48927307128906, -105.42788696289062, -102.36650848388672, -99.30513000488281, -96.2437515258789, -93.182373046875, -90.12100219726562, -87.05961608886719, -83.99824523925781, -80.93685913085938, -77.87548065185547, -74.81410217285156, -71.75272369384766, -68.69134521484375, -65.62997436523438, -62.5685920715332, -59.50721740722656, -56.445838928222656, -53.38446044921875, -50.323081970214844, -47.26170349121094, -44.2003288269043, -41.13895034790039, -38.077571868896484, -35.016197204589844, -31.954818725585938, -28.89344024658203, -25.832063674926758, -22.77068519592285, -19.709308624267578, -16.647930145263672, -13.586551666259766, -10.525175094604492, -7.463796615600586, -4.402419090270996, -1.341041088104248, 1.7203369140625, 4.78171443939209, 7.84309196472168, 10.904470443725586, 13.96584701538086, 17.027225494384766]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 6.0, 4.0, 5.0, 15.0, 9.0, 9.0, 10.0, 23.0, 15.0, 17.0, 23.0, 29.0, 18.0, 38.0, 42.0, 28.0, 35.0, 43.0, 46.0, 39.0, 51.0, 38.0, 51.0, 35.0, 39.0, 38.0, 24.0, 38.0, 29.0, 39.0, 24.0, 21.0, 11.0, 20.0, 19.0, 10.0, 17.0, 10.0, 7.0, 6.0, 5.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-55.071990966796875, -53.43459701538086, -51.797203063964844, -50.15980529785156, -48.52241134643555, -46.88501739501953, -45.247623443603516, -43.6102294921875, -41.972835540771484, -40.33544158935547, -38.69804763793945, -37.06065368652344, -35.423255920410156, -33.78586196899414, -32.148468017578125, -30.51107406616211, -28.87367820739746, -27.236284255981445, -25.598888397216797, -23.96149444580078, -22.324100494384766, -20.68670654296875, -19.0493106842041, -17.411916732788086, -15.774521827697754, -14.137126922607422, -12.499732971191406, -10.862338066101074, -9.224943161010742, -7.587549209594727, -5.9501543045043945, -4.312760353088379, -2.675365447998047, -1.0379709005355835, 0.5994236469268799, 2.236818313598633, 3.8742127418518066, 5.5116071701049805, 7.1490020751953125, 8.786396026611328, 10.42379093170166, 12.061185836791992, 13.698579788208008, 15.33597469329834, 16.973369598388672, 18.610763549804688, 20.248157501220703, 21.88555145263672, 23.522947311401367, 25.160341262817383, 26.79773712158203, 28.435131072998047, 30.072525024414062, 31.709918975830078, 33.347312927246094, 34.984710693359375, 36.62210464477539, 38.259498596191406, 39.89689254760742, 41.53428649902344, 43.17168426513672, 44.809078216552734, 46.44647216796875, 48.083866119384766, 49.72126007080078]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 5.0, 12.0, 8.0, 13.0, 14.0, 12.0, 21.0, 16.0, 18.0, 26.0, 31.0, 26.0, 22.0, 27.0, 30.0, 39.0, 41.0, 39.0, 31.0, 36.0, 40.0, 38.0, 38.0, 30.0, 42.0, 38.0, 35.0, 44.0, 28.0, 23.0, 22.0, 24.0, 21.0, 18.0, 9.0, 13.0, 10.0, 13.0, 11.0, 11.0, 3.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.07391357421875, -6.8470458984375, -6.62017822265625, -6.393310546875, -6.16644287109375, -5.9395751953125, -5.71270751953125, -5.48583984375, -5.25897216796875, -5.0321044921875, -4.80523681640625, -4.578369140625, -4.35150146484375, -4.1246337890625, -3.89776611328125, -3.6708984375, -3.44403076171875, -3.2171630859375, -2.99029541015625, -2.763427734375, -2.53656005859375, -2.3096923828125, -2.08282470703125, -1.85595703125, -1.62908935546875, -1.4022216796875, -1.17535400390625, -0.948486328125, -0.72161865234375, -0.4947509765625, -0.26788330078125, -0.041015625, 0.18585205078125, 0.4127197265625, 0.63958740234375, 0.866455078125, 1.09332275390625, 1.3201904296875, 1.54705810546875, 1.77392578125, 2.00079345703125, 2.2276611328125, 2.45452880859375, 2.681396484375, 2.90826416015625, 3.1351318359375, 3.36199951171875, 3.5888671875, 3.81573486328125, 4.0426025390625, 4.26947021484375, 4.496337890625, 4.72320556640625, 4.9500732421875, 5.17694091796875, 5.40380859375, 5.63067626953125, 5.8575439453125, 6.08441162109375, 6.311279296875, 6.53814697265625, 6.7650146484375, 6.99188232421875, 7.21875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 5.0, 6.0, 1.0, 10.0, 11.0, 3.0, 24.0, 28.0, 23.0, 46.0, 58.0, 62.0, 65.0, 95.0, 116.0, 183.0, 250.0, 377.0, 656.0, 1349.0, 3568.0, 13821.0, 129338.0, 1938843.0, 1947696.0, 136701.0, 14029.0, 3599.0, 1385.0, 604.0, 371.0, 217.0, 180.0, 127.0, 88.0, 74.0, 65.0, 30.0, 34.0, 30.0, 21.0, 19.0, 21.0, 11.0, 13.0, 10.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.1162109375, -15.560546875, -15.0048828125, -14.44921875, -13.8935546875, -13.337890625, -12.7822265625, -12.2265625, -11.6708984375, -11.115234375, -10.5595703125, -10.00390625, -9.4482421875, -8.892578125, -8.3369140625, -7.78125, -7.2255859375, -6.669921875, -6.1142578125, -5.55859375, -5.0029296875, -4.447265625, -3.8916015625, -3.3359375, -2.7802734375, -2.224609375, -1.6689453125, -1.11328125, -0.5576171875, -0.001953125, 0.5537109375, 1.109375, 1.6650390625, 2.220703125, 2.7763671875, 3.33203125, 3.8876953125, 4.443359375, 4.9990234375, 5.5546875, 6.1103515625, 6.666015625, 7.2216796875, 7.77734375, 8.3330078125, 8.888671875, 9.4443359375, 10.0, 10.5556640625, 11.111328125, 11.6669921875, 12.22265625, 12.7783203125, 13.333984375, 13.8896484375, 14.4453125, 15.0009765625, 15.556640625, 16.1123046875, 16.66796875, 17.2236328125, 17.779296875, 18.3349609375, 18.890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 17.0, 19.0, 20.0, 44.0, 62.0, 84.0, 117.0, 148.0, 249.0, 399.0, 563.0, 616.0, 575.0, 392.0, 250.0, 165.0, 92.0, 81.0, 59.0, 32.0, 25.0, 15.0, 13.0, 9.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.31005859375, -13.8076171875, -13.30517578125, -12.802734375, -12.30029296875, -11.7978515625, -11.29541015625, -10.79296875, -10.29052734375, -9.7880859375, -9.28564453125, -8.783203125, -8.28076171875, -7.7783203125, -7.27587890625, -6.7734375, -6.27099609375, -5.7685546875, -5.26611328125, -4.763671875, -4.26123046875, -3.7587890625, -3.25634765625, -2.75390625, -2.25146484375, -1.7490234375, -1.24658203125, -0.744140625, -0.24169921875, 0.2607421875, 0.76318359375, 1.265625, 1.76806640625, 2.2705078125, 2.77294921875, 3.275390625, 3.77783203125, 4.2802734375, 4.78271484375, 5.28515625, 5.78759765625, 6.2900390625, 6.79248046875, 7.294921875, 7.79736328125, 8.2998046875, 8.80224609375, 9.3046875, 9.80712890625, 10.3095703125, 10.81201171875, 11.314453125, 11.81689453125, 12.3193359375, 12.82177734375, 13.32421875, 13.82666015625, 14.3291015625, 14.83154296875, 15.333984375, 15.83642578125, 16.3388671875, 16.84130859375, 17.34375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 20.0, 23.0, 34.0, 43.0, 54.0, 78.0, 114.0, 125.0, 184.0, 313.0, 668.0, 2208.0, 45152.0, 4049742.0, 90533.0, 3013.0, 780.0, 324.0, 217.0, 131.0, 110.0, 104.0, 73.0, 41.0, 36.0, 25.0, 15.0, 24.0, 10.0, 19.0, 5.0, 5.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.9375, -49.21484375, -47.4921875, -45.76953125, -44.046875, -42.32421875, -40.6015625, -38.87890625, -37.15625, -35.43359375, -33.7109375, -31.98828125, -30.265625, -28.54296875, -26.8203125, -25.09765625, -23.375, -21.65234375, -19.9296875, -18.20703125, -16.484375, -14.76171875, -13.0390625, -11.31640625, -9.59375, -7.87109375, -6.1484375, -4.42578125, -2.703125, -0.98046875, 0.7421875, 2.46484375, 4.1875, 5.91015625, 7.6328125, 9.35546875, 11.078125, 12.80078125, 14.5234375, 16.24609375, 17.96875, 19.69140625, 21.4140625, 23.13671875, 24.859375, 26.58203125, 28.3046875, 30.02734375, 31.75, 33.47265625, 35.1953125, 36.91796875, 38.640625, 40.36328125, 42.0859375, 43.80859375, 45.53125, 47.25390625, 48.9765625, 50.69921875, 52.421875, 54.14453125, 55.8671875, 57.58984375, 59.3125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 37.0, 138.0, 304.0, 348.0, 131.0, 36.0, 8.0, 2.0, 4.0], "bins": [-213.93435668945312, -210.24412536621094, -206.55389404296875, -202.86366271972656, -199.17343139648438, -195.48321533203125, -191.79298400878906, -188.10275268554688, -184.4125213623047, -180.7222900390625, -177.0320587158203, -173.34182739257812, -169.65159606933594, -165.96136474609375, -162.27114868164062, -158.58091735839844, -154.89068603515625, -151.20045471191406, -147.51022338867188, -143.8199920654297, -140.1297607421875, -136.43954467773438, -132.7493133544922, -129.05908203125, -125.36884307861328, -121.6786117553711, -117.9883804321289, -114.29815673828125, -110.60792541503906, -106.91769409179688, -103.22746276855469, -99.5372314453125, -95.84700012207031, -92.15676879882812, -88.46653747558594, -84.77631378173828, -81.0860824584961, -77.3958511352539, -73.70561981201172, -70.01539611816406, -66.32516479492188, -62.63493347167969, -58.944705963134766, -55.25447463989258, -51.564247131347656, -47.87401580810547, -44.18378448486328, -40.49355697631836, -36.80332946777344, -33.11309814453125, -29.422870635986328, -25.73263931274414, -22.04241180419922, -18.35218048095703, -14.661951065063477, -10.971721649169922, -7.281492233276367, -3.5912625789642334, 0.09896707534790039, 3.7891969680786133, 7.479426383972168, 11.169656753540039, 14.859886169433594, 18.55011558532715, 22.240345001220703]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 5.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 14.0, 15.0, 17.0, 19.0, 26.0, 27.0, 25.0, 19.0, 24.0, 29.0, 37.0, 38.0, 39.0, 40.0, 31.0, 32.0, 34.0, 46.0, 31.0, 47.0, 33.0, 26.0, 32.0, 47.0, 23.0, 23.0, 13.0, 18.0, 14.0, 25.0, 16.0, 16.0, 9.0, 15.0, 12.0, 10.0, 3.0, 11.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-35.75941467285156, -34.63930130004883, -33.51919174194336, -32.399078369140625, -31.27896499633789, -30.15885353088379, -29.038742065429688, -27.918628692626953, -26.79851722717285, -25.67840576171875, -24.558292388916016, -23.438180923461914, -22.318069458007812, -21.197956085205078, -20.077844619750977, -18.957733154296875, -17.83761978149414, -16.71750831604004, -15.597394943237305, -14.477283477783203, -13.357171058654785, -12.237058639526367, -11.116947174072266, -9.996834754943848, -8.87672233581543, -7.756609916687012, -6.636497974395752, -5.516386032104492, -4.396273612976074, -3.2761611938476562, -2.1560492515563965, -1.0359373092651367, 0.08417510986328125, 1.2042872905731201, 2.324399471282959, 3.444511651992798, 4.564623832702637, 5.684736251831055, 6.8048481941223145, 7.924960136413574, 9.045072555541992, 10.16518497467041, 11.285297393798828, 12.40540885925293, 13.525521278381348, 14.645633697509766, 15.765745162963867, 16.88585662841797, 18.005970001220703, 19.126081466674805, 20.24619483947754, 21.36630630493164, 22.486419677734375, 23.606531143188477, 24.726642608642578, 25.846755981445312, 26.966867446899414, 28.086978912353516, 29.20709228515625, 30.32720375061035, 31.447315216064453, 32.56742858886719, 33.68754196166992, 34.80765151977539, 35.927764892578125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 33.0, 30.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 2.0, 4.0, 9.0, 7.0, 20.0, 22.0, 37.0, 43.0, 85.0, 105.0, 166.0, 227.0, 354.0, 438.0, 709.0, 1024.0, 1466.0, 2186.0, 3143.0, 4669.0, 6694.0, 10090.0, 15057.0, 22638.0, 34451.0, 53758.0, 85829.0, 141256.0, 224005.0, 163757.0, 98493.0, 61074.0, 39031.0, 25544.0, 16981.0, 11381.0, 7714.0, 5004.0, 3476.0, 2380.0, 1603.0, 1092.0, 778.0, 511.0, 378.0, 290.0, 189.0, 141.0, 77.0, 46.0, 44.0, 38.0, 16.0, 13.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0791015625, -1.0449981689453125, -1.010894775390625, -0.9767913818359375, -0.94268798828125, -0.9085845947265625, -0.874481201171875, -0.8403778076171875, -0.8062744140625, -0.7721710205078125, -0.738067626953125, -0.7039642333984375, -0.66986083984375, -0.6357574462890625, -0.601654052734375, -0.5675506591796875, -0.533447265625, -0.4993438720703125, -0.465240478515625, -0.4311370849609375, -0.39703369140625, -0.3629302978515625, -0.328826904296875, -0.2947235107421875, -0.2606201171875, -0.2265167236328125, -0.192413330078125, -0.1583099365234375, -0.12420654296875, -0.0901031494140625, -0.055999755859375, -0.0218963623046875, 0.01220703125, 0.0463104248046875, 0.080413818359375, 0.1145172119140625, 0.14862060546875, 0.1827239990234375, 0.216827392578125, 0.2509307861328125, 0.2850341796875, 0.3191375732421875, 0.353240966796875, 0.3873443603515625, 0.42144775390625, 0.4555511474609375, 0.489654541015625, 0.5237579345703125, 0.557861328125, 0.5919647216796875, 0.626068115234375, 0.6601715087890625, 0.69427490234375, 0.7283782958984375, 0.762481689453125, 0.7965850830078125, 0.8306884765625, 0.8647918701171875, 0.898895263671875, 0.9329986572265625, 0.96710205078125, 1.0012054443359375, 1.035308837890625, 1.0694122314453125, 1.103515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 10.0, 10.0, 8.0, 18.0, 13.0, 27.0, 23.0, 28.0, 29.0, 25.0, 25.0, 23.0, 34.0, 41.0, 45.0, 34.0, 37.0, 1069.0, 38.0, 34.0, 30.0, 50.0, 37.0, 35.0, 40.0, 40.0, 23.0, 24.0, 29.0, 19.0, 19.0, 11.0, 13.0, 12.0, 5.0, 9.0, 6.0, 12.0, 1.0, 5.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2972412109375, -5.141357421875, -4.9854736328125, -4.82958984375, -4.6737060546875, -4.517822265625, -4.3619384765625, -4.2060546875, -4.0501708984375, -3.894287109375, -3.7384033203125, -3.58251953125, -3.4266357421875, -3.270751953125, -3.1148681640625, -2.958984375, -2.8031005859375, -2.647216796875, -2.4913330078125, -2.33544921875, -2.1795654296875, -2.023681640625, -1.8677978515625, -1.7119140625, -1.5560302734375, -1.400146484375, -1.2442626953125, -1.08837890625, -0.9324951171875, -0.776611328125, -0.6207275390625, -0.46484375, -0.3089599609375, -0.153076171875, 0.0028076171875, 0.15869140625, 0.3145751953125, 0.470458984375, 0.6263427734375, 0.7822265625, 0.9381103515625, 1.093994140625, 1.2498779296875, 1.40576171875, 1.5616455078125, 1.717529296875, 1.8734130859375, 2.029296875, 2.1851806640625, 2.341064453125, 2.4969482421875, 2.65283203125, 2.8087158203125, 2.964599609375, 3.1204833984375, 3.2763671875, 3.4322509765625, 3.588134765625, 3.7440185546875, 3.89990234375, 4.0557861328125, 4.211669921875, 4.3675537109375, 4.5234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 12.0, 25.0, 41.0, 46.0, 91.0, 138.0, 172.0, 277.0, 379.0, 615.0, 920.0, 1456.0, 2094.0, 3098.0, 4694.0, 7172.0, 10883.0, 17039.0, 26863.0, 44315.0, 74643.0, 131300.0, 1289586.0, 201971.0, 110593.0, 63961.0, 38149.0, 23508.0, 14746.0, 9713.0, 6277.0, 4163.0, 2711.0, 1828.0, 1251.0, 801.0, 558.0, 353.0, 229.0, 158.0, 102.0, 63.0, 48.0, 28.0, 17.0, 13.0, 8.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.169921875, -1.1320037841796875, -1.094085693359375, -1.0561676025390625, -1.01824951171875, -0.9803314208984375, -0.942413330078125, -0.9044952392578125, -0.8665771484375, -0.8286590576171875, -0.790740966796875, -0.7528228759765625, -0.71490478515625, -0.6769866943359375, -0.639068603515625, -0.6011505126953125, -0.563232421875, -0.5253143310546875, -0.487396240234375, -0.4494781494140625, -0.41156005859375, -0.3736419677734375, -0.335723876953125, -0.2978057861328125, -0.2598876953125, -0.2219696044921875, -0.184051513671875, -0.1461334228515625, -0.10821533203125, -0.0702972412109375, -0.032379150390625, 0.0055389404296875, 0.04345703125, 0.0813751220703125, 0.119293212890625, 0.1572113037109375, 0.19512939453125, 0.2330474853515625, 0.270965576171875, 0.3088836669921875, 0.3468017578125, 0.3847198486328125, 0.422637939453125, 0.4605560302734375, 0.49847412109375, 0.5363922119140625, 0.574310302734375, 0.6122283935546875, 0.650146484375, 0.6880645751953125, 0.725982666015625, 0.7639007568359375, 0.80181884765625, 0.8397369384765625, 0.877655029296875, 0.9155731201171875, 0.9534912109375, 0.9914093017578125, 1.029327392578125, 1.0672454833984375, 1.10516357421875, 1.1430816650390625, 1.180999755859375, 1.2189178466796875, 1.2568359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 4.0, 3.0, 7.0, 16.0, 12.0, 17.0, 17.0, 18.0, 29.0, 37.0, 53.0, 68.0, 71.0, 91.0, 84.0, 84.0, 79.0, 69.0, 42.0, 47.0, 33.0, 27.0, 19.0, 21.0, 14.0, 12.0, 6.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010671615600585938, -0.0010363012552261353, -0.0010054409503936768, -0.0009745806455612183, -0.0009437203407287598, -0.0009128600358963013, -0.0008819997310638428, -0.0008511394262313843, -0.0008202791213989258, -0.0007894188165664673, -0.0007585585117340088, -0.0007276982069015503, -0.0006968379020690918, -0.0006659775972366333, -0.0006351172924041748, -0.0006042569875717163, -0.0005733966827392578, -0.0005425363779067993, -0.0005116760730743408, -0.0004808157682418823, -0.00044995546340942383, -0.00041909515857696533, -0.00038823485374450684, -0.00035737454891204834, -0.00032651424407958984, -0.00029565393924713135, -0.00026479363441467285, -0.00023393332958221436, -0.00020307302474975586, -0.00017221271991729736, -0.00014135241508483887, -0.00011049211025238037, -7.963180541992188e-05, -4.877150058746338e-05, -1.7911195755004883e-05, 1.2949109077453613e-05, 4.380941390991211e-05, 7.46697187423706e-05, 0.0001055300235748291, 0.0001363903284072876, 0.0001672506332397461, 0.0001981109380722046, 0.00022897124290466309, 0.0002598315477371216, 0.0002906918525695801, 0.0003215521574020386, 0.00035241246223449707, 0.00038327276706695557, 0.00041413307189941406, 0.00044499337673187256, 0.00047585368156433105, 0.0005067139863967896, 0.000537574291229248, 0.0005684345960617065, 0.000599294900894165, 0.0006301552057266235, 0.000661015510559082, 0.0006918758153915405, 0.000722736120223999, 0.0007535964250564575, 0.000784456729888916, 0.0008153170347213745, 0.000846177339553833, 0.0008770376443862915, 0.00090789794921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 15.0, 11.0, 15.0, 24.0, 36.0, 38.0, 47.0, 70.0, 98.0, 157.0, 308.0, 575.0, 3473.0, 1038840.0, 3403.0, 605.0, 287.0, 164.0, 91.0, 68.0, 59.0, 42.0, 26.0, 26.0, 11.0, 20.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.018646240234375, -0.018014192581176758, -0.017382144927978516, -0.016750097274780273, -0.01611804962158203, -0.015486001968383789, -0.014853954315185547, -0.014221906661987305, -0.013589859008789062, -0.01295781135559082, -0.012325763702392578, -0.011693716049194336, -0.011061668395996094, -0.010429620742797852, -0.00979757308959961, -0.009165525436401367, -0.008533477783203125, -0.007901430130004883, -0.007269382476806641, -0.0066373348236083984, -0.006005287170410156, -0.005373239517211914, -0.004741191864013672, -0.00410914421081543, -0.0034770965576171875, -0.0028450489044189453, -0.002213001251220703, -0.001580953598022461, -0.0009489059448242188, -0.00031685829162597656, 0.0003151893615722656, 0.0009472370147705078, 0.00157928466796875, 0.002211332321166992, 0.0028433799743652344, 0.0034754276275634766, 0.004107475280761719, 0.004739522933959961, 0.005371570587158203, 0.006003618240356445, 0.0066356658935546875, 0.00726771354675293, 0.007899761199951172, 0.008531808853149414, 0.009163856506347656, 0.009795904159545898, 0.01042795181274414, 0.011059999465942383, 0.011692047119140625, 0.012324094772338867, 0.01295614242553711, 0.013588190078735352, 0.014220237731933594, 0.014852285385131836, 0.015484333038330078, 0.01611638069152832, 0.016748428344726562, 0.017380475997924805, 0.018012523651123047, 0.01864457130432129, 0.01927661895751953, 0.019908666610717773, 0.020540714263916016, 0.021172761917114258, 0.0218048095703125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 14.0, 38.0, 64.0, 118.0, 160.0, 200.0, 158.0, 100.0, 68.0, 39.0, 18.0, 17.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004894381272606552, -0.0004709027416538447, -0.00045236735604703426, -0.0004338319704402238, -0.00041529658483341336, -0.00039676117012277246, -0.000378225784515962, -0.00035969039890915155, -0.0003411550133023411, -0.00032261962769553065, -0.0003040842420887202, -0.00028554885648190975, -0.00026701344177126884, -0.00024847808526828885, -0.00022994267055764794, -0.0002114072849508375, -0.00019287189934402704, -0.0001743365137372166, -0.00015580112813040614, -0.00013726572797168046, -0.00011873034236487001, -0.00010019495675805956, -8.16595638752915e-05, -6.312417099252343e-05, -4.458878538571298e-05, -2.6053396140923724e-05, -7.518006896134466e-06, 1.1017382348654792e-05, 2.955277159344405e-05, 4.80881572002545e-05, 6.662355008302256e-05, 8.515894296579063e-05, 0.00010369427036494017, 0.00012222965597175062, 0.00014076504157856107, 0.00015930044173728675, 0.0001778358273440972, 0.00019637121295090765, 0.00021490661310963333, 0.00023344199871644378, 0.00025197738432325423, 0.0002705127699300647, 0.00028904815553687513, 0.0003075835411436856, 0.0003261189558543265, 0.0003446543123573065, 0.0003631897270679474, 0.00038172511267475784, 0.0004002604982815683, 0.00041879588388837874, 0.0004373312694951892, 0.00045586665510199964, 0.0004744020407088101, 0.000492937455419451, 0.000511472811922431, 0.0005300082266330719, 0.0005485436413437128, 0.0005670790560543537, 0.0005856144125573337, 0.0006041498272679746, 0.0006226851837709546, 0.0006412205984815955, 0.0006597559549845755, 0.0006782913696952164, 0.0006968267261981964]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 4.0, 5.0, 8.0, 13.0, 11.0, 14.0, 18.0, 17.0, 19.0, 26.0, 20.0, 27.0, 29.0, 30.0, 48.0, 32.0, 23.0, 40.0, 41.0, 27.0, 33.0, 47.0, 40.0, 41.0, 27.0, 39.0, 38.0, 25.0, 26.0, 32.0, 23.0, 15.0, 21.0, 21.0, 18.0, 10.0, 13.0, 11.0, 8.0, 17.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003337264060974121, -0.0003224192187190056, -0.00031111203134059906, -0.00029980484396219254, -0.000288497656583786, -0.0002771904692053795, -0.00026588328182697296, -0.00025457609444856644, -0.0002432689070701599, -0.0002319617196917534, -0.00022065453231334686, -0.00020934734493494034, -0.0001980401575565338, -0.0001867329701781273, -0.00017542578279972076, -0.00016411859542131424, -0.00015281140804290771, -0.0001415042206645012, -0.00013019703328609467, -0.00011888984590768814, -0.00010758265852928162, -9.627547115087509e-05, -8.496828377246857e-05, -7.366109639406204e-05, -6.235390901565552e-05, -5.104672163724899e-05, -3.973953425884247e-05, -2.8432346880435944e-05, -1.712515950202942e-05, -5.817972123622894e-06, 5.48921525478363e-06, 1.6796402633190155e-05, 2.810359001159668e-05, 3.9410777390003204e-05, 5.071796476840973e-05, 6.202515214681625e-05, 7.333233952522278e-05, 8.46395269036293e-05, 9.594671428203583e-05, 0.00010725390166044235, 0.00011856108903884888, 0.0001298682764172554, 0.00014117546379566193, 0.00015248265117406845, 0.00016378983855247498, 0.0001750970259308815, 0.00018640421330928802, 0.00019771140068769455, 0.00020901858806610107, 0.0002203257754445076, 0.00023163296282291412, 0.00024294015020132065, 0.00025424733757972717, 0.0002655545249581337, 0.0002768617123365402, 0.00028816889971494675, 0.00029947608709335327, 0.0003107832744717598, 0.0003220904618501663, 0.00033339764922857285, 0.00034470483660697937, 0.0003560120239853859, 0.0003673192113637924, 0.00037862639874219894, 0.00038993358612060547]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 6.0, 6.0, 12.0, 13.0, 6.0, 22.0, 17.0, 19.0, 23.0, 34.0, 22.0, 27.0, 28.0, 37.0, 42.0, 34.0, 31.0, 43.0, 35.0, 40.0, 43.0, 46.0, 38.0, 31.0, 34.0, 29.0, 33.0, 30.0, 28.0, 22.0, 27.0, 14.0, 18.0, 19.0, 16.0, 13.0, 9.0, 9.0, 10.0, 4.0, 8.0, 3.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51953125, -7.28167724609375, -7.0438232421875, -6.80596923828125, -6.568115234375, -6.33026123046875, -6.0924072265625, -5.85455322265625, -5.61669921875, -5.37884521484375, -5.1409912109375, -4.90313720703125, -4.665283203125, -4.42742919921875, -4.1895751953125, -3.95172119140625, -3.7138671875, -3.47601318359375, -3.2381591796875, -3.00030517578125, -2.762451171875, -2.52459716796875, -2.2867431640625, -2.04888916015625, -1.81103515625, -1.57318115234375, -1.3353271484375, -1.09747314453125, -0.859619140625, -0.62176513671875, -0.3839111328125, -0.14605712890625, 0.091796875, 0.32965087890625, 0.5675048828125, 0.80535888671875, 1.043212890625, 1.28106689453125, 1.5189208984375, 1.75677490234375, 1.99462890625, 2.23248291015625, 2.4703369140625, 2.70819091796875, 2.946044921875, 3.18389892578125, 3.4217529296875, 3.65960693359375, 3.8974609375, 4.13531494140625, 4.3731689453125, 4.61102294921875, 4.848876953125, 5.08673095703125, 5.3245849609375, 5.56243896484375, 5.80029296875, 6.03814697265625, 6.2760009765625, 6.51385498046875, 6.751708984375, 6.98956298828125, 7.2274169921875, 7.46527099609375, 7.703125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 8.0, 7.0, 11.0, 17.0, 24.0, 29.0, 24.0, 53.0, 54.0, 61.0, 105.0, 132.0, 182.0, 279.0, 497.0, 923.0, 1895.0, 4584.0, 11531.0, 34365.0, 116285.0, 450872.0, 308114.0, 78761.0, 24335.0, 8412.0, 3412.0, 1494.0, 728.0, 436.0, 240.0, 167.0, 128.0, 87.0, 55.0, 45.0, 56.0, 29.0, 25.0, 19.0, 16.0, 12.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.38330078125, -9.0791015625, -8.77490234375, -8.470703125, -8.16650390625, -7.8623046875, -7.55810546875, -7.25390625, -6.94970703125, -6.6455078125, -6.34130859375, -6.037109375, -5.73291015625, -5.4287109375, -5.12451171875, -4.8203125, -4.51611328125, -4.2119140625, -3.90771484375, -3.603515625, -3.29931640625, -2.9951171875, -2.69091796875, -2.38671875, -2.08251953125, -1.7783203125, -1.47412109375, -1.169921875, -0.86572265625, -0.5615234375, -0.25732421875, 0.046875, 0.35107421875, 0.6552734375, 0.95947265625, 1.263671875, 1.56787109375, 1.8720703125, 2.17626953125, 2.48046875, 2.78466796875, 3.0888671875, 3.39306640625, 3.697265625, 4.00146484375, 4.3056640625, 4.60986328125, 4.9140625, 5.21826171875, 5.5224609375, 5.82666015625, 6.130859375, 6.43505859375, 6.7392578125, 7.04345703125, 7.34765625, 7.65185546875, 7.9560546875, 8.26025390625, 8.564453125, 8.86865234375, 9.1728515625, 9.47705078125, 9.78125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 10.0, 14.0, 10.0, 10.0, 12.0, 19.0, 17.0, 25.0, 24.0, 26.0, 26.0, 23.0, 34.0, 48.0, 40.0, 51.0, 64.0, 108.0, 221.0, 1490.0, 209.0, 95.0, 64.0, 46.0, 50.0, 29.0, 43.0, 37.0, 22.0, 27.0, 19.0, 21.0, 17.0, 16.0, 16.0, 16.0, 6.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.859375, -20.217041015625, -19.57470703125, -18.932373046875, -18.2900390625, -17.647705078125, -17.00537109375, -16.363037109375, -15.720703125, -15.078369140625, -14.43603515625, -13.793701171875, -13.1513671875, -12.509033203125, -11.86669921875, -11.224365234375, -10.58203125, -9.939697265625, -9.29736328125, -8.655029296875, -8.0126953125, -7.370361328125, -6.72802734375, -6.085693359375, -5.443359375, -4.801025390625, -4.15869140625, -3.516357421875, -2.8740234375, -2.231689453125, -1.58935546875, -0.947021484375, -0.3046875, 0.337646484375, 0.97998046875, 1.622314453125, 2.2646484375, 2.906982421875, 3.54931640625, 4.191650390625, 4.833984375, 5.476318359375, 6.11865234375, 6.760986328125, 7.4033203125, 8.045654296875, 8.68798828125, 9.330322265625, 9.97265625, 10.614990234375, 11.25732421875, 11.899658203125, 12.5419921875, 13.184326171875, 13.82666015625, 14.468994140625, 15.111328125, 15.753662109375, 16.39599609375, 17.038330078125, 17.6806640625, 18.322998046875, 18.96533203125, 19.607666015625, 20.25]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 10.0, 6.0, 12.0, 19.0, 25.0, 30.0, 43.0, 57.0, 91.0, 144.0, 197.0, 331.0, 657.0, 2585.0, 91752.0, 3014966.0, 31735.0, 1522.0, 559.0, 336.0, 182.0, 133.0, 90.0, 61.0, 35.0, 32.0, 28.0, 21.0, 12.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.09423828125, -32.7509765625, -31.40771484375, -30.064453125, -28.72119140625, -27.3779296875, -26.03466796875, -24.69140625, -23.34814453125, -22.0048828125, -20.66162109375, -19.318359375, -17.97509765625, -16.6318359375, -15.28857421875, -13.9453125, -12.60205078125, -11.2587890625, -9.91552734375, -8.572265625, -7.22900390625, -5.8857421875, -4.54248046875, -3.19921875, -1.85595703125, -0.5126953125, 0.83056640625, 2.173828125, 3.51708984375, 4.8603515625, 6.20361328125, 7.546875, 8.89013671875, 10.2333984375, 11.57666015625, 12.919921875, 14.26318359375, 15.6064453125, 16.94970703125, 18.29296875, 19.63623046875, 20.9794921875, 22.32275390625, 23.666015625, 25.00927734375, 26.3525390625, 27.69580078125, 29.0390625, 30.38232421875, 31.7255859375, 33.06884765625, 34.412109375, 35.75537109375, 37.0986328125, 38.44189453125, 39.78515625, 41.12841796875, 42.4716796875, 43.81494140625, 45.158203125, 46.50146484375, 47.8447265625, 49.18798828125, 50.53125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [2.0, 52.0, 878.0, 85.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.468585968017578, -9.919108390808105, -3.369630813598633, 3.1798477172851562, 9.729324340820312, 16.27880096435547, 22.82828140258789, 29.377758026123047, 35.9272346496582, 42.47671127319336, 49.02619171142578, 55.57566833496094, 62.125144958496094, 68.67462158203125, 75.22410583496094, 81.77357482910156, 88.32305908203125, 94.8725357055664, 101.42201232910156, 107.97149658203125, 114.52096557617188, 121.07044982910156, 127.61992645263672, 134.16940307617188, 140.7188720703125, 147.2683563232422, 153.8178253173828, 160.3673095703125, 166.91677856445312, 173.4662628173828, 180.0157470703125, 186.56521606445312, 193.11468505859375, 199.66416931152344, 206.21363830566406, 212.76312255859375, 219.31259155273438, 225.86207580566406, 232.41156005859375, 238.96102905273438, 245.510498046875, 252.0599822998047, 258.6094665527344, 265.158935546875, 271.7084045410156, 278.25787353515625, 284.807373046875, 291.3568420410156, 297.90631103515625, 304.4557800292969, 311.0052795410156, 317.55474853515625, 324.1042175292969, 330.6536865234375, 337.20318603515625, 343.7526550292969, 350.3021545410156, 356.85162353515625, 363.401123046875, 369.9505920410156, 376.50006103515625, 383.0495300292969, 389.5990295410156, 396.14849853515625, 402.6979675292969]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 6.0, 3.0, 12.0, 9.0, 12.0, 16.0, 19.0, 24.0, 24.0, 21.0, 24.0, 23.0, 26.0, 24.0, 33.0, 24.0, 38.0, 27.0, 35.0, 40.0, 44.0, 47.0, 41.0, 41.0, 37.0, 33.0, 37.0, 26.0, 38.0, 29.0, 15.0, 24.0, 25.0, 14.0, 14.0, 24.0, 6.0, 13.0, 7.0, 7.0, 8.0, 2.0, 8.0, 6.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.56782913208008, -43.14304733276367, -41.71826934814453, -40.293487548828125, -38.86870574951172, -37.44392395019531, -36.019142150878906, -34.594364166259766, -33.16958236694336, -31.744800567626953, -30.32002067565918, -28.895240783691406, -27.470458984375, -26.045677185058594, -24.62089729309082, -23.196117401123047, -21.77133560180664, -20.346553802490234, -18.92177391052246, -17.496994018554688, -16.07221221923828, -14.647431373596191, -13.222650527954102, -11.797869682312012, -10.373088836669922, -8.948307991027832, -7.523527145385742, -6.098746299743652, -4.6739654541015625, -3.2491846084594727, -1.8244037628173828, -0.39962291717529297, 1.0251579284667969, 2.4499387741088867, 3.8747196197509766, 5.299500465393066, 6.724281311035156, 8.149062156677246, 9.573843002319336, 10.998623847961426, 12.423404693603516, 13.848185539245605, 15.272966384887695, 16.69774627685547, 18.122528076171875, 19.54730987548828, 20.972089767456055, 22.396869659423828, 23.821651458740234, 25.24643325805664, 26.671213150024414, 28.095993041992188, 29.520774841308594, 30.945556640625, 32.370338439941406, 33.79511642456055, 35.21989822387695, 36.64468002319336, 38.0694580078125, 39.494239807128906, 40.91902160644531, 42.34380340576172, 43.768585205078125, 45.193363189697266, 46.61814498901367]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 3.0, 9.0, 9.0, 9.0, 12.0, 18.0, 18.0, 19.0, 14.0, 16.0, 33.0, 31.0, 24.0, 29.0, 34.0, 44.0, 38.0, 34.0, 37.0, 31.0, 29.0, 51.0, 34.0, 37.0, 43.0, 26.0, 37.0, 26.0, 23.0, 28.0, 27.0, 24.0, 24.0, 18.0, 18.0, 12.0, 15.0, 9.0, 8.0, 6.0, 8.0, 3.0, 9.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-7.921875, -7.6856689453125, -7.449462890625, -7.2132568359375, -6.97705078125, -6.7408447265625, -6.504638671875, -6.2684326171875, -6.0322265625, -5.7960205078125, -5.559814453125, -5.3236083984375, -5.08740234375, -4.8511962890625, -4.614990234375, -4.3787841796875, -4.142578125, -3.9063720703125, -3.670166015625, -3.4339599609375, -3.19775390625, -2.9615478515625, -2.725341796875, -2.4891357421875, -2.2529296875, -2.0167236328125, -1.780517578125, -1.5443115234375, -1.30810546875, -1.0718994140625, -0.835693359375, -0.5994873046875, -0.36328125, -0.1270751953125, 0.109130859375, 0.3453369140625, 0.58154296875, 0.8177490234375, 1.053955078125, 1.2901611328125, 1.5263671875, 1.7625732421875, 1.998779296875, 2.2349853515625, 2.47119140625, 2.7073974609375, 2.943603515625, 3.1798095703125, 3.416015625, 3.6522216796875, 3.888427734375, 4.1246337890625, 4.36083984375, 4.5970458984375, 4.833251953125, 5.0694580078125, 5.3056640625, 5.5418701171875, 5.778076171875, 6.0142822265625, 6.25048828125, 6.4866943359375, 6.722900390625, 6.9591064453125, 7.1953125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 5.0, 13.0, 19.0, 23.0, 13.0, 24.0, 35.0, 32.0, 41.0, 49.0, 89.0, 161.0, 349.0, 1218.0, 5671.0, 73331.0, 3047073.0, 1041844.0, 19964.0, 2909.0, 718.0, 245.0, 110.0, 53.0, 47.0, 30.0, 28.0, 28.0, 17.0, 21.0, 16.0, 14.0, 8.0, 15.0, 7.0, 9.0, 3.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.46875, -26.546875, -25.625, -24.703125, -23.78125, -22.859375, -21.9375, -21.015625, -20.09375, -19.171875, -18.25, -17.328125, -16.40625, -15.484375, -14.5625, -13.640625, -12.71875, -11.796875, -10.875, -9.953125, -9.03125, -8.109375, -7.1875, -6.265625, -5.34375, -4.421875, -3.5, -2.578125, -1.65625, -0.734375, 0.1875, 1.109375, 2.03125, 2.953125, 3.875, 4.796875, 5.71875, 6.640625, 7.5625, 8.484375, 9.40625, 10.328125, 11.25, 12.171875, 13.09375, 14.015625, 14.9375, 15.859375, 16.78125, 17.703125, 18.625, 19.546875, 20.46875, 21.390625, 22.3125, 23.234375, 24.15625, 25.078125, 26.0, 26.921875, 27.84375, 28.765625, 29.6875, 30.609375, 31.53125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 8.0, 7.0, 7.0, 10.0, 8.0, 20.0, 27.0, 21.0, 34.0, 50.0, 59.0, 75.0, 110.0, 171.0, 254.0, 352.0, 430.0, 539.0, 494.0, 427.0, 281.0, 188.0, 157.0, 81.0, 66.0, 52.0, 38.0, 25.0, 25.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.7119140625, -11.353515625, -10.9951171875, -10.63671875, -10.2783203125, -9.919921875, -9.5615234375, -9.203125, -8.8447265625, -8.486328125, -8.1279296875, -7.76953125, -7.4111328125, -7.052734375, -6.6943359375, -6.3359375, -5.9775390625, -5.619140625, -5.2607421875, -4.90234375, -4.5439453125, -4.185546875, -3.8271484375, -3.46875, -3.1103515625, -2.751953125, -2.3935546875, -2.03515625, -1.6767578125, -1.318359375, -0.9599609375, -0.6015625, -0.2431640625, 0.115234375, 0.4736328125, 0.83203125, 1.1904296875, 1.548828125, 1.9072265625, 2.265625, 2.6240234375, 2.982421875, 3.3408203125, 3.69921875, 4.0576171875, 4.416015625, 4.7744140625, 5.1328125, 5.4912109375, 5.849609375, 6.2080078125, 6.56640625, 6.9248046875, 7.283203125, 7.6416015625, 8.0, 8.3583984375, 8.716796875, 9.0751953125, 9.43359375, 9.7919921875, 10.150390625, 10.5087890625, 10.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 8.0, 12.0, 12.0, 21.0, 26.0, 28.0, 68.0, 77.0, 174.0, 325.0, 914.0, 4254.0, 53604.0, 3535002.0, 581137.0, 15267.0, 2089.0, 602.0, 246.0, 131.0, 89.0, 60.0, 44.0, 22.0, 20.0, 8.0, 9.0, 6.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-42.0625, -40.919189453125, -39.77587890625, -38.632568359375, -37.4892578125, -36.345947265625, -35.20263671875, -34.059326171875, -32.916015625, -31.772705078125, -30.62939453125, -29.486083984375, -28.3427734375, -27.199462890625, -26.05615234375, -24.912841796875, -23.76953125, -22.626220703125, -21.48291015625, -20.339599609375, -19.1962890625, -18.052978515625, -16.90966796875, -15.766357421875, -14.623046875, -13.479736328125, -12.33642578125, -11.193115234375, -10.0498046875, -8.906494140625, -7.76318359375, -6.619873046875, -5.4765625, -4.333251953125, -3.18994140625, -2.046630859375, -0.9033203125, 0.239990234375, 1.38330078125, 2.526611328125, 3.669921875, 4.813232421875, 5.95654296875, 7.099853515625, 8.2431640625, 9.386474609375, 10.52978515625, 11.673095703125, 12.81640625, 13.959716796875, 15.10302734375, 16.246337890625, 17.3896484375, 18.532958984375, 19.67626953125, 20.819580078125, 21.962890625, 23.106201171875, 24.24951171875, 25.392822265625, 26.5361328125, 27.679443359375, 28.82275390625, 29.966064453125, 31.109375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 46.0, 296.0, 457.0, 190.0, 22.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.51425170898438, -162.16485595703125, -156.81544494628906, -151.46604919433594, -146.11663818359375, -140.76724243164062, -135.4178466796875, -130.0684356689453, -124.71903991699219, -119.36963653564453, -114.02023315429688, -108.67083740234375, -103.3214340209961, -97.97203063964844, -92.62262725830078, -87.27322387695312, -81.92382049560547, -76.57441711425781, -71.22501373291016, -65.8756103515625, -60.526214599609375, -55.17681121826172, -49.82740783691406, -44.47800827026367, -39.128604888916016, -33.77920150756836, -28.42980194091797, -23.080398559570312, -17.73099708557129, -12.381595611572266, -7.032192230224609, -1.6827926635742188, 3.6666107177734375, 9.016012191772461, 14.3654146194458, 19.71481704711914, 25.064218521118164, 30.413619995117188, 35.763023376464844, 41.112422943115234, 46.46182632446289, 51.81122970581055, 57.16062927246094, 62.510032653808594, 67.85943603515625, 73.20883178710938, 78.55824279785156, 83.90763854980469, 89.25704193115234, 94.6064453125, 99.95584869384766, 105.30525207519531, 110.65464782714844, 116.0040512084961, 121.35345458984375, 126.70285034179688, 132.05226135253906, 137.4016571044922, 142.75106811523438, 148.1004638671875, 153.4498748779297, 158.7992706298828, 164.148681640625, 169.49807739257812, 174.84747314453125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 7.0, 8.0, 9.0, 11.0, 13.0, 18.0, 18.0, 23.0, 34.0, 27.0, 36.0, 23.0, 23.0, 31.0, 28.0, 36.0, 40.0, 21.0, 36.0, 38.0, 41.0, 53.0, 24.0, 41.0, 49.0, 31.0, 25.0, 22.0, 31.0, 33.0, 25.0, 14.0, 23.0, 15.0, 15.0, 9.0, 15.0, 7.0, 10.0, 8.0, 6.0, 3.0, 6.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.921142578125, -30.824615478515625, -29.72808837890625, -28.631561279296875, -27.5350341796875, -26.438507080078125, -25.34197998046875, -24.245452880859375, -23.14892578125, -22.052398681640625, -20.95587158203125, -19.859344482421875, -18.7628173828125, -17.666290283203125, -16.56976318359375, -15.473236083984375, -14.376708984375, -13.280181884765625, -12.18365478515625, -11.087127685546875, -9.9906005859375, -8.894073486328125, -7.79754638671875, -6.701019287109375, -5.6044921875, -4.507965087890625, -3.41143798828125, -2.314910888671875, -1.2183837890625, -0.121856689453125, 0.97467041015625, 2.071197509765625, 3.167724609375, 4.264251708984375, 5.36077880859375, 6.457305908203125, 7.5538330078125, 8.650360107421875, 9.74688720703125, 10.843414306640625, 11.93994140625, 13.036468505859375, 14.13299560546875, 15.229522705078125, 16.3260498046875, 17.422576904296875, 18.51910400390625, 19.615631103515625, 20.712158203125, 21.808685302734375, 22.90521240234375, 24.001739501953125, 25.0982666015625, 26.194793701171875, 27.29132080078125, 28.387847900390625, 29.484375, 30.580902099609375, 31.67742919921875, 32.773956298828125, 33.8704833984375, 34.967010498046875, 36.06353759765625, 37.160064697265625, 38.256591796875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 17.0, 21.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 28.0, 29.0, 61.0, 77.0, 125.0, 173.0, 275.0, 450.0, 704.0, 1105.0, 1686.0, 2702.0, 4171.0, 6606.0, 10400.0, 16147.0, 25838.0, 41588.0, 67314.0, 111828.0, 202906.0, 230200.0, 125667.0, 74728.0, 46022.0, 28516.0, 17783.0, 11332.0, 7248.0, 4648.0, 2935.0, 1870.0, 1196.0, 793.0, 490.0, 322.0, 208.0, 130.0, 88.0, 59.0, 26.0, 21.0, 14.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3192596435546875, -1.278167724609375, -1.2370758056640625, -1.19598388671875, -1.1548919677734375, -1.113800048828125, -1.0727081298828125, -1.0316162109375, -0.9905242919921875, -0.949432373046875, -0.9083404541015625, -0.86724853515625, -0.8261566162109375, -0.785064697265625, -0.7439727783203125, -0.702880859375, -0.6617889404296875, -0.620697021484375, -0.5796051025390625, -0.53851318359375, -0.4974212646484375, -0.456329345703125, -0.4152374267578125, -0.3741455078125, -0.3330535888671875, -0.291961669921875, -0.2508697509765625, -0.20977783203125, -0.1686859130859375, -0.127593994140625, -0.0865020751953125, -0.04541015625, -0.0043182373046875, 0.036773681640625, 0.0778656005859375, 0.11895751953125, 0.1600494384765625, 0.201141357421875, 0.2422332763671875, 0.2833251953125, 0.3244171142578125, 0.365509033203125, 0.4066009521484375, 0.44769287109375, 0.4887847900390625, 0.529876708984375, 0.5709686279296875, 0.612060546875, 0.6531524658203125, 0.694244384765625, 0.7353363037109375, 0.77642822265625, 0.8175201416015625, 0.858612060546875, 0.8997039794921875, 0.9407958984375, 0.9818878173828125, 1.022979736328125, 1.0640716552734375, 1.10516357421875, 1.1462554931640625, 1.187347412109375, 1.2284393310546875, 1.26953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 8.0, 10.0, 14.0, 12.0, 16.0, 25.0, 18.0, 25.0, 32.0, 30.0, 33.0, 26.0, 36.0, 36.0, 49.0, 35.0, 42.0, 45.0, 1061.0, 37.0, 48.0, 53.0, 25.0, 40.0, 30.0, 27.0, 42.0, 27.0, 20.0, 16.0, 22.0, 12.0, 7.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.65625, -5.4903564453125, -5.324462890625, -5.1585693359375, -4.99267578125, -4.8267822265625, -4.660888671875, -4.4949951171875, -4.3291015625, -4.1632080078125, -3.997314453125, -3.8314208984375, -3.66552734375, -3.4996337890625, -3.333740234375, -3.1678466796875, -3.001953125, -2.8360595703125, -2.670166015625, -2.5042724609375, -2.33837890625, -2.1724853515625, -2.006591796875, -1.8406982421875, -1.6748046875, -1.5089111328125, -1.343017578125, -1.1771240234375, -1.01123046875, -0.8453369140625, -0.679443359375, -0.5135498046875, -0.34765625, -0.1817626953125, -0.015869140625, 0.1500244140625, 0.31591796875, 0.4818115234375, 0.647705078125, 0.8135986328125, 0.9794921875, 1.1453857421875, 1.311279296875, 1.4771728515625, 1.64306640625, 1.8089599609375, 1.974853515625, 2.1407470703125, 2.306640625, 2.4725341796875, 2.638427734375, 2.8043212890625, 2.97021484375, 3.1361083984375, 3.302001953125, 3.4678955078125, 3.6337890625, 3.7996826171875, 3.965576171875, 4.1314697265625, 4.29736328125, 4.4632568359375, 4.629150390625, 4.7950439453125, 4.9609375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 4.0, 13.0, 24.0, 24.0, 32.0, 50.0, 93.0, 131.0, 181.0, 271.0, 444.0, 640.0, 908.0, 1373.0, 1979.0, 2951.0, 4389.0, 6773.0, 10523.0, 16655.0, 26665.0, 43635.0, 74338.0, 130586.0, 1299009.0, 204016.0, 108605.0, 61908.0, 37097.0, 22763.0, 14380.0, 8926.0, 5919.0, 3800.0, 2586.0, 1772.0, 1199.0, 795.0, 552.0, 359.0, 253.0, 169.0, 104.0, 81.0, 54.0, 37.0, 25.0, 12.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2509765625, -1.2116851806640625, -1.172393798828125, -1.1331024169921875, -1.09381103515625, -1.0545196533203125, -1.015228271484375, -0.9759368896484375, -0.9366455078125, -0.8973541259765625, -0.858062744140625, -0.8187713623046875, -0.77947998046875, -0.7401885986328125, -0.700897216796875, -0.6616058349609375, -0.622314453125, -0.5830230712890625, -0.543731689453125, -0.5044403076171875, -0.46514892578125, -0.4258575439453125, -0.386566162109375, -0.3472747802734375, -0.3079833984375, -0.2686920166015625, -0.229400634765625, -0.1901092529296875, -0.15081787109375, -0.1115264892578125, -0.072235107421875, -0.0329437255859375, 0.00634765625, 0.0456390380859375, 0.084930419921875, 0.1242218017578125, 0.16351318359375, 0.2028045654296875, 0.242095947265625, 0.2813873291015625, 0.3206787109375, 0.3599700927734375, 0.399261474609375, 0.4385528564453125, 0.47784423828125, 0.5171356201171875, 0.556427001953125, 0.5957183837890625, 0.635009765625, 0.6743011474609375, 0.713592529296875, 0.7528839111328125, 0.79217529296875, 0.8314666748046875, 0.870758056640625, 0.9100494384765625, 0.9493408203125, 0.9886322021484375, 1.027923583984375, 1.0672149658203125, 1.10650634765625, 1.1457977294921875, 1.185089111328125, 1.2243804931640625, 1.263671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 6.0, 7.0, 6.0, 6.0, 9.0, 12.0, 19.0, 25.0, 17.0, 22.0, 31.0, 41.0, 37.0, 58.0, 54.0, 58.0, 73.0, 57.0, 55.0, 71.0, 61.0, 46.0, 40.0, 35.0, 22.0, 27.0, 22.0, 20.0, 13.0, 13.0, 6.0, 2.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009264945983886719, -0.000896550714969635, -0.0008666068315505981, -0.0008366629481315613, -0.0008067190647125244, -0.0007767751812934875, -0.0007468312978744507, -0.0007168874144554138, -0.000686943531036377, -0.0006569996476173401, -0.0006270557641983032, -0.0005971118807792664, -0.0005671679973602295, -0.0005372241139411926, -0.0005072802305221558, -0.0004773363471031189, -0.00044739246368408203, -0.00041744858026504517, -0.0003875046968460083, -0.00035756081342697144, -0.00032761693000793457, -0.0002976730465888977, -0.00026772916316986084, -0.00023778527975082397, -0.0002078413963317871, -0.00017789751291275024, -0.00014795362949371338, -0.00011800974607467651, -8.806586265563965e-05, -5.812197923660278e-05, -2.8178095817565918e-05, 1.7657876014709473e-06, 3.170967102050781e-05, 6.165355443954468e-05, 9.159743785858154e-05, 0.00012154132127761841, 0.00015148520469665527, 0.00018142908811569214, 0.000211372971534729, 0.00024131685495376587, 0.00027126073837280273, 0.0003012046217918396, 0.00033114850521087646, 0.00036109238862991333, 0.0003910362720489502, 0.00042098015546798706, 0.0004509240388870239, 0.0004808679223060608, 0.0005108118057250977, 0.0005407556891441345, 0.0005706995725631714, 0.0006006434559822083, 0.0006305873394012451, 0.000660531222820282, 0.0006904751062393188, 0.0007204189896583557, 0.0007503628730773926, 0.0007803067564964294, 0.0008102506399154663, 0.0008401945233345032, 0.00087013840675354, 0.0009000822901725769, 0.0009300261735916138, 0.0009599700570106506, 0.0009899139404296875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 7.0, 6.0, 11.0, 13.0, 8.0, 10.0, 22.0, 25.0, 27.0, 38.0, 48.0, 62.0, 92.0, 110.0, 186.0, 338.0, 703.0, 12171.0, 1030639.0, 2360.0, 592.0, 292.0, 207.0, 139.0, 98.0, 82.0, 47.0, 42.0, 28.0, 36.0, 27.0, 15.0, 12.0, 19.0, 10.0, 9.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.019622802734375, -0.019016265869140625, -0.01840972900390625, -0.017803192138671875, -0.0171966552734375, -0.016590118408203125, -0.01598358154296875, -0.015377044677734375, -0.0147705078125, -0.014163970947265625, -0.01355743408203125, -0.012950897216796875, -0.0123443603515625, -0.011737823486328125, -0.01113128662109375, -0.010524749755859375, -0.009918212890625, -0.009311676025390625, -0.00870513916015625, -0.008098602294921875, -0.0074920654296875, -0.006885528564453125, -0.00627899169921875, -0.005672454833984375, -0.00506591796875, -0.004459381103515625, -0.00385284423828125, -0.003246307373046875, -0.0026397705078125, -0.002033233642578125, -0.00142669677734375, -0.000820159912109375, -0.000213623046875, 0.000392913818359375, 0.00099945068359375, 0.001605987548828125, 0.0022125244140625, 0.002819061279296875, 0.00342559814453125, 0.004032135009765625, 0.004638671875, 0.005245208740234375, 0.00585174560546875, 0.006458282470703125, 0.0070648193359375, 0.007671356201171875, 0.00827789306640625, 0.008884429931640625, 0.009490966796875, 0.010097503662109375, 0.01070404052734375, 0.011310577392578125, 0.0119171142578125, 0.012523651123046875, 0.01313018798828125, 0.013736724853515625, 0.01434326171875, 0.014949798583984375, 0.01555633544921875, 0.016162872314453125, 0.0167694091796875, 0.017375946044921875, 0.01798248291015625, 0.018589019775390625, 0.019195556640625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 20.0, 209.0, 563.0, 200.0, 18.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015271920710802078, -0.0014648339711129665, -0.0014024758711457253, -0.0013401176547631621, -0.0012777595547959208, -0.0012154014548286796, -0.0011530432384461164, -0.0010906851384788752, -0.0010283270385116339, -0.0009659689385443926, -0.0009036107803694904, -0.0008412526221945882, -0.0007788945222273469, -0.0007165364222601056, -0.0006541782640852034, -0.0005918201059103012, -0.0005294620059430599, -0.0004671038768719882, -0.00040474574780091643, -0.0003423876187298447, -0.00028002948965877295, -0.0002176713605877012, -0.00015531323151662946, -9.295510244555771e-05, -3.059697337448597e-05, 3.1761155696585774e-05, 9.411928476765752e-05, 0.00015647741383872926, 0.000218835542909801, 0.00028119367198087275, 0.0003435518010519445, 0.00040590993012301624, 0.000468268059194088, 0.0005306261591613293, 0.0005929843173362315, 0.0006553424755111337, 0.000717700575478375, 0.0007800586754456162, 0.0008424168336205184, 0.0009047749917954206, 0.0009671330917626619, 0.0010294911917299032, 0.0010918492916971445, 0.0011542075080797076, 0.001216565608046949, 0.0012789237080141902, 0.0013412819243967533, 0.0014036400243639946, 0.0014659981243312359, 0.0015283562242984772, 0.0015907143242657185, 0.0016530725406482816, 0.0017154306406155229, 0.0017777887405827641, 0.0018401469569653273, 0.0019025050569325686, 0.00196486315689981, 0.002027221256867051, 0.0020895793568342924, 0.0021519374568015337, 0.0022142957895994186, 0.00227665388956666, 0.002339011989533901, 0.0024013700895011425, 0.002463728189468384]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 5.0, 10.0, 12.0, 13.0, 7.0, 21.0, 10.0, 19.0, 26.0, 20.0, 34.0, 34.0, 39.0, 38.0, 34.0, 32.0, 37.0, 38.0, 36.0, 40.0, 49.0, 43.0, 43.0, 36.0, 39.0, 35.0, 35.0, 24.0, 28.0, 25.0, 15.0, 19.0, 21.0, 17.0, 5.0, 12.0, 11.0, 8.0, 8.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004550814628601074, -0.00044012628495693207, -0.0004251711070537567, -0.00041021592915058136, -0.000395260751247406, -0.00038030557334423065, -0.0003653503954410553, -0.00035039521753787994, -0.0003354400396347046, -0.00032048486173152924, -0.0003055296838283539, -0.00029057450592517853, -0.0002756193280220032, -0.0002606641501188278, -0.00024570897221565247, -0.0002307537943124771, -0.00021579861640930176, -0.0002008434385061264, -0.00018588826060295105, -0.0001709330826997757, -0.00015597790479660034, -0.000141022726893425, -0.00012606754899024963, -0.00011111237108707428, -9.615719318389893e-05, -8.120201528072357e-05, -6.624683737754822e-05, -5.1291659474372864e-05, -3.633648157119751e-05, -2.1381303668022156e-05, -6.426125764846802e-06, 8.529052138328552e-06, 2.3484230041503906e-05, 3.843940794467926e-05, 5.3394585847854614e-05, 6.834976375102997e-05, 8.330494165420532e-05, 9.826011955738068e-05, 0.00011321529746055603, 0.00012817047536373138, 0.00014312565326690674, 0.0001580808311700821, 0.00017303600907325745, 0.0001879911869764328, 0.00020294636487960815, 0.0002179015427827835, 0.00023285672068595886, 0.0002478118985891342, 0.00026276707649230957, 0.0002777222543954849, 0.0002926774322986603, 0.00030763261020183563, 0.000322587788105011, 0.00033754296600818634, 0.0003524981439113617, 0.00036745332181453705, 0.0003824084997177124, 0.00039736367762088776, 0.0004123188555240631, 0.00042727403342723846, 0.0004422292113304138, 0.00045718438923358917, 0.0004721395671367645, 0.0004870947450399399, 0.0005020499229431152]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 8.0, 5.0, 14.0, 17.0, 16.0, 16.0, 20.0, 21.0, 17.0, 25.0, 35.0, 35.0, 39.0, 38.0, 30.0, 32.0, 32.0, 34.0, 31.0, 35.0, 53.0, 42.0, 29.0, 36.0, 34.0, 27.0, 29.0, 27.0, 35.0, 30.0, 23.0, 16.0, 22.0, 18.0, 12.0, 18.0, 3.0, 15.0, 3.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.453125, -8.20648193359375, -7.9598388671875, -7.71319580078125, -7.466552734375, -7.21990966796875, -6.9732666015625, -6.72662353515625, -6.47998046875, -6.23333740234375, -5.9866943359375, -5.74005126953125, -5.493408203125, -5.24676513671875, -5.0001220703125, -4.75347900390625, -4.5068359375, -4.26019287109375, -4.0135498046875, -3.76690673828125, -3.520263671875, -3.27362060546875, -3.0269775390625, -2.78033447265625, -2.53369140625, -2.28704833984375, -2.0404052734375, -1.79376220703125, -1.547119140625, -1.30047607421875, -1.0538330078125, -0.80718994140625, -0.560546875, -0.31390380859375, -0.0672607421875, 0.17938232421875, 0.426025390625, 0.67266845703125, 0.9193115234375, 1.16595458984375, 1.41259765625, 1.65924072265625, 1.9058837890625, 2.15252685546875, 2.399169921875, 2.64581298828125, 2.8924560546875, 3.13909912109375, 3.3857421875, 3.63238525390625, 3.8790283203125, 4.12567138671875, 4.372314453125, 4.61895751953125, 4.8656005859375, 5.11224365234375, 5.35888671875, 5.60552978515625, 5.8521728515625, 6.09881591796875, 6.345458984375, 6.59210205078125, 6.8387451171875, 7.08538818359375, 7.33203125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 13.0, 16.0, 10.0, 22.0, 31.0, 40.0, 69.0, 85.0, 102.0, 142.0, 199.0, 298.0, 407.0, 583.0, 793.0, 1384.0, 2260.0, 4482.0, 10544.0, 28521.0, 91423.0, 299861.0, 402354.0, 135432.0, 41900.0, 14100.0, 5792.0, 2872.0, 1573.0, 997.0, 627.0, 429.0, 310.0, 238.0, 195.0, 122.0, 79.0, 79.0, 45.0, 34.0, 30.0, 18.0, 10.0, 12.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4765625, -8.195556640625, -7.91455078125, -7.633544921875, -7.3525390625, -7.071533203125, -6.79052734375, -6.509521484375, -6.228515625, -5.947509765625, -5.66650390625, -5.385498046875, -5.1044921875, -4.823486328125, -4.54248046875, -4.261474609375, -3.98046875, -3.699462890625, -3.41845703125, -3.137451171875, -2.8564453125, -2.575439453125, -2.29443359375, -2.013427734375, -1.732421875, -1.451416015625, -1.17041015625, -0.889404296875, -0.6083984375, -0.327392578125, -0.04638671875, 0.234619140625, 0.515625, 0.796630859375, 1.07763671875, 1.358642578125, 1.6396484375, 1.920654296875, 2.20166015625, 2.482666015625, 2.763671875, 3.044677734375, 3.32568359375, 3.606689453125, 3.8876953125, 4.168701171875, 4.44970703125, 4.730712890625, 5.01171875, 5.292724609375, 5.57373046875, 5.854736328125, 6.1357421875, 6.416748046875, 6.69775390625, 6.978759765625, 7.259765625, 7.540771484375, 7.82177734375, 8.102783203125, 8.3837890625, 8.664794921875, 8.94580078125, 9.226806640625, 9.5078125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 3.0, 5.0, 8.0, 14.0, 16.0, 8.0, 25.0, 11.0, 23.0, 27.0, 35.0, 35.0, 38.0, 36.0, 57.0, 74.0, 109.0, 253.0, 1538.0, 185.0, 102.0, 65.0, 46.0, 42.0, 41.0, 35.0, 34.0, 31.0, 19.0, 25.0, 21.0, 12.0, 11.0, 8.0, 8.0, 11.0, 5.0, 3.0, 1.0, 3.0, 5.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-22.484375, -21.8486328125, -21.212890625, -20.5771484375, -19.94140625, -19.3056640625, -18.669921875, -18.0341796875, -17.3984375, -16.7626953125, -16.126953125, -15.4912109375, -14.85546875, -14.2197265625, -13.583984375, -12.9482421875, -12.3125, -11.6767578125, -11.041015625, -10.4052734375, -9.76953125, -9.1337890625, -8.498046875, -7.8623046875, -7.2265625, -6.5908203125, -5.955078125, -5.3193359375, -4.68359375, -4.0478515625, -3.412109375, -2.7763671875, -2.140625, -1.5048828125, -0.869140625, -0.2333984375, 0.40234375, 1.0380859375, 1.673828125, 2.3095703125, 2.9453125, 3.5810546875, 4.216796875, 4.8525390625, 5.48828125, 6.1240234375, 6.759765625, 7.3955078125, 8.03125, 8.6669921875, 9.302734375, 9.9384765625, 10.57421875, 11.2099609375, 11.845703125, 12.4814453125, 13.1171875, 13.7529296875, 14.388671875, 15.0244140625, 15.66015625, 16.2958984375, 16.931640625, 17.5673828125, 18.203125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 7.0, 9.0, 9.0, 11.0, 9.0, 28.0, 35.0, 37.0, 54.0, 62.0, 97.0, 141.0, 179.0, 319.0, 454.0, 1237.0, 12762.0, 2677807.0, 444495.0, 5881.0, 829.0, 402.0, 247.0, 172.0, 105.0, 81.0, 55.0, 46.0, 34.0, 30.0, 22.0, 11.0, 10.0, 10.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.71875, -36.4970703125, -35.275390625, -34.0537109375, -32.83203125, -31.6103515625, -30.388671875, -29.1669921875, -27.9453125, -26.7236328125, -25.501953125, -24.2802734375, -23.05859375, -21.8369140625, -20.615234375, -19.3935546875, -18.171875, -16.9501953125, -15.728515625, -14.5068359375, -13.28515625, -12.0634765625, -10.841796875, -9.6201171875, -8.3984375, -7.1767578125, -5.955078125, -4.7333984375, -3.51171875, -2.2900390625, -1.068359375, 0.1533203125, 1.375, 2.5966796875, 3.818359375, 5.0400390625, 6.26171875, 7.4833984375, 8.705078125, 9.9267578125, 11.1484375, 12.3701171875, 13.591796875, 14.8134765625, 16.03515625, 17.2568359375, 18.478515625, 19.7001953125, 20.921875, 22.1435546875, 23.365234375, 24.5869140625, 25.80859375, 27.0302734375, 28.251953125, 29.4736328125, 30.6953125, 31.9169921875, 33.138671875, 34.3603515625, 35.58203125, 36.8037109375, 38.025390625, 39.2470703125, 40.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 244.0, 766.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-194.1175079345703, -183.98941040039062, -173.86129760742188, -163.7332000732422, -153.60508728027344, -143.47698974609375, -133.348876953125, -123.22077941894531, -113.0926742553711, -102.96456909179688, -92.83646392822266, -82.70835876464844, -72.58026123046875, -62.452152252197266, -52.32405090332031, -42.195945739746094, -32.067840576171875, -21.939735412597656, -11.81163215637207, -1.6835289001464844, 8.444576263427734, 18.572681427001953, 28.700782775878906, 38.828887939453125, 48.956993103027344, 59.08509826660156, 69.21320343017578, 79.34130859375, 89.46940612792969, 99.59751892089844, 109.72561645507812, 119.85372161865234, 129.9818115234375, 140.1099090576172, 150.23802185058594, 160.36611938476562, 170.49423217773438, 180.62232971191406, 190.75042724609375, 200.8785400390625, 211.00665283203125, 221.13475036621094, 231.2628631591797, 241.39096069335938, 251.51907348632812, 261.6471862792969, 271.7752685546875, 281.90338134765625, 292.031494140625, 302.15960693359375, 312.2876892089844, 322.4158020019531, 332.5439147949219, 342.6720275878906, 352.80010986328125, 362.92822265625, 373.0563049316406, 383.1844177246094, 393.3125, 403.44061279296875, 413.5687255859375, 423.69683837890625, 433.8249206542969, 443.9530334472656, 454.0811462402344]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 7.0, 8.0, 11.0, 5.0, 4.0, 21.0, 17.0, 12.0, 22.0, 20.0, 20.0, 27.0, 29.0, 25.0, 31.0, 29.0, 41.0, 30.0, 36.0, 42.0, 42.0, 39.0, 41.0, 29.0, 39.0, 27.0, 33.0, 40.0, 26.0, 18.0, 23.0, 32.0, 18.0, 27.0, 12.0, 12.0, 17.0, 19.0, 9.0, 8.0, 13.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.38108825683594, -36.10797119140625, -34.83485794067383, -33.561744689941406, -32.28862762451172, -31.015512466430664, -29.74239730834961, -28.469282150268555, -27.1961669921875, -25.923051834106445, -24.64993667602539, -23.376821517944336, -22.10370635986328, -20.830591201782227, -19.557476043701172, -18.284360885620117, -17.011245727539062, -15.738130569458008, -14.465015411376953, -13.191900253295898, -11.918785095214844, -10.645669937133789, -9.372554779052734, -8.09943962097168, -6.826324462890625, -5.55320930480957, -4.280094146728516, -3.006978988647461, -1.7338638305664062, -0.46074867248535156, 0.8123664855957031, 2.085481643676758, 3.3585968017578125, 4.631711959838867, 5.904827117919922, 7.177942276000977, 8.451057434082031, 9.724172592163086, 10.99728775024414, 12.270402908325195, 13.54351806640625, 14.816633224487305, 16.08974838256836, 17.362863540649414, 18.63597869873047, 19.909093856811523, 21.182209014892578, 22.455324172973633, 23.728439331054688, 25.001554489135742, 26.274669647216797, 27.54778480529785, 28.820899963378906, 30.09401512145996, 31.367130279541016, 32.64024353027344, 33.913360595703125, 35.18647766113281, 36.459590911865234, 37.732704162597656, 39.005821228027344, 40.27893829345703, 41.55205154418945, 42.825164794921875, 44.09828186035156]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 12.0, 12.0, 6.0, 12.0, 20.0, 21.0, 31.0, 27.0, 26.0, 37.0, 21.0, 28.0, 41.0, 47.0, 29.0, 40.0, 54.0, 49.0, 38.0, 46.0, 26.0, 43.0, 36.0, 35.0, 35.0, 34.0, 28.0, 33.0, 18.0, 28.0, 15.0, 14.0, 18.0, 9.0, 7.0, 3.0, 10.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.765625, -9.49163818359375, -9.2176513671875, -8.94366455078125, -8.669677734375, -8.39569091796875, -8.1217041015625, -7.84771728515625, -7.57373046875, -7.29974365234375, -7.0257568359375, -6.75177001953125, -6.477783203125, -6.20379638671875, -5.9298095703125, -5.65582275390625, -5.3818359375, -5.10784912109375, -4.8338623046875, -4.55987548828125, -4.285888671875, -4.01190185546875, -3.7379150390625, -3.46392822265625, -3.18994140625, -2.91595458984375, -2.6419677734375, -2.36798095703125, -2.093994140625, -1.82000732421875, -1.5460205078125, -1.27203369140625, -0.998046875, -0.72406005859375, -0.4500732421875, -0.17608642578125, 0.097900390625, 0.37188720703125, 0.6458740234375, 0.91986083984375, 1.19384765625, 1.46783447265625, 1.7418212890625, 2.01580810546875, 2.289794921875, 2.56378173828125, 2.8377685546875, 3.11175537109375, 3.3857421875, 3.65972900390625, 3.9337158203125, 4.20770263671875, 4.481689453125, 4.75567626953125, 5.0296630859375, 5.30364990234375, 5.57763671875, 5.85162353515625, 6.1256103515625, 6.39959716796875, 6.673583984375, 6.94757080078125, 7.2215576171875, 7.49554443359375, 7.76953125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 16.0, 11.0, 18.0, 20.0, 27.0, 27.0, 52.0, 50.0, 77.0, 86.0, 122.0, 176.0, 254.0, 289.0, 404.0, 490.0, 21437.0, 4168190.0, 784.0, 401.0, 304.0, 261.0, 190.0, 120.0, 109.0, 68.0, 58.0, 44.0, 39.0, 25.0, 25.0, 23.0, 10.0, 15.0, 8.0, 6.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-237.625, -229.744140625, -221.86328125, -213.982421875, -206.1015625, -198.220703125, -190.33984375, -182.458984375, -174.578125, -166.697265625, -158.81640625, -150.935546875, -143.0546875, -135.173828125, -127.29296875, -119.412109375, -111.53125, -103.650390625, -95.76953125, -87.888671875, -80.0078125, -72.126953125, -64.24609375, -56.365234375, -48.484375, -40.603515625, -32.72265625, -24.841796875, -16.9609375, -9.080078125, -1.19921875, 6.681640625, 14.5625, 22.443359375, 30.32421875, 38.205078125, 46.0859375, 53.966796875, 61.84765625, 69.728515625, 77.609375, 85.490234375, 93.37109375, 101.251953125, 109.1328125, 117.013671875, 124.89453125, 132.775390625, 140.65625, 148.537109375, 156.41796875, 164.298828125, 172.1796875, 180.060546875, 187.94140625, 195.822265625, 203.703125, 211.583984375, 219.46484375, 227.345703125, 235.2265625, 243.107421875, 250.98828125, 258.869140625, 266.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 3.0, 9.0, 17.0, 16.0, 37.0, 62.0, 99.0, 153.0, 281.0, 555.0, 938.0, 894.0, 449.0, 223.0, 111.0, 67.0, 62.0, 26.0, 19.0, 15.0, 13.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.546875, -23.8623046875, -23.177734375, -22.4931640625, -21.80859375, -21.1240234375, -20.439453125, -19.7548828125, -19.0703125, -18.3857421875, -17.701171875, -17.0166015625, -16.33203125, -15.6474609375, -14.962890625, -14.2783203125, -13.59375, -12.9091796875, -12.224609375, -11.5400390625, -10.85546875, -10.1708984375, -9.486328125, -8.8017578125, -8.1171875, -7.4326171875, -6.748046875, -6.0634765625, -5.37890625, -4.6943359375, -4.009765625, -3.3251953125, -2.640625, -1.9560546875, -1.271484375, -0.5869140625, 0.09765625, 0.7822265625, 1.466796875, 2.1513671875, 2.8359375, 3.5205078125, 4.205078125, 4.8896484375, 5.57421875, 6.2587890625, 6.943359375, 7.6279296875, 8.3125, 8.9970703125, 9.681640625, 10.3662109375, 11.05078125, 11.7353515625, 12.419921875, 13.1044921875, 13.7890625, 14.4736328125, 15.158203125, 15.8427734375, 16.52734375, 17.2119140625, 17.896484375, 18.5810546875, 19.265625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 15.0, 13.0, 18.0, 31.0, 46.0, 60.0, 85.0, 105.0, 335.0, 3426790.0, 766139.0, 271.0, 108.0, 77.0, 48.0, 42.0, 35.0, 19.0, 16.0, 12.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-309.25, -301.8828125, -294.515625, -287.1484375, -279.78125, -272.4140625, -265.046875, -257.6796875, -250.3125, -242.9453125, -235.578125, -228.2109375, -220.84375, -213.4765625, -206.109375, -198.7421875, -191.375, -184.0078125, -176.640625, -169.2734375, -161.90625, -154.5390625, -147.171875, -139.8046875, -132.4375, -125.0703125, -117.703125, -110.3359375, -102.96875, -95.6015625, -88.234375, -80.8671875, -73.5, -66.1328125, -58.765625, -51.3984375, -44.03125, -36.6640625, -29.296875, -21.9296875, -14.5625, -7.1953125, 0.171875, 7.5390625, 14.90625, 22.2734375, 29.640625, 37.0078125, 44.375, 51.7421875, 59.109375, 66.4765625, 73.84375, 81.2109375, 88.578125, 95.9453125, 103.3125, 110.6796875, 118.046875, 125.4140625, 132.78125, 140.1484375, 147.515625, 154.8828125, 162.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 166.0, 590.0, 233.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-252.12466430664062, -245.7600555419922, -239.39544677734375, -233.03085327148438, -226.66624450683594, -220.3016357421875, -213.93702697753906, -207.57241821289062, -201.2078094482422, -194.84320068359375, -188.4785919189453, -182.11398315429688, -175.7493896484375, -169.38478088378906, -163.02017211914062, -156.6555633544922, -150.29095458984375, -143.9263458251953, -137.56173706054688, -131.1971435546875, -124.83252716064453, -118.46792602539062, -112.10331726074219, -105.73870849609375, -99.37411499023438, -93.00950622558594, -86.64490509033203, -80.2802963256836, -73.91568756103516, -67.55108642578125, -61.18647766113281, -54.821868896484375, -48.45726013183594, -42.092655181884766, -35.72804641723633, -29.363441467285156, -22.99883460998535, -16.634227752685547, -10.269622802734375, -3.9050140380859375, 2.4595909118652344, 8.824197769165039, 15.188803672790527, 21.553409576416016, 27.91801643371582, 34.282623291015625, 40.6472282409668, 47.011837005615234, 53.376441955566406, 59.74104690551758, 66.10565185546875, 72.47026062011719, 78.83486938476562, 85.19947814941406, 91.56407928466797, 97.9286880493164, 104.29328918457031, 110.65789794921875, 117.02249908447266, 123.3871078491211, 129.751708984375, 136.11631774902344, 142.48092651367188, 148.8455352783203, 155.21014404296875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 1.0, 1.0, 5.0, 7.0, 8.0, 6.0, 9.0, 13.0, 15.0, 17.0, 25.0, 17.0, 27.0, 25.0, 28.0, 30.0, 40.0, 30.0, 30.0, 33.0, 40.0, 41.0, 42.0, 47.0, 46.0, 31.0, 33.0, 38.0, 34.0, 38.0, 28.0, 35.0, 21.0, 23.0, 18.0, 23.0, 23.0, 15.0, 9.0, 14.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-45.00749206542969, -43.69382858276367, -42.38016891479492, -41.066505432128906, -39.752845764160156, -38.43918228149414, -37.12552261352539, -35.811859130859375, -34.498199462890625, -33.18453598022461, -31.87087631225586, -30.557214736938477, -29.243553161621094, -27.929889678955078, -26.616228103637695, -25.302566528320312, -23.988903045654297, -22.675241470336914, -21.36157989501953, -20.04791831970215, -18.734256744384766, -17.42059326171875, -16.106931686401367, -14.793270111083984, -13.479608535766602, -12.165946960449219, -10.852285385131836, -9.538622856140137, -8.224961280822754, -6.911299705505371, -5.59763765335083, -4.283975601196289, -2.9703140258789062, -1.6566522121429443, -0.3429903984069824, 0.9706714153289795, 2.2843332290649414, 3.597994804382324, 4.911656856536865, 6.225318908691406, 7.538980484008789, 8.852642059326172, 10.166303634643555, 11.479966163635254, 12.793627738952637, 14.10728931427002, 15.420951843261719, 16.7346134185791, 18.048274993896484, 19.361936569213867, 20.67559814453125, 21.989259719848633, 23.302921295166016, 24.61658477783203, 25.930246353149414, 27.243907928466797, 28.55756950378418, 29.871231079101562, 31.184892654418945, 32.49855422973633, 33.812217712402344, 35.125877380371094, 36.43954086303711, 37.753204345703125, 39.066864013671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 34.0, 29.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 9.0, 7.0, 19.0, 19.0, 34.0, 58.0, 79.0, 129.0, 174.0, 277.0, 451.0, 679.0, 1055.0, 1628.0, 2514.0, 3986.0, 6182.0, 9278.0, 14787.0, 22706.0, 34954.0, 54965.0, 88466.0, 152187.0, 251405.0, 155173.0, 91144.0, 55507.0, 35591.0, 23072.0, 14925.0, 9502.0, 6199.0, 4038.0, 2567.0, 1703.0, 1090.0, 696.0, 440.0, 304.0, 206.0, 127.0, 78.0, 49.0, 33.0, 23.0, 17.0, 10.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.245635986328125, -1.20611572265625, -1.166595458984375, -1.1270751953125, -1.087554931640625, -1.04803466796875, -1.008514404296875, -0.968994140625, -0.929473876953125, -0.88995361328125, -0.850433349609375, -0.8109130859375, -0.771392822265625, -0.73187255859375, -0.692352294921875, -0.65283203125, -0.613311767578125, -0.57379150390625, -0.534271240234375, -0.4947509765625, -0.455230712890625, -0.41571044921875, -0.376190185546875, -0.336669921875, -0.297149658203125, -0.25762939453125, -0.218109130859375, -0.1785888671875, -0.139068603515625, -0.09954833984375, -0.060028076171875, -0.0205078125, 0.019012451171875, 0.05853271484375, 0.098052978515625, 0.1375732421875, 0.177093505859375, 0.21661376953125, 0.256134033203125, 0.295654296875, 0.335174560546875, 0.37469482421875, 0.414215087890625, 0.4537353515625, 0.493255615234375, 0.53277587890625, 0.572296142578125, 0.61181640625, 0.651336669921875, 0.69085693359375, 0.730377197265625, 0.7698974609375, 0.809417724609375, 0.84893798828125, 0.888458251953125, 0.927978515625, 0.967498779296875, 1.00701904296875, 1.046539306640625, 1.0860595703125, 1.125579833984375, 1.16510009765625, 1.204620361328125, 1.244140625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 13.0, 14.0, 11.0, 12.0, 24.0, 17.0, 25.0, 20.0, 25.0, 35.0, 26.0, 33.0, 28.0, 27.0, 33.0, 40.0, 46.0, 39.0, 1061.0, 32.0, 27.0, 37.0, 23.0, 27.0, 38.0, 30.0, 29.0, 28.0, 19.0, 20.0, 19.0, 24.0, 16.0, 19.0, 16.0, 12.0, 8.0, 8.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.0703125, -3.932373046875, -3.79443359375, -3.656494140625, -3.5185546875, -3.380615234375, -3.24267578125, -3.104736328125, -2.966796875, -2.828857421875, -2.69091796875, -2.552978515625, -2.4150390625, -2.277099609375, -2.13916015625, -2.001220703125, -1.86328125, -1.725341796875, -1.58740234375, -1.449462890625, -1.3115234375, -1.173583984375, -1.03564453125, -0.897705078125, -0.759765625, -0.621826171875, -0.48388671875, -0.345947265625, -0.2080078125, -0.070068359375, 0.06787109375, 0.205810546875, 0.34375, 0.481689453125, 0.61962890625, 0.757568359375, 0.8955078125, 1.033447265625, 1.17138671875, 1.309326171875, 1.447265625, 1.585205078125, 1.72314453125, 1.861083984375, 1.9990234375, 2.136962890625, 2.27490234375, 2.412841796875, 2.55078125, 2.688720703125, 2.82666015625, 2.964599609375, 3.1025390625, 3.240478515625, 3.37841796875, 3.516357421875, 3.654296875, 3.792236328125, 3.93017578125, 4.068115234375, 4.2060546875, 4.343994140625, 4.48193359375, 4.619873046875, 4.7578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 6.0, 17.0, 19.0, 19.0, 37.0, 64.0, 86.0, 116.0, 192.0, 264.0, 407.0, 564.0, 813.0, 1254.0, 1804.0, 2646.0, 3938.0, 5717.0, 8449.0, 12644.0, 18760.0, 28894.0, 43980.0, 69117.0, 113843.0, 199641.0, 1257802.0, 118639.0, 72086.0, 45711.0, 29391.0, 19482.0, 13224.0, 8718.0, 5975.0, 4068.0, 2788.0, 1890.0, 1306.0, 836.0, 635.0, 439.0, 273.0, 207.0, 127.0, 85.0, 55.0, 41.0, 27.0, 18.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.1396484375, -1.106170654296875, -1.07269287109375, -1.039215087890625, -1.0057373046875, -0.972259521484375, -0.93878173828125, -0.905303955078125, -0.871826171875, -0.838348388671875, -0.80487060546875, -0.771392822265625, -0.7379150390625, -0.704437255859375, -0.67095947265625, -0.637481689453125, -0.60400390625, -0.570526123046875, -0.53704833984375, -0.503570556640625, -0.4700927734375, -0.436614990234375, -0.40313720703125, -0.369659423828125, -0.336181640625, -0.302703857421875, -0.26922607421875, -0.235748291015625, -0.2022705078125, -0.168792724609375, -0.13531494140625, -0.101837158203125, -0.068359375, -0.034881591796875, -0.00140380859375, 0.032073974609375, 0.0655517578125, 0.099029541015625, 0.13250732421875, 0.165985107421875, 0.199462890625, 0.232940673828125, 0.26641845703125, 0.299896240234375, 0.3333740234375, 0.366851806640625, 0.40032958984375, 0.433807373046875, 0.46728515625, 0.500762939453125, 0.53424072265625, 0.567718505859375, 0.6011962890625, 0.634674072265625, 0.66815185546875, 0.701629638671875, 0.735107421875, 0.768585205078125, 0.80206298828125, 0.835540771484375, 0.8690185546875, 0.902496337890625, 0.93597412109375, 0.969451904296875, 1.0029296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 3.0, 5.0, 9.0, 6.0, 18.0, 21.0, 18.0, 28.0, 51.0, 71.0, 94.0, 104.0, 134.0, 121.0, 89.0, 66.0, 38.0, 17.0, 25.0, 15.0, 13.0, 13.0, 5.0, 5.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014142990112304688, -0.0013765990734100342, -0.0013388991355895996, -0.001301199197769165, -0.0012634992599487305, -0.001225799322128296, -0.0011880993843078613, -0.0011503994464874268, -0.0011126995086669922, -0.0010749995708465576, -0.001037299633026123, -0.0009995996952056885, -0.0009618997573852539, -0.0009241998195648193, -0.0008864998817443848, -0.0008487999439239502, -0.0008111000061035156, -0.0007734000682830811, -0.0007357001304626465, -0.0006980001926422119, -0.0006603002548217773, -0.0006226003170013428, -0.0005849003791809082, -0.0005472004413604736, -0.0005095005035400391, -0.0004718005657196045, -0.0004341006278991699, -0.00039640069007873535, -0.0003587007522583008, -0.0003210008144378662, -0.00028330087661743164, -0.00024560093879699707, -0.0002079010009765625, -0.00017020106315612793, -0.00013250112533569336, -9.480118751525879e-05, -5.710124969482422e-05, -1.940131187438965e-05, 1.8298625946044922e-05, 5.599856376647949e-05, 9.369850158691406e-05, 0.00013139843940734863, 0.0001690983772277832, 0.00020679831504821777, 0.00024449825286865234, 0.0002821981906890869, 0.0003198981285095215, 0.00035759806632995605, 0.0003952980041503906, 0.0004329979419708252, 0.00047069787979125977, 0.0005083978176116943, 0.0005460977554321289, 0.0005837976932525635, 0.000621497631072998, 0.0006591975688934326, 0.0006968975067138672, 0.0007345974445343018, 0.0007722973823547363, 0.0008099973201751709, 0.0008476972579956055, 0.00088539719581604, 0.0009230971336364746, 0.0009607970714569092, 0.0009984970092773438]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 8.0, 11.0, 16.0, 14.0, 13.0, 23.0, 42.0, 39.0, 67.0, 95.0, 167.0, 267.0, 409.0, 1045.0, 559244.0, 484729.0, 1044.0, 469.0, 273.0, 175.0, 97.0, 76.0, 58.0, 42.0, 31.0, 14.0, 19.0, 18.0, 7.0, 14.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01666259765625, -0.016045331954956055, -0.01542806625366211, -0.014810800552368164, -0.014193534851074219, -0.013576269149780273, -0.012959003448486328, -0.012341737747192383, -0.011724472045898438, -0.011107206344604492, -0.010489940643310547, -0.009872674942016602, -0.009255409240722656, -0.008638143539428711, -0.008020877838134766, -0.00740361213684082, -0.006786346435546875, -0.00616908073425293, -0.005551815032958984, -0.004934549331665039, -0.004317283630371094, -0.0037000179290771484, -0.003082752227783203, -0.002465486526489258, -0.0018482208251953125, -0.0012309551239013672, -0.0006136894226074219, 3.5762786865234375e-06, 0.0006208419799804688, 0.001238107681274414, 0.0018553733825683594, 0.0024726390838623047, 0.00308990478515625, 0.0037071704864501953, 0.004324436187744141, 0.004941701889038086, 0.005558967590332031, 0.0061762332916259766, 0.006793498992919922, 0.007410764694213867, 0.008028030395507812, 0.008645296096801758, 0.009262561798095703, 0.009879827499389648, 0.010497093200683594, 0.011114358901977539, 0.011731624603271484, 0.01234889030456543, 0.012966156005859375, 0.01358342170715332, 0.014200687408447266, 0.014817953109741211, 0.015435218811035156, 0.0160524845123291, 0.016669750213623047, 0.017287015914916992, 0.017904281616210938, 0.018521547317504883, 0.019138813018798828, 0.019756078720092773, 0.02037334442138672, 0.020990610122680664, 0.02160787582397461, 0.022225141525268555, 0.0228424072265625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 12.0, 686.0, 309.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00072041607927531, -0.0006152072455734015, -0.0005099984118714929, -0.0004047896363772452, -0.0002995808026753366, -0.000194371968973428, -8.916319347918034e-05, 1.6045640222728252e-05, 0.00012125447392463684, 0.0002264632930746302, 0.00033167211222462356, 0.0004368809168227017, 0.0005420897505246103, 0.0006472985842265189, 0.0007525073597207665, 0.0008577161934226751, 0.0009629250271245837, 0.0010681338608264923, 0.001173342694528401, 0.0012785515282303095, 0.0013837602455168962, 0.0014889691956341267, 0.0015941779129207134, 0.001699386746622622, 0.0018045955803245306, 0.0019098044140264392, 0.0020150132477283478, 0.0021202219650149345, 0.002225430915132165, 0.0023306396324187517, 0.002435848582535982, 0.002541057299822569, 0.0026462660171091557, 0.0027514747343957424, 0.002856683684512973, 0.0029618924017995596, 0.00306710135191679, 0.0031723100692033768, 0.0032775187864899635, 0.003382727736607194, 0.0034879366867244244, 0.003593145404011011, 0.0036983543541282415, 0.0038035630714148283, 0.003908772021532059, 0.0040139807388186455, 0.004119189456105232, 0.004224398173391819, 0.004329606890678406, 0.0044348156079649925, 0.004540024325251579, 0.004645233508199453, 0.00475044222548604, 0.004855650942772627, 0.004960859660059214, 0.005066068843007088, 0.0051712775602936745, 0.005276486277580261, 0.005381694994866848, 0.005486904177814722, 0.005592112895101309, 0.005697321612387896, 0.005802530329674482, 0.005907739512622356, 0.006012948229908943]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 2.0, 8.0, 17.0, 6.0, 10.0, 6.0, 15.0, 12.0, 21.0, 23.0, 27.0, 16.0, 23.0, 30.0, 34.0, 28.0, 34.0, 35.0, 42.0, 48.0, 50.0, 30.0, 33.0, 38.0, 28.0, 38.0, 31.0, 28.0, 36.0, 21.0, 33.0, 27.0, 25.0, 20.0, 17.0, 13.0, 21.0, 17.0, 13.0, 2.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003616213798522949, -0.00034914351999759674, -0.00033666566014289856, -0.0003241878002882004, -0.0003117099404335022, -0.000299232080578804, -0.00028675422072410583, -0.00027427636086940765, -0.00026179850101470947, -0.0002493206411600113, -0.0002368427813053131, -0.00022436492145061493, -0.00021188706159591675, -0.00019940920174121857, -0.00018693134188652039, -0.0001744534820318222, -0.00016197562217712402, -0.00014949776232242584, -0.00013701990246772766, -0.00012454204261302948, -0.0001120641827583313, -9.958632290363312e-05, -8.710846304893494e-05, -7.463060319423676e-05, -6.215274333953857e-05, -4.967488348484039e-05, -3.719702363014221e-05, -2.471916377544403e-05, -1.224130392074585e-05, 2.3655593395233154e-07, 1.2714415788650513e-05, 2.5192275643348694e-05, 3.7670135498046875e-05, 5.0147995352745056e-05, 6.262585520744324e-05, 7.510371506214142e-05, 8.75815749168396e-05, 0.00010005943477153778, 0.00011253729462623596, 0.00012501515448093414, 0.00013749301433563232, 0.0001499708741903305, 0.0001624487340450287, 0.00017492659389972687, 0.00018740445375442505, 0.00019988231360912323, 0.0002123601734638214, 0.0002248380333185196, 0.00023731589317321777, 0.00024979375302791595, 0.00026227161288261414, 0.0002747494727373123, 0.0002872273325920105, 0.0002997051924467087, 0.00031218305230140686, 0.00032466091215610504, 0.0003371387720108032, 0.0003496166318655014, 0.0003620944917201996, 0.00037457235157489777, 0.00038705021142959595, 0.00039952807128429413, 0.0004120059311389923, 0.0004244837909936905, 0.00043696165084838867]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 10.0, 6.0, 11.0, 13.0, 12.0, 23.0, 23.0, 17.0, 25.0, 23.0, 28.0, 23.0, 28.0, 27.0, 44.0, 32.0, 31.0, 41.0, 33.0, 30.0, 44.0, 39.0, 36.0, 42.0, 39.0, 37.0, 29.0, 25.0, 19.0, 28.0, 22.0, 25.0, 17.0, 28.0, 23.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.87506103515625, -6.6368408203125, -6.39862060546875, -6.160400390625, -5.92218017578125, -5.6839599609375, -5.44573974609375, -5.20751953125, -4.96929931640625, -4.7310791015625, -4.49285888671875, -4.254638671875, -4.01641845703125, -3.7781982421875, -3.53997802734375, -3.3017578125, -3.06353759765625, -2.8253173828125, -2.58709716796875, -2.348876953125, -2.11065673828125, -1.8724365234375, -1.63421630859375, -1.39599609375, -1.15777587890625, -0.9195556640625, -0.68133544921875, -0.443115234375, -0.20489501953125, 0.0333251953125, 0.27154541015625, 0.509765625, 0.74798583984375, 0.9862060546875, 1.22442626953125, 1.462646484375, 1.70086669921875, 1.9390869140625, 2.17730712890625, 2.41552734375, 2.65374755859375, 2.8919677734375, 3.13018798828125, 3.368408203125, 3.60662841796875, 3.8448486328125, 4.08306884765625, 4.3212890625, 4.55950927734375, 4.7977294921875, 5.03594970703125, 5.274169921875, 5.51239013671875, 5.7506103515625, 5.98883056640625, 6.22705078125, 6.46527099609375, 6.7034912109375, 6.94171142578125, 7.179931640625, 7.41815185546875, 7.6563720703125, 7.89459228515625, 8.1328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 9.0, 2.0, 5.0, 23.0, 13.0, 22.0, 33.0, 40.0, 56.0, 92.0, 108.0, 135.0, 200.0, 206.0, 299.0, 373.0, 450.0, 564.0, 714.0, 857.0, 1165.0, 1975.0, 4425.0, 13642.0, 57837.0, 256005.0, 505602.0, 150958.0, 34322.0, 8929.0, 3009.0, 1559.0, 1010.0, 786.0, 662.0, 571.0, 426.0, 356.0, 267.0, 220.0, 151.0, 123.0, 99.0, 66.0, 46.0, 39.0, 24.0, 25.0, 20.0, 6.0, 10.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0], "bins": [-11.3984375, -11.0457763671875, -10.693115234375, -10.3404541015625, -9.98779296875, -9.6351318359375, -9.282470703125, -8.9298095703125, -8.5771484375, -8.2244873046875, -7.871826171875, -7.5191650390625, -7.16650390625, -6.8138427734375, -6.461181640625, -6.1085205078125, -5.755859375, -5.4031982421875, -5.050537109375, -4.6978759765625, -4.34521484375, -3.9925537109375, -3.639892578125, -3.2872314453125, -2.9345703125, -2.5819091796875, -2.229248046875, -1.8765869140625, -1.52392578125, -1.1712646484375, -0.818603515625, -0.4659423828125, -0.11328125, 0.2393798828125, 0.592041015625, 0.9447021484375, 1.29736328125, 1.6500244140625, 2.002685546875, 2.3553466796875, 2.7080078125, 3.0606689453125, 3.413330078125, 3.7659912109375, 4.11865234375, 4.4713134765625, 4.823974609375, 5.1766357421875, 5.529296875, 5.8819580078125, 6.234619140625, 6.5872802734375, 6.93994140625, 7.2926025390625, 7.645263671875, 7.9979248046875, 8.3505859375, 8.7032470703125, 9.055908203125, 9.4085693359375, 9.76123046875, 10.1138916015625, 10.466552734375, 10.8192138671875, 11.171875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 8.0, 6.0, 6.0, 11.0, 18.0, 12.0, 23.0, 12.0, 18.0, 29.0, 38.0, 40.0, 55.0, 49.0, 60.0, 106.0, 280.0, 1605.0, 151.0, 67.0, 64.0, 49.0, 51.0, 41.0, 42.0, 37.0, 31.0, 26.0, 16.0, 17.0, 15.0, 11.0, 8.0, 8.0, 4.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.640625, -15.982177734375, -15.32373046875, -14.665283203125, -14.0068359375, -13.348388671875, -12.68994140625, -12.031494140625, -11.373046875, -10.714599609375, -10.05615234375, -9.397705078125, -8.7392578125, -8.080810546875, -7.42236328125, -6.763916015625, -6.10546875, -5.447021484375, -4.78857421875, -4.130126953125, -3.4716796875, -2.813232421875, -2.15478515625, -1.496337890625, -0.837890625, -0.179443359375, 0.47900390625, 1.137451171875, 1.7958984375, 2.454345703125, 3.11279296875, 3.771240234375, 4.4296875, 5.088134765625, 5.74658203125, 6.405029296875, 7.0634765625, 7.721923828125, 8.38037109375, 9.038818359375, 9.697265625, 10.355712890625, 11.01416015625, 11.672607421875, 12.3310546875, 12.989501953125, 13.64794921875, 14.306396484375, 14.96484375, 15.623291015625, 16.28173828125, 16.940185546875, 17.5986328125, 18.257080078125, 18.91552734375, 19.573974609375, 20.232421875, 20.890869140625, 21.54931640625, 22.207763671875, 22.8662109375, 23.524658203125, 24.18310546875, 24.841552734375, 25.5]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 8.0, 5.0, 7.0, 9.0, 10.0, 15.0, 22.0, 30.0, 26.0, 41.0, 38.0, 65.0, 100.0, 147.0, 240.0, 346.0, 680.0, 2053.0, 2903397.0, 235483.0, 1523.0, 564.0, 312.0, 163.0, 114.0, 81.0, 55.0, 48.0, 25.0, 18.0, 15.0, 17.0, 14.0, 9.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.0625, -66.8974609375, -64.732421875, -62.5673828125, -60.40234375, -58.2373046875, -56.072265625, -53.9072265625, -51.7421875, -49.5771484375, -47.412109375, -45.2470703125, -43.08203125, -40.9169921875, -38.751953125, -36.5869140625, -34.421875, -32.2568359375, -30.091796875, -27.9267578125, -25.76171875, -23.5966796875, -21.431640625, -19.2666015625, -17.1015625, -14.9365234375, -12.771484375, -10.6064453125, -8.44140625, -6.2763671875, -4.111328125, -1.9462890625, 0.21875, 2.3837890625, 4.548828125, 6.7138671875, 8.87890625, 11.0439453125, 13.208984375, 15.3740234375, 17.5390625, 19.7041015625, 21.869140625, 24.0341796875, 26.19921875, 28.3642578125, 30.529296875, 32.6943359375, 34.859375, 37.0244140625, 39.189453125, 41.3544921875, 43.51953125, 45.6845703125, 47.849609375, 50.0146484375, 52.1796875, 54.3447265625, 56.509765625, 58.6748046875, 60.83984375, 63.0048828125, 65.169921875, 67.3349609375, 69.5]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 848.0, 155.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.08770751953125, -261.9179992675781, -251.74827575683594, -241.57855224609375, -231.40884399414062, -221.2391357421875, -211.0694122314453, -200.89968872070312, -190.72998046875, -180.56027221679688, -170.3905487060547, -160.2208251953125, -150.05111694335938, -139.88140869140625, -129.71168518066406, -119.5419692993164, -109.37225341796875, -99.2025375366211, -89.03282165527344, -78.86310577392578, -68.69338989257812, -58.52367401123047, -48.35395812988281, -38.184242248535156, -28.0145263671875, -17.844810485839844, -7.6750946044921875, 2.4946212768554688, 12.664337158203125, 22.83405303955078, 33.00376892089844, 43.173484802246094, 53.343170166015625, 63.51288604736328, 73.68260192871094, 83.8523178100586, 94.02203369140625, 104.1917495727539, 114.36146545410156, 124.53118133544922, 134.70089721679688, 144.87060546875, 155.0403289794922, 165.21005249023438, 175.3797607421875, 185.54946899414062, 195.7191925048828, 205.888916015625, 216.05862426757812, 226.22833251953125, 236.39805603027344, 246.56777954101562, 256.73748779296875, 266.9071960449219, 277.076904296875, 287.24664306640625, 297.4163513183594, 307.5860595703125, 317.75579833984375, 327.9255065917969, 338.09521484375, 348.2649230957031, 358.43463134765625, 368.6043701171875, 378.7740783691406]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 6.0, 9.0, 12.0, 21.0, 17.0, 16.0, 24.0, 22.0, 36.0, 28.0, 26.0, 34.0, 23.0, 40.0, 26.0, 41.0, 55.0, 51.0, 47.0, 51.0, 34.0, 34.0, 24.0, 39.0, 38.0, 37.0, 29.0, 31.0, 19.0, 19.0, 18.0, 21.0, 7.0, 17.0, 9.0, 10.0, 7.0, 4.0, 5.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.91034698486328, -50.182552337646484, -48.45476150512695, -46.726966857910156, -44.999176025390625, -43.27138137817383, -41.54358673095703, -39.8157958984375, -38.0880012512207, -36.360206604003906, -34.632415771484375, -32.90462112426758, -31.176828384399414, -29.44903564453125, -27.721240997314453, -25.99344825744629, -24.265655517578125, -22.53786277770996, -20.810070037841797, -19.082275390625, -17.354482650756836, -15.626689910888672, -13.898896217346191, -12.171102523803711, -10.443309783935547, -8.715517044067383, -6.987723350524902, -5.25993013381958, -3.532136917114258, -1.8043441772460938, -0.07655048370361328, 1.6512432098388672, 3.3790359497070312, 5.1068291664123535, 6.834622383117676, 8.562416076660156, 10.29020881652832, 12.018001556396484, 13.745795249938965, 15.473588943481445, 17.20138168334961, 18.929174423217773, 20.656967163085938, 22.384761810302734, 24.1125545501709, 25.840347290039062, 27.56814193725586, 29.295934677124023, 31.023727416992188, 32.751522064208984, 34.479312896728516, 36.20710754394531, 37.934898376464844, 39.66269302368164, 41.39048767089844, 43.11827850341797, 44.846073150634766, 46.57386779785156, 48.301658630371094, 50.02945327758789, 51.75724792480469, 53.48503875732422, 55.212833404541016, 56.94062805175781, 58.668418884277344]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 8.0, 12.0, 7.0, 24.0, 10.0, 13.0, 21.0, 23.0, 34.0, 25.0, 43.0, 39.0, 40.0, 39.0, 48.0, 51.0, 43.0, 56.0, 42.0, 46.0, 42.0, 40.0, 42.0, 34.0, 26.0, 28.0, 27.0, 24.0, 25.0, 14.0, 22.0, 16.0, 12.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.1971435546875, -7.917724609375, -7.6383056640625, -7.35888671875, -7.0794677734375, -6.800048828125, -6.5206298828125, -6.2412109375, -5.9617919921875, -5.682373046875, -5.4029541015625, -5.12353515625, -4.8441162109375, -4.564697265625, -4.2852783203125, -4.005859375, -3.7264404296875, -3.447021484375, -3.1676025390625, -2.88818359375, -2.6087646484375, -2.329345703125, -2.0499267578125, -1.7705078125, -1.4910888671875, -1.211669921875, -0.9322509765625, -0.65283203125, -0.3734130859375, -0.093994140625, 0.1854248046875, 0.46484375, 0.7442626953125, 1.023681640625, 1.3031005859375, 1.58251953125, 1.8619384765625, 2.141357421875, 2.4207763671875, 2.7001953125, 2.9796142578125, 3.259033203125, 3.5384521484375, 3.81787109375, 4.0972900390625, 4.376708984375, 4.6561279296875, 4.935546875, 5.2149658203125, 5.494384765625, 5.7738037109375, 6.05322265625, 6.3326416015625, 6.612060546875, 6.8914794921875, 7.1708984375, 7.4503173828125, 7.729736328125, 8.0091552734375, 8.28857421875, 8.5679931640625, 8.847412109375, 9.1268310546875, 9.40625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 5.0, 8.0, 10.0, 11.0, 15.0, 24.0, 30.0, 41.0, 58.0, 63.0, 83.0, 99.0, 120.0, 159.0, 245.0, 417.0, 984.0, 4015.0, 42689.0, 2030262.0, 2065570.0, 42800.0, 4167.0, 1052.0, 378.0, 224.0, 152.0, 135.0, 95.0, 72.0, 54.0, 52.0, 40.0, 37.0, 26.0, 20.0, 20.0, 11.0, 11.0, 5.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.421875, -26.537353515625, -25.65283203125, -24.768310546875, -23.8837890625, -22.999267578125, -22.11474609375, -21.230224609375, -20.345703125, -19.461181640625, -18.57666015625, -17.692138671875, -16.8076171875, -15.923095703125, -15.03857421875, -14.154052734375, -13.26953125, -12.385009765625, -11.50048828125, -10.615966796875, -9.7314453125, -8.846923828125, -7.96240234375, -7.077880859375, -6.193359375, -5.308837890625, -4.42431640625, -3.539794921875, -2.6552734375, -1.770751953125, -0.88623046875, -0.001708984375, 0.8828125, 1.767333984375, 2.65185546875, 3.536376953125, 4.4208984375, 5.305419921875, 6.18994140625, 7.074462890625, 7.958984375, 8.843505859375, 9.72802734375, 10.612548828125, 11.4970703125, 12.381591796875, 13.26611328125, 14.150634765625, 15.03515625, 15.919677734375, 16.80419921875, 17.688720703125, 18.5732421875, 19.457763671875, 20.34228515625, 21.226806640625, 22.111328125, 22.995849609375, 23.88037109375, 24.764892578125, 25.6494140625, 26.533935546875, 27.41845703125, 28.302978515625, 29.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 13.0, 11.0, 17.0, 31.0, 39.0, 49.0, 71.0, 107.0, 110.0, 149.0, 222.0, 300.0, 425.0, 591.0, 516.0, 425.0, 237.0, 173.0, 150.0, 99.0, 86.0, 66.0, 42.0, 38.0, 25.0, 12.0, 19.0, 11.0, 9.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7578125, -13.309814453125, -12.86181640625, -12.413818359375, -11.9658203125, -11.517822265625, -11.06982421875, -10.621826171875, -10.173828125, -9.725830078125, -9.27783203125, -8.829833984375, -8.3818359375, -7.933837890625, -7.48583984375, -7.037841796875, -6.58984375, -6.141845703125, -5.69384765625, -5.245849609375, -4.7978515625, -4.349853515625, -3.90185546875, -3.453857421875, -3.005859375, -2.557861328125, -2.10986328125, -1.661865234375, -1.2138671875, -0.765869140625, -0.31787109375, 0.130126953125, 0.578125, 1.026123046875, 1.47412109375, 1.922119140625, 2.3701171875, 2.818115234375, 3.26611328125, 3.714111328125, 4.162109375, 4.610107421875, 5.05810546875, 5.506103515625, 5.9541015625, 6.402099609375, 6.85009765625, 7.298095703125, 7.74609375, 8.194091796875, 8.64208984375, 9.090087890625, 9.5380859375, 9.986083984375, 10.43408203125, 10.882080078125, 11.330078125, 11.778076171875, 12.22607421875, 12.674072265625, 13.1220703125, 13.570068359375, 14.01806640625, 14.466064453125, 14.9140625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 2.0, 8.0, 15.0, 15.0, 44.0, 60.0, 134.0, 257.0, 813.0, 5636.0, 4060491.0, 124258.0, 1738.0, 426.0, 168.0, 104.0, 45.0, 28.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9375, -79.435546875, -76.93359375, -74.431640625, -71.9296875, -69.427734375, -66.92578125, -64.423828125, -61.921875, -59.419921875, -56.91796875, -54.416015625, -51.9140625, -49.412109375, -46.91015625, -44.408203125, -41.90625, -39.404296875, -36.90234375, -34.400390625, -31.8984375, -29.396484375, -26.89453125, -24.392578125, -21.890625, -19.388671875, -16.88671875, -14.384765625, -11.8828125, -9.380859375, -6.87890625, -4.376953125, -1.875, 0.626953125, 3.12890625, 5.630859375, 8.1328125, 10.634765625, 13.13671875, 15.638671875, 18.140625, 20.642578125, 23.14453125, 25.646484375, 28.1484375, 30.650390625, 33.15234375, 35.654296875, 38.15625, 40.658203125, 43.16015625, 45.662109375, 48.1640625, 50.666015625, 53.16796875, 55.669921875, 58.171875, 60.673828125, 63.17578125, 65.677734375, 68.1796875, 70.681640625, 73.18359375, 75.685546875, 78.1875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 18.0, 410.0, 567.0, 18.0, 3.0, 2.0, 0.0, 1.0], "bins": [-562.8705444335938, -553.1758422851562, -543.4810791015625, -533.786376953125, -524.0916748046875, -514.3969116210938, -504.70220947265625, -495.00750732421875, -485.3127746582031, -475.6180419921875, -465.92333984375, -456.2286071777344, -446.53387451171875, -436.83917236328125, -427.1444396972656, -417.44970703125, -407.7550048828125, -398.0602722167969, -388.3655700683594, -378.67083740234375, -368.9761047363281, -359.2814025878906, -349.586669921875, -339.8919677734375, -330.19720458984375, -320.5024719238281, -310.8077697753906, -301.113037109375, -291.4183044433594, -281.7236022949219, -272.02886962890625, -262.33416748046875, -252.63941955566406, -242.9447021484375, -233.24996948242188, -223.5552520751953, -213.86053466796875, -204.16580200195312, -194.47108459472656, -184.7763671875, -175.08163452148438, -165.3869171142578, -155.6921844482422, -145.99746704101562, -136.30274963378906, -126.60802459716797, -116.91329956054688, -107.21858215332031, -97.52386474609375, -87.82913970947266, -78.1344223022461, -68.439697265625, -58.74497604370117, -49.050254821777344, -39.35552978515625, -29.660812377929688, -19.966087341308594, -10.27136516571045, -0.5766429901123047, 9.118080139160156, 18.812801361083984, 28.507522583007812, 38.202247619628906, 47.89696502685547, 57.59169006347656]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 5.0, 12.0, 18.0, 16.0, 14.0, 20.0, 30.0, 27.0, 18.0, 27.0, 35.0, 46.0, 53.0, 45.0, 52.0, 46.0, 41.0, 41.0, 41.0, 49.0, 34.0, 49.0, 39.0, 36.0, 27.0, 20.0, 21.0, 17.0, 16.0, 19.0, 9.0, 12.0, 10.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.919647216796875, -47.3433723449707, -45.76709747314453, -44.19082260131836, -42.61454772949219, -41.03827667236328, -39.46200180053711, -37.88572692871094, -36.309452056884766, -34.733177185058594, -33.15690231323242, -31.580629348754883, -30.00435447692871, -28.42807960510254, -26.851806640625, -25.275531768798828, -23.699256896972656, -22.122982025146484, -20.546707153320312, -18.970434188842773, -17.3941593170166, -15.81788444519043, -14.241610527038574, -12.665336608886719, -11.089061737060547, -9.512786865234375, -7.9365129470825195, -6.360238552093506, -4.783964157104492, -3.2076897621154785, -1.6314153671264648, -0.055141448974609375, 1.5211334228515625, 3.097407817840576, 4.67368221282959, 6.2499566078186035, 7.826231002807617, 9.402505874633789, 10.978779792785645, 12.5550537109375, 14.131328582763672, 15.707603454589844, 17.283878326416016, 18.860151290893555, 20.436426162719727, 22.0127010345459, 23.588973999023438, 25.16524887084961, 26.74152374267578, 28.317798614501953, 29.894073486328125, 31.470346450805664, 33.04662322998047, 34.622894287109375, 36.19916915893555, 37.77544403076172, 39.35171890258789, 40.92799377441406, 42.504268646240234, 44.080543518066406, 45.65681457519531, 47.233089447021484, 48.809364318847656, 50.38563919067383, 51.9619140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 11.0, 8.0, 21.0, 35.0, 48.0, 70.0, 103.0, 135.0, 239.0, 402.0, 581.0, 851.0, 1368.0, 2148.0, 3559.0, 5660.0, 9228.0, 14969.0, 24545.0, 40881.0, 68386.0, 121283.0, 235941.0, 230607.0, 118275.0, 66884.0, 39696.0, 24247.0, 14510.0, 8974.0, 5524.0, 3426.0, 2076.0, 1449.0, 837.0, 530.0, 361.0, 256.0, 139.0, 90.0, 71.0, 51.0, 25.0, 19.0, 13.0, 8.0, 7.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.056640625, -1.021392822265625, -0.98614501953125, -0.950897216796875, -0.9156494140625, -0.880401611328125, -0.84515380859375, -0.809906005859375, -0.774658203125, -0.739410400390625, -0.70416259765625, -0.668914794921875, -0.6336669921875, -0.598419189453125, -0.56317138671875, -0.527923583984375, -0.49267578125, -0.457427978515625, -0.42218017578125, -0.386932373046875, -0.3516845703125, -0.316436767578125, -0.28118896484375, -0.245941162109375, -0.210693359375, -0.175445556640625, -0.14019775390625, -0.104949951171875, -0.0697021484375, -0.034454345703125, 0.00079345703125, 0.036041259765625, 0.0712890625, 0.106536865234375, 0.14178466796875, 0.177032470703125, 0.2122802734375, 0.247528076171875, 0.28277587890625, 0.318023681640625, 0.353271484375, 0.388519287109375, 0.42376708984375, 0.459014892578125, 0.4942626953125, 0.529510498046875, 0.56475830078125, 0.600006103515625, 0.63525390625, 0.670501708984375, 0.70574951171875, 0.740997314453125, 0.7762451171875, 0.811492919921875, 0.84674072265625, 0.881988525390625, 0.917236328125, 0.952484130859375, 0.98773193359375, 1.022979736328125, 1.0582275390625, 1.093475341796875, 1.12872314453125, 1.163970947265625, 1.19921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 11.0, 11.0, 18.0, 19.0, 16.0, 15.0, 26.0, 26.0, 27.0, 32.0, 28.0, 24.0, 34.0, 37.0, 32.0, 38.0, 39.0, 1081.0, 33.0, 30.0, 38.0, 42.0, 46.0, 32.0, 47.0, 23.0, 30.0, 33.0, 27.0, 17.0, 20.0, 12.0, 12.0, 8.0, 12.0, 5.0, 3.0, 5.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3671875, -4.237152099609375, -4.10711669921875, -3.977081298828125, -3.8470458984375, -3.717010498046875, -3.58697509765625, -3.456939697265625, -3.326904296875, -3.196868896484375, -3.06683349609375, -2.936798095703125, -2.8067626953125, -2.676727294921875, -2.54669189453125, -2.416656494140625, -2.28662109375, -2.156585693359375, -2.02655029296875, -1.896514892578125, -1.7664794921875, -1.636444091796875, -1.50640869140625, -1.376373291015625, -1.246337890625, -1.116302490234375, -0.98626708984375, -0.856231689453125, -0.7261962890625, -0.596160888671875, -0.46612548828125, -0.336090087890625, -0.2060546875, -0.076019287109375, 0.05401611328125, 0.184051513671875, 0.3140869140625, 0.444122314453125, 0.57415771484375, 0.704193115234375, 0.834228515625, 0.964263916015625, 1.09429931640625, 1.224334716796875, 1.3543701171875, 1.484405517578125, 1.61444091796875, 1.744476318359375, 1.87451171875, 2.004547119140625, 2.13458251953125, 2.264617919921875, 2.3946533203125, 2.524688720703125, 2.65472412109375, 2.784759521484375, 2.914794921875, 3.044830322265625, 3.17486572265625, 3.304901123046875, 3.4349365234375, 3.564971923828125, 3.69500732421875, 3.825042724609375, 3.955078125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 8.0, 10.0, 10.0, 9.0, 32.0, 35.0, 45.0, 79.0, 118.0, 205.0, 281.0, 445.0, 633.0, 944.0, 1404.0, 2033.0, 3222.0, 4869.0, 7306.0, 11425.0, 17637.0, 27430.0, 43137.0, 69060.0, 113360.0, 204137.0, 1266911.0, 121157.0, 73469.0, 45648.0, 28908.0, 18343.0, 11704.0, 7883.0, 5112.0, 3407.0, 2282.0, 1526.0, 937.0, 610.0, 439.0, 305.0, 218.0, 140.0, 84.0, 71.0, 51.0, 22.0, 15.0, 14.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89501953125, -0.8652420043945312, -0.8354644775390625, -0.8056869506835938, -0.775909423828125, -0.7461318969726562, -0.7163543701171875, -0.6865768432617188, -0.65679931640625, -0.6270217895507812, -0.5972442626953125, -0.5674667358398438, -0.537689208984375, -0.5079116821289062, -0.4781341552734375, -0.44835662841796875, -0.4185791015625, -0.38880157470703125, -0.3590240478515625, -0.32924652099609375, -0.299468994140625, -0.26969146728515625, -0.2399139404296875, -0.21013641357421875, -0.18035888671875, -0.15058135986328125, -0.1208038330078125, -0.09102630615234375, -0.061248779296875, -0.03147125244140625, -0.0016937255859375, 0.02808380126953125, 0.057861328125, 0.08763885498046875, 0.1174163818359375, 0.14719390869140625, 0.176971435546875, 0.20674896240234375, 0.2365264892578125, 0.26630401611328125, 0.29608154296875, 0.32585906982421875, 0.3556365966796875, 0.38541412353515625, 0.415191650390625, 0.44496917724609375, 0.4747467041015625, 0.5045242309570312, 0.5343017578125, 0.5640792846679688, 0.5938568115234375, 0.6236343383789062, 0.653411865234375, 0.6831893920898438, 0.7129669189453125, 0.7427444458007812, 0.77252197265625, 0.8022994995117188, 0.8320770263671875, 0.8618545532226562, 0.891632080078125, 0.9214096069335938, 0.9511871337890625, 0.9809646606445312, 1.0107421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 7.0, 14.0, 22.0, 26.0, 26.0, 33.0, 34.0, 53.0, 64.0, 72.0, 82.0, 89.0, 82.0, 74.0, 57.0, 45.0, 44.0, 23.0, 35.0, 13.0, 14.0, 12.0, 13.0, 15.0, 6.0, 6.0, 10.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005064010620117188, -0.00048795342445373535, -0.00046950578689575195, -0.00045105814933776855, -0.00043261051177978516, -0.00041416287422180176, -0.00039571523666381836, -0.00037726759910583496, -0.00035881996154785156, -0.00034037232398986816, -0.00032192468643188477, -0.00030347704887390137, -0.00028502941131591797, -0.00026658177375793457, -0.00024813413619995117, -0.00022968649864196777, -0.00021123886108398438, -0.00019279122352600098, -0.00017434358596801758, -0.00015589594841003418, -0.00013744831085205078, -0.00011900067329406738, -0.00010055303573608398, -8.210539817810059e-05, -6.365776062011719e-05, -4.521012306213379e-05, -2.676248550415039e-05, -8.314847946166992e-06, 1.0132789611816406e-05, 2.8580427169799805e-05, 4.70280647277832e-05, 6.54757022857666e-05, 8.392333984375e-05, 0.0001023709774017334, 0.0001208186149597168, 0.0001392662525177002, 0.0001577138900756836, 0.000176161527633667, 0.0001946091651916504, 0.0002130568027496338, 0.0002315044403076172, 0.0002499520778656006, 0.000268399715423584, 0.0002868473529815674, 0.0003052949905395508, 0.0003237426280975342, 0.0003421902656555176, 0.000360637903213501, 0.0003790855407714844, 0.0003975331783294678, 0.00041598081588745117, 0.00043442845344543457, 0.00045287609100341797, 0.00047132372856140137, 0.0004897713661193848, 0.0005082190036773682, 0.0005266666412353516, 0.000545114278793335, 0.0005635619163513184, 0.0005820095539093018, 0.0006004571914672852, 0.0006189048290252686, 0.000637352466583252, 0.0006558001041412354, 0.0006742477416992188]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 21.0, 12.0, 29.0, 21.0, 44.0, 49.0, 49.0, 73.0, 115.0, 175.0, 266.0, 391.0, 777.0, 3341.0, 1028392.0, 12477.0, 869.0, 504.0, 287.0, 153.0, 137.0, 85.0, 59.0, 48.0, 45.0, 22.0, 21.0, 19.0, 10.0, 4.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0120086669921875, -0.011640310287475586, -0.011271953582763672, -0.010903596878051758, -0.010535240173339844, -0.01016688346862793, -0.009798526763916016, -0.009430170059204102, -0.009061813354492188, -0.008693456649780273, -0.00832509994506836, -0.007956743240356445, -0.007588386535644531, -0.007220029830932617, -0.006851673126220703, -0.006483316421508789, -0.006114959716796875, -0.005746603012084961, -0.005378246307373047, -0.005009889602661133, -0.004641532897949219, -0.004273176193237305, -0.0039048194885253906, -0.0035364627838134766, -0.0031681060791015625, -0.0027997493743896484, -0.0024313926696777344, -0.0020630359649658203, -0.0016946792602539062, -0.0013263225555419922, -0.0009579658508300781, -0.0005896091461181641, -0.00022125244140625, 0.00014710426330566406, 0.0005154609680175781, 0.0008838176727294922, 0.0012521743774414062, 0.0016205310821533203, 0.0019888877868652344, 0.0023572444915771484, 0.0027256011962890625, 0.0030939579010009766, 0.0034623146057128906, 0.0038306713104248047, 0.004199028015136719, 0.004567384719848633, 0.004935741424560547, 0.005304098129272461, 0.005672454833984375, 0.006040811538696289, 0.006409168243408203, 0.006777524948120117, 0.007145881652832031, 0.007514238357543945, 0.00788259506225586, 0.008250951766967773, 0.008619308471679688, 0.008987665176391602, 0.009356021881103516, 0.00972437858581543, 0.010092735290527344, 0.010461091995239258, 0.010829448699951172, 0.011197805404663086, 0.011566162109375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 42.0, 417.0, 478.0, 71.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007842280901968479, -0.0007322087767533958, -0.0006801894633099437, -0.0006281701498664916, -0.0005761508364230394, -0.0005241315229795873, -0.0004721122095361352, -0.0004200928960926831, -0.00036807358264923096, -0.00031605426920577884, -0.0002640349557623267, -0.0002120156423188746, -0.00015999632887542248, -0.00010797701543197036, -5.595770198851824e-05, -3.938388545066118e-06, 4.8080924898386e-05, 0.00010010023834183812, 0.00015211955178529024, 0.00020413886522874236, 0.0002561581786721945, 0.0003081774921156466, 0.0003601968055590987, 0.00041221611900255084, 0.00046423543244600296, 0.0005162547458894551, 0.0005682740593329072, 0.0006202933727763593, 0.0006723126862198114, 0.0007243319996632636, 0.0007763513131067157, 0.0008283706265501678, 0.0008803899399936199, 0.000932409253437072, 0.0009844285668805242, 0.0010364479385316372, 0.0010884671937674284, 0.0011404864490032196, 0.0011925058206543326, 0.0012445251923054457, 0.0012965444475412369, 0.001348563702777028, 0.0014005830744281411, 0.0014526024460792542, 0.0015046217013150454, 0.0015566409565508366, 0.0016086603282019496, 0.0016606796998530626, 0.0017126989550888538, 0.001764718210324645, 0.001816737581975758, 0.0018687569536268711, 0.0019207762088626623, 0.0019727954640984535, 0.0020248149521648884, 0.0020768342074006796, 0.002128853462636471, 0.002180872717872262, 0.002232891973108053, 0.002284911461174488, 0.0023369307164102793, 0.0023889499716460705, 0.0024409694597125053, 0.0024929887149482965, 0.0025450079701840878]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 5.0, 9.0, 6.0, 8.0, 13.0, 20.0, 14.0, 15.0, 26.0, 25.0, 25.0, 21.0, 29.0, 37.0, 44.0, 43.0, 40.0, 35.0, 43.0, 45.0, 40.0, 52.0, 47.0, 37.0, 41.0, 41.0, 36.0, 38.0, 27.0, 19.0, 27.0, 24.0, 16.0, 11.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 9.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002828240394592285, -0.0002743285149335861, -0.0002658329904079437, -0.00025733746588230133, -0.00024884194135665894, -0.00024034641683101654, -0.00023185089230537415, -0.00022335536777973175, -0.00021485984325408936, -0.00020636431872844696, -0.00019786879420280457, -0.00018937326967716217, -0.00018087774515151978, -0.00017238222062587738, -0.00016388669610023499, -0.0001553911715745926, -0.0001468956470489502, -0.0001384001225233078, -0.0001299045979976654, -0.00012140907347202301, -0.00011291354894638062, -0.00010441802442073822, -9.592249989509583e-05, -8.742697536945343e-05, -7.893145084381104e-05, -7.043592631816864e-05, -6.194040179252625e-05, -5.344487726688385e-05, -4.4949352741241455e-05, -3.645382821559906e-05, -2.7958303689956665e-05, -1.946277916431427e-05, -1.0967254638671875e-05, -2.47173011302948e-06, 6.023794412612915e-06, 1.451931893825531e-05, 2.3014843463897705e-05, 3.15103679895401e-05, 4.0005892515182495e-05, 4.850141704082489e-05, 5.6996941566467285e-05, 6.549246609210968e-05, 7.398799061775208e-05, 8.248351514339447e-05, 9.097903966903687e-05, 9.947456419467926e-05, 0.00010797008872032166, 0.00011646561324596405, 0.00012496113777160645, 0.00013345666229724884, 0.00014195218682289124, 0.00015044771134853363, 0.00015894323587417603, 0.00016743876039981842, 0.00017593428492546082, 0.0001844298094511032, 0.0001929253339767456, 0.000201420858502388, 0.0002099163830280304, 0.0002184119075536728, 0.00022690743207931519, 0.00023540295660495758, 0.00024389848113059998, 0.00025239400565624237, 0.00026088953018188477]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 14.0, 21.0, 21.0, 14.0, 25.0, 24.0, 42.0, 38.0, 30.0, 36.0, 48.0, 34.0, 33.0, 44.0, 52.0, 59.0, 50.0, 44.0, 39.0, 45.0, 46.0, 38.0, 30.0, 22.0, 27.0, 22.0, 20.0, 18.0, 12.0, 12.0, 5.0, 6.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.48248291015625, -7.2540283203125, -7.02557373046875, -6.797119140625, -6.56866455078125, -6.3402099609375, -6.11175537109375, -5.88330078125, -5.65484619140625, -5.4263916015625, -5.19793701171875, -4.969482421875, -4.74102783203125, -4.5125732421875, -4.28411865234375, -4.0556640625, -3.82720947265625, -3.5987548828125, -3.37030029296875, -3.141845703125, -2.91339111328125, -2.6849365234375, -2.45648193359375, -2.22802734375, -1.99957275390625, -1.7711181640625, -1.54266357421875, -1.314208984375, -1.08575439453125, -0.8572998046875, -0.62884521484375, -0.400390625, -0.17193603515625, 0.0565185546875, 0.28497314453125, 0.513427734375, 0.74188232421875, 0.9703369140625, 1.19879150390625, 1.42724609375, 1.65570068359375, 1.8841552734375, 2.11260986328125, 2.341064453125, 2.56951904296875, 2.7979736328125, 3.02642822265625, 3.2548828125, 3.48333740234375, 3.7117919921875, 3.94024658203125, 4.168701171875, 4.39715576171875, 4.6256103515625, 4.85406494140625, 5.08251953125, 5.31097412109375, 5.5394287109375, 5.76788330078125, 5.996337890625, 6.22479248046875, 6.4532470703125, 6.68170166015625, 6.91015625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 12.0, 15.0, 11.0, 20.0, 39.0, 60.0, 79.0, 136.0, 201.0, 292.0, 424.0, 677.0, 1091.0, 1732.0, 3107.0, 6679.0, 27989.0, 373184.0, 574544.0, 41568.0, 8039.0, 3390.0, 1919.0, 1171.0, 769.0, 489.0, 319.0, 184.0, 112.0, 90.0, 73.0, 49.0, 25.0, 14.0, 24.0, 3.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.55712890625, -16.9736328125, -16.39013671875, -15.806640625, -15.22314453125, -14.6396484375, -14.05615234375, -13.47265625, -12.88916015625, -12.3056640625, -11.72216796875, -11.138671875, -10.55517578125, -9.9716796875, -9.38818359375, -8.8046875, -8.22119140625, -7.6376953125, -7.05419921875, -6.470703125, -5.88720703125, -5.3037109375, -4.72021484375, -4.13671875, -3.55322265625, -2.9697265625, -2.38623046875, -1.802734375, -1.21923828125, -0.6357421875, -0.05224609375, 0.53125, 1.11474609375, 1.6982421875, 2.28173828125, 2.865234375, 3.44873046875, 4.0322265625, 4.61572265625, 5.19921875, 5.78271484375, 6.3662109375, 6.94970703125, 7.533203125, 8.11669921875, 8.7001953125, 9.28369140625, 9.8671875, 10.45068359375, 11.0341796875, 11.61767578125, 12.201171875, 12.78466796875, 13.3681640625, 13.95166015625, 14.53515625, 15.11865234375, 15.7021484375, 16.28564453125, 16.869140625, 17.45263671875, 18.0361328125, 18.61962890625, 19.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 3.0, 7.0, 9.0, 14.0, 17.0, 18.0, 29.0, 33.0, 27.0, 41.0, 46.0, 48.0, 43.0, 79.0, 204.0, 1624.0, 279.0, 97.0, 63.0, 47.0, 57.0, 46.0, 28.0, 43.0, 26.0, 21.0, 12.0, 12.0, 13.0, 9.0, 7.0, 3.0, 6.0, 5.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-18.875, -18.2978515625, -17.720703125, -17.1435546875, -16.56640625, -15.9892578125, -15.412109375, -14.8349609375, -14.2578125, -13.6806640625, -13.103515625, -12.5263671875, -11.94921875, -11.3720703125, -10.794921875, -10.2177734375, -9.640625, -9.0634765625, -8.486328125, -7.9091796875, -7.33203125, -6.7548828125, -6.177734375, -5.6005859375, -5.0234375, -4.4462890625, -3.869140625, -3.2919921875, -2.71484375, -2.1376953125, -1.560546875, -0.9833984375, -0.40625, 0.1708984375, 0.748046875, 1.3251953125, 1.90234375, 2.4794921875, 3.056640625, 3.6337890625, 4.2109375, 4.7880859375, 5.365234375, 5.9423828125, 6.51953125, 7.0966796875, 7.673828125, 8.2509765625, 8.828125, 9.4052734375, 9.982421875, 10.5595703125, 11.13671875, 11.7138671875, 12.291015625, 12.8681640625, 13.4453125, 14.0224609375, 14.599609375, 15.1767578125, 15.75390625, 16.3310546875, 16.908203125, 17.4853515625, 18.0625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 8.0, 7.0, 4.0, 9.0, 14.0, 29.0, 20.0, 27.0, 40.0, 43.0, 60.0, 57.0, 102.0, 124.0, 168.0, 267.0, 477.0, 1117.0, 7103.0, 3107598.0, 25295.0, 1459.0, 586.0, 305.0, 181.0, 134.0, 107.0, 83.0, 48.0, 57.0, 42.0, 26.0, 19.0, 18.0, 20.0, 9.0, 5.0, 12.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.9677734375, -44.466796875, -42.9658203125, -41.46484375, -39.9638671875, -38.462890625, -36.9619140625, -35.4609375, -33.9599609375, -32.458984375, -30.9580078125, -29.45703125, -27.9560546875, -26.455078125, -24.9541015625, -23.453125, -21.9521484375, -20.451171875, -18.9501953125, -17.44921875, -15.9482421875, -14.447265625, -12.9462890625, -11.4453125, -9.9443359375, -8.443359375, -6.9423828125, -5.44140625, -3.9404296875, -2.439453125, -0.9384765625, 0.5625, 2.0634765625, 3.564453125, 5.0654296875, 6.56640625, 8.0673828125, 9.568359375, 11.0693359375, 12.5703125, 14.0712890625, 15.572265625, 17.0732421875, 18.57421875, 20.0751953125, 21.576171875, 23.0771484375, 24.578125, 26.0791015625, 27.580078125, 29.0810546875, 30.58203125, 32.0830078125, 33.583984375, 35.0849609375, 36.5859375, 38.0869140625, 39.587890625, 41.0888671875, 42.58984375, 44.0908203125, 45.591796875, 47.0927734375, 48.59375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 8.0, 17.0, 40.0, 70.0, 114.0, 164.0, 167.0, 180.0, 107.0, 72.0, 28.0, 20.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.86111831665039, -41.53313446044922, -40.20515060424805, -38.87716293334961, -37.54917907714844, -36.221195220947266, -34.893211364746094, -33.56522750854492, -32.23724365234375, -30.909259796142578, -29.581274032592773, -28.2532901763916, -26.925304412841797, -25.597320556640625, -24.269336700439453, -22.94135284423828, -21.613365173339844, -20.285381317138672, -18.957395553588867, -17.629411697387695, -16.30142593383789, -14.973442077636719, -13.645458221435547, -12.317473411560059, -10.98948860168457, -9.661503791809082, -8.333518981933594, -7.005535125732422, -5.677550315856934, -4.349565505981445, -3.0215811729431152, -1.6935968399047852, -0.36560821533203125, 0.9623763561248779, 2.290360927581787, 3.6183454990386963, 4.9463300704956055, 6.274314880371094, 7.602299213409424, 8.930283546447754, 10.258268356323242, 11.58625316619873, 12.914237976074219, 14.24222183227539, 15.570206642150879, 16.898191452026367, 18.22617530822754, 19.554161071777344, 20.882144927978516, 22.210128784179688, 23.538114547729492, 24.866098403930664, 26.19408416748047, 27.52206802368164, 28.850051879882812, 30.178035736083984, 31.50602149963379, 32.834007263183594, 34.161991119384766, 35.48997497558594, 36.81795883178711, 38.14594268798828, 39.47393035888672, 40.80191421508789, 42.12989807128906]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 7.0, 9.0, 12.0, 7.0, 14.0, 14.0, 19.0, 18.0, 33.0, 39.0, 26.0, 21.0, 40.0, 41.0, 48.0, 37.0, 39.0, 55.0, 49.0, 47.0, 30.0, 48.0, 31.0, 19.0, 33.0, 36.0, 24.0, 22.0, 34.0, 19.0, 25.0, 16.0, 16.0, 9.0, 14.0, 9.0, 11.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-54.39656066894531, -52.722900390625, -51.04924392700195, -49.37558364868164, -47.701927185058594, -46.02826690673828, -44.354610443115234, -42.68095016479492, -41.007293701171875, -39.33363342285156, -37.659976959228516, -35.9863166809082, -34.312660217285156, -32.638999938964844, -30.965343475341797, -29.291683197021484, -27.618024826049805, -25.944366455078125, -24.270708084106445, -22.597049713134766, -20.923391342163086, -19.249732971191406, -17.576072692871094, -15.90241527557373, -14.22875690460205, -12.555098533630371, -10.881440162658691, -9.207780838012695, -7.534122943878174, -5.860464096069336, -4.186805725097656, -2.5131473541259766, -0.8394889831542969, 0.8341695070266724, 2.5078279972076416, 4.1814866065979, 5.85514497756958, 7.528803825378418, 9.202462196350098, 10.876120567321777, 12.549778938293457, 14.223437309265137, 15.897095680236816, 17.570755004882812, 19.244413375854492, 20.918071746826172, 22.59173011779785, 24.26538848876953, 25.93904685974121, 27.61270523071289, 29.28636360168457, 30.96002197265625, 32.63368225097656, 34.30733871459961, 35.98099899291992, 37.65465545654297, 39.32831573486328, 41.001976013183594, 42.67563247680664, 44.34929275512695, 46.02294921875, 47.69660949707031, 49.37026596069336, 51.04392623901367, 52.71758270263672]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 9.0, 9.0, 4.0, 15.0, 15.0, 16.0, 23.0, 22.0, 20.0, 34.0, 51.0, 33.0, 35.0, 52.0, 58.0, 52.0, 54.0, 41.0, 54.0, 34.0, 46.0, 41.0, 39.0, 37.0, 29.0, 29.0, 26.0, 20.0, 17.0, 34.0, 17.0, 12.0, 5.0, 8.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.140625, -8.8951416015625, -8.649658203125, -8.4041748046875, -8.15869140625, -7.9132080078125, -7.667724609375, -7.4222412109375, -7.1767578125, -6.9312744140625, -6.685791015625, -6.4403076171875, -6.19482421875, -5.9493408203125, -5.703857421875, -5.4583740234375, -5.212890625, -4.9674072265625, -4.721923828125, -4.4764404296875, -4.23095703125, -3.9854736328125, -3.739990234375, -3.4945068359375, -3.2490234375, -3.0035400390625, -2.758056640625, -2.5125732421875, -2.26708984375, -2.0216064453125, -1.776123046875, -1.5306396484375, -1.28515625, -1.0396728515625, -0.794189453125, -0.5487060546875, -0.30322265625, -0.0577392578125, 0.187744140625, 0.4332275390625, 0.6787109375, 0.9241943359375, 1.169677734375, 1.4151611328125, 1.66064453125, 1.9061279296875, 2.151611328125, 2.3970947265625, 2.642578125, 2.8880615234375, 3.133544921875, 3.3790283203125, 3.62451171875, 3.8699951171875, 4.115478515625, 4.3609619140625, 4.6064453125, 4.8519287109375, 5.097412109375, 5.3428955078125, 5.58837890625, 5.8338623046875, 6.079345703125, 6.3248291015625, 6.5703125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 24.0, 26.0, 21.0, 43.0, 36.0, 76.0, 95.0, 145.0, 183.0, 325.0, 469.0, 785.0, 1252.0, 2412.0, 5423.0, 15014.0, 66552.0, 489791.0, 2062971.0, 1298972.0, 198383.0, 33438.0, 9602.0, 3630.0, 1808.0, 1013.0, 566.0, 371.0, 266.0, 157.0, 113.0, 81.0, 69.0, 41.0, 28.0, 24.0, 12.0, 15.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-12.5234375, -12.1734619140625, -11.823486328125, -11.4735107421875, -11.12353515625, -10.7735595703125, -10.423583984375, -10.0736083984375, -9.7236328125, -9.3736572265625, -9.023681640625, -8.6737060546875, -8.32373046875, -7.9737548828125, -7.623779296875, -7.2738037109375, -6.923828125, -6.5738525390625, -6.223876953125, -5.8739013671875, -5.52392578125, -5.1739501953125, -4.823974609375, -4.4739990234375, -4.1240234375, -3.7740478515625, -3.424072265625, -3.0740966796875, -2.72412109375, -2.3741455078125, -2.024169921875, -1.6741943359375, -1.32421875, -0.9742431640625, -0.624267578125, -0.2742919921875, 0.07568359375, 0.4256591796875, 0.775634765625, 1.1256103515625, 1.4755859375, 1.8255615234375, 2.175537109375, 2.5255126953125, 2.87548828125, 3.2254638671875, 3.575439453125, 3.9254150390625, 4.275390625, 4.6253662109375, 4.975341796875, 5.3253173828125, 5.67529296875, 6.0252685546875, 6.375244140625, 6.7252197265625, 7.0751953125, 7.4251708984375, 7.775146484375, 8.1251220703125, 8.47509765625, 8.8250732421875, 9.175048828125, 9.5250244140625, 9.875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 13.0, 15.0, 41.0, 108.0, 393.0, 1098.0, 1620.0, 561.0, 167.0, 50.0, 10.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.650390625, -40.26953125, -38.888671875, -37.5078125, -36.126953125, -34.74609375, -33.365234375, -31.984375, -30.603515625, -29.22265625, -27.841796875, -26.4609375, -25.080078125, -23.69921875, -22.318359375, -20.9375, -19.556640625, -18.17578125, -16.794921875, -15.4140625, -14.033203125, -12.65234375, -11.271484375, -9.890625, -8.509765625, -7.12890625, -5.748046875, -4.3671875, -2.986328125, -1.60546875, -0.224609375, 1.15625, 2.537109375, 3.91796875, 5.298828125, 6.6796875, 8.060546875, 9.44140625, 10.822265625, 12.203125, 13.583984375, 14.96484375, 16.345703125, 17.7265625, 19.107421875, 20.48828125, 21.869140625, 23.25, 24.630859375, 26.01171875, 27.392578125, 28.7734375, 30.154296875, 31.53515625, 32.916015625, 34.296875, 35.677734375, 37.05859375, 38.439453125, 39.8203125, 41.201171875, 42.58203125, 43.962890625, 45.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 4.0, 19.0, 42.0, 75.0, 205.0, 756.0, 4187.0, 4170022.0, 17055.0, 1309.0, 360.0, 130.0, 48.0, 21.0, 12.0, 8.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3125, -87.548828125, -84.78515625, -82.021484375, -79.2578125, -76.494140625, -73.73046875, -70.966796875, -68.203125, -65.439453125, -62.67578125, -59.912109375, -57.1484375, -54.384765625, -51.62109375, -48.857421875, -46.09375, -43.330078125, -40.56640625, -37.802734375, -35.0390625, -32.275390625, -29.51171875, -26.748046875, -23.984375, -21.220703125, -18.45703125, -15.693359375, -12.9296875, -10.166015625, -7.40234375, -4.638671875, -1.875, 0.888671875, 3.65234375, 6.416015625, 9.1796875, 11.943359375, 14.70703125, 17.470703125, 20.234375, 22.998046875, 25.76171875, 28.525390625, 31.2890625, 34.052734375, 36.81640625, 39.580078125, 42.34375, 45.107421875, 47.87109375, 50.634765625, 53.3984375, 56.162109375, 58.92578125, 61.689453125, 64.453125, 67.216796875, 69.98046875, 72.744140625, 75.5078125, 78.271484375, 81.03515625, 83.798828125, 86.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 85.0, 592.0, 319.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.76255798339844, -240.84356689453125, -233.92457580566406, -227.00558471679688, -220.08657836914062, -213.16758728027344, -206.24859619140625, -199.32960510253906, -192.41061401367188, -185.4916229248047, -178.5726318359375, -171.65362548828125, -164.73463439941406, -157.81564331054688, -150.8966522216797, -143.9776611328125, -137.05865478515625, -130.13966369628906, -123.22066497802734, -116.30167388916016, -109.38267517089844, -102.46368408203125, -95.54469299316406, -88.62570190429688, -81.70670318603516, -74.78771209716797, -67.86871337890625, -60.94972229003906, -54.03072738647461, -47.111732482910156, -40.19274139404297, -33.273746490478516, -26.354736328125, -19.435741424560547, -12.516748428344727, -5.597755432128906, 1.3212394714355469, 8.240234375, 15.159225463867188, 22.07822036743164, 28.997215270996094, 35.91621017456055, 42.835205078125, 49.75419616699219, 56.67319107055664, 63.592185974121094, 70.51117706298828, 77.43017578125, 84.34916687011719, 91.26815795898438, 98.1871566772461, 105.10614776611328, 112.025146484375, 118.94413757324219, 125.86312866210938, 132.78211975097656, 139.70111083984375, 146.62010192871094, 153.53909301757812, 160.45809936523438, 167.37709045410156, 174.29608154296875, 181.21507263183594, 188.13406372070312, 195.05307006835938]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 7.0, 13.0, 12.0, 14.0, 14.0, 18.0, 18.0, 31.0, 30.0, 29.0, 29.0, 26.0, 55.0, 52.0, 41.0, 48.0, 42.0, 34.0, 46.0, 29.0, 48.0, 38.0, 38.0, 32.0, 28.0, 36.0, 23.0, 23.0, 26.0, 17.0, 19.0, 26.0, 9.0, 9.0, 6.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.628509521484375, -38.98917770385742, -37.3498420715332, -35.71051025390625, -34.0711784362793, -32.431846618652344, -30.792510986328125, -29.153179168701172, -27.513845443725586, -25.87451171875, -24.235179901123047, -22.59584617614746, -20.956512451171875, -19.317180633544922, -17.677846908569336, -16.03851318359375, -14.399181365966797, -12.759848594665527, -11.120515823364258, -9.481182098388672, -7.841849327087402, -6.202516555786133, -4.563182830810547, -2.9238500595092773, -1.2845172882080078, 0.3548157215118408, 1.9941487312316895, 3.633481979370117, 5.272814750671387, 6.912147521972656, 8.551481246948242, 10.190814018249512, 11.830146789550781, 13.46947956085205, 15.10881233215332, 16.748146057128906, 18.38747787475586, 20.026811599731445, 21.66614532470703, 23.305477142333984, 24.94481086730957, 26.584144592285156, 28.22347640991211, 29.862810134887695, 31.50214385986328, 33.141475677490234, 34.78080749511719, 36.420143127441406, 38.05947494506836, 39.69880676269531, 41.33814239501953, 42.977474212646484, 44.61680603027344, 46.256141662597656, 47.89547348022461, 49.53480529785156, 51.17414093017578, 52.813472747802734, 54.45280838012695, 56.092140197753906, 57.73147201538086, 59.37080383300781, 61.01013946533203, 62.649471282958984, 64.28880310058594]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 31.0, 25.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 11.0, 17.0, 10.0, 29.0, 60.0, 76.0, 120.0, 199.0, 333.0, 531.0, 823.0, 1387.0, 2300.0, 3780.0, 6559.0, 11006.0, 18940.0, 32984.0, 59873.0, 112297.0, 224341.0, 271457.0, 136546.0, 71385.0, 39389.0, 22318.0, 12918.0, 7511.0, 4451.0, 2707.0, 1603.0, 946.0, 589.0, 384.0, 262.0, 150.0, 92.0, 51.0, 44.0, 22.0, 14.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.962890625, -0.9298553466796875, -0.896820068359375, -0.8637847900390625, -0.83074951171875, -0.7977142333984375, -0.764678955078125, -0.7316436767578125, -0.6986083984375, -0.6655731201171875, -0.632537841796875, -0.5995025634765625, -0.56646728515625, -0.5334320068359375, -0.500396728515625, -0.4673614501953125, -0.434326171875, -0.4012908935546875, -0.368255615234375, -0.3352203369140625, -0.30218505859375, -0.2691497802734375, -0.236114501953125, -0.2030792236328125, -0.1700439453125, -0.1370086669921875, -0.103973388671875, -0.0709381103515625, -0.03790283203125, -0.0048675537109375, 0.028167724609375, 0.0612030029296875, 0.09423828125, 0.1272735595703125, 0.160308837890625, 0.1933441162109375, 0.22637939453125, 0.2594146728515625, 0.292449951171875, 0.3254852294921875, 0.3585205078125, 0.3915557861328125, 0.424591064453125, 0.4576263427734375, 0.49066162109375, 0.5236968994140625, 0.556732177734375, 0.5897674560546875, 0.622802734375, 0.6558380126953125, 0.688873291015625, 0.7219085693359375, 0.75494384765625, 0.7879791259765625, 0.821014404296875, 0.8540496826171875, 0.8870849609375, 0.9201202392578125, 0.953155517578125, 0.9861907958984375, 1.01922607421875, 1.0522613525390625, 1.085296630859375, 1.1183319091796875, 1.1513671875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 11.0, 18.0, 13.0, 12.0, 29.0, 26.0, 21.0, 25.0, 27.0, 34.0, 33.0, 37.0, 59.0, 44.0, 30.0, 1086.0, 34.0, 45.0, 45.0, 43.0, 39.0, 39.0, 32.0, 31.0, 25.0, 25.0, 26.0, 14.0, 18.0, 21.0, 10.0, 5.0, 9.0, 9.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.10302734375, -2.9912109375, -2.87939453125, -2.767578125, -2.65576171875, -2.5439453125, -2.43212890625, -2.3203125, -2.20849609375, -2.0966796875, -1.98486328125, -1.873046875, -1.76123046875, -1.6494140625, -1.53759765625, -1.42578125, -1.31396484375, -1.2021484375, -1.09033203125, -0.978515625, -0.86669921875, -0.7548828125, -0.64306640625, -0.53125, -0.41943359375, -0.3076171875, -0.19580078125, -0.083984375, 0.02783203125, 0.1396484375, 0.25146484375, 0.36328125, 0.47509765625, 0.5869140625, 0.69873046875, 0.810546875, 0.92236328125, 1.0341796875, 1.14599609375, 1.2578125, 1.36962890625, 1.4814453125, 1.59326171875, 1.705078125, 1.81689453125, 1.9287109375, 2.04052734375, 2.15234375, 2.26416015625, 2.3759765625, 2.48779296875, 2.599609375, 2.71142578125, 2.8232421875, 2.93505859375, 3.046875, 3.15869140625, 3.2705078125, 3.38232421875, 3.494140625, 3.60595703125, 3.7177734375, 3.82958984375, 3.94140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 11.0, 24.0, 20.0, 53.0, 73.0, 115.0, 152.0, 261.0, 377.0, 560.0, 819.0, 1430.0, 2106.0, 3165.0, 4943.0, 7481.0, 11731.0, 18655.0, 29653.0, 48221.0, 80743.0, 144426.0, 1299193.0, 184080.0, 101107.0, 59432.0, 36068.0, 22623.0, 14003.0, 9042.0, 5726.0, 3860.0, 2417.0, 1577.0, 1022.0, 708.0, 445.0, 272.0, 191.0, 113.0, 88.0, 49.0, 35.0, 18.0, 16.0, 7.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.86572265625, -0.8400344848632812, -0.8143463134765625, -0.7886581420898438, -0.762969970703125, -0.7372817993164062, -0.7115936279296875, -0.6859054565429688, -0.66021728515625, -0.6345291137695312, -0.6088409423828125, -0.5831527709960938, -0.557464599609375, -0.5317764282226562, -0.5060882568359375, -0.48040008544921875, -0.4547119140625, -0.42902374267578125, -0.4033355712890625, -0.37764739990234375, -0.351959228515625, -0.32627105712890625, -0.3005828857421875, -0.27489471435546875, -0.24920654296875, -0.22351837158203125, -0.1978302001953125, -0.17214202880859375, -0.146453857421875, -0.12076568603515625, -0.0950775146484375, -0.06938934326171875, -0.043701171875, -0.01801300048828125, 0.0076751708984375, 0.03336334228515625, 0.059051513671875, 0.08473968505859375, 0.1104278564453125, 0.13611602783203125, 0.16180419921875, 0.18749237060546875, 0.2131805419921875, 0.23886871337890625, 0.264556884765625, 0.29024505615234375, 0.3159332275390625, 0.34162139892578125, 0.3673095703125, 0.39299774169921875, 0.4186859130859375, 0.44437408447265625, 0.470062255859375, 0.49575042724609375, 0.5214385986328125, 0.5471267700195312, 0.57281494140625, 0.5985031127929688, 0.6241912841796875, 0.6498794555664062, 0.675567626953125, 0.7012557983398438, 0.7269439697265625, 0.7526321411132812, 0.7783203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 11.0, 13.0, 19.0, 31.0, 29.0, 38.0, 52.0, 54.0, 73.0, 66.0, 76.0, 68.0, 74.0, 71.0, 61.0, 51.0, 35.0, 31.0, 17.0, 16.0, 19.0, 17.0, 7.0, 8.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007538646459579468, -0.0007290542125701904, -0.0007042437791824341, -0.0006794333457946777, -0.0006546229124069214, -0.000629812479019165, -0.0006050020456314087, -0.0005801916122436523, -0.000555381178855896, -0.0005305707454681396, -0.0005057603120803833, -0.00048094987869262695, -0.0004561394453048706, -0.00043132901191711426, -0.0004065185785293579, -0.00038170814514160156, -0.0003568977117538452, -0.00033208727836608887, -0.0003072768449783325, -0.00028246641159057617, -0.0002576559782028198, -0.00023284554481506348, -0.00020803511142730713, -0.00018322467803955078, -0.00015841424465179443, -0.00013360381126403809, -0.00010879337787628174, -8.398294448852539e-05, -5.917251110076904e-05, -3.4362077713012695e-05, -9.551644325256348e-06, 1.52587890625e-05, 4.006922245025635e-05, 6.48796558380127e-05, 8.969008922576904e-05, 0.00011450052261352539, 0.00013931095600128174, 0.00016412138938903809, 0.00018893182277679443, 0.00021374225616455078, 0.00023855268955230713, 0.0002633631229400635, 0.0002881735563278198, 0.00031298398971557617, 0.0003377944231033325, 0.00036260485649108887, 0.0003874152898788452, 0.00041222572326660156, 0.0004370361566543579, 0.00046184659004211426, 0.0004866570234298706, 0.000511467456817627, 0.0005362778902053833, 0.0005610883235931396, 0.000585898756980896, 0.0006107091903686523, 0.0006355196237564087, 0.000660330057144165, 0.0006851404905319214, 0.0007099509239196777, 0.0007347613573074341, 0.0007595717906951904, 0.0007843822240829468, 0.0008091926574707031]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 11.0, 12.0, 13.0, 18.0, 15.0, 33.0, 31.0, 34.0, 53.0, 72.0, 92.0, 144.0, 218.0, 280.0, 497.0, 1020.0, 23066.0, 1019262.0, 1576.0, 707.0, 397.0, 254.0, 175.0, 146.0, 96.0, 69.0, 55.0, 46.0, 35.0, 28.0, 18.0, 21.0, 12.0, 12.0, 4.0, 7.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01226806640625, -0.011887550354003906, -0.011507034301757812, -0.011126518249511719, -0.010746002197265625, -0.010365486145019531, -0.009984970092773438, -0.009604454040527344, -0.00922393798828125, -0.008843421936035156, -0.008462905883789062, -0.008082389831542969, -0.007701873779296875, -0.007321357727050781, -0.0069408416748046875, -0.006560325622558594, -0.0061798095703125, -0.005799293518066406, -0.0054187774658203125, -0.005038261413574219, -0.004657745361328125, -0.004277229309082031, -0.0038967132568359375, -0.0035161972045898438, -0.00313568115234375, -0.0027551651000976562, -0.0023746490478515625, -0.0019941329956054688, -0.001613616943359375, -0.0012331008911132812, -0.0008525848388671875, -0.00047206878662109375, -9.1552734375e-05, 0.00028896331787109375, 0.0006694793701171875, 0.0010499954223632812, 0.001430511474609375, 0.0018110275268554688, 0.0021915435791015625, 0.0025720596313476562, 0.00295257568359375, 0.0033330917358398438, 0.0037136077880859375, 0.004094123840332031, 0.004474639892578125, 0.004855155944824219, 0.0052356719970703125, 0.005616188049316406, 0.0059967041015625, 0.006377220153808594, 0.0067577362060546875, 0.007138252258300781, 0.007518768310546875, 0.007899284362792969, 0.008279800415039062, 0.008660316467285156, 0.00904083251953125, 0.009421348571777344, 0.009801864624023438, 0.010182380676269531, 0.010562896728515625, 0.010943412780761719, 0.011323928833007812, 0.011704444885253906, 0.0120849609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 815.0, 192.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019121458753943443, -0.0018243335653096437, -0.0017365212552249432, -0.0016487089451402426, -0.0015608965186402202, -0.0014730842085555196, -0.001385271898470819, -0.0012974594719707966, -0.001209647161886096, -0.0011218348518013954, -0.0010340225417166948, -0.0009462101734243333, -0.0008583978051319718, -0.0007705854950472713, -0.0006827731849625707, -0.0005949608166702092, -0.0005071485647931695, -0.00041933622560463846, -0.0003315238864161074, -0.00024371157633140683, -0.0001558992371428758, -6.808689795434475e-05, 1.9725412130355835e-05, 0.00010753778042271733, 0.00019535009050741792, 0.00028316242969594896, 0.00037097476888448, 0.0004587870789691806, 0.0005465993890538812, 0.0006344117573462427, 0.0007222240674309433, 0.0008100364357233047, 0.0008978487458080053, 0.000985661055892706, 0.0010734733659774065, 0.001161285676062107, 0.0012490981025621295, 0.00133691041264683, 0.0014247227227315307, 0.001512535149231553, 0.0016003474593162537, 0.0016881597694009542, 0.0017759720794856548, 0.0018637843895703554, 0.0019515968160703778, 0.0020394092425704002, 0.002127221319824457, 0.0022150338627398014, 0.0023028459399938583, 0.002390658250078559, 0.0024784705601632595, 0.00256628287024796, 0.0026540951803326607, 0.002741907723248005, 0.002829719800502062, 0.002917532343417406, 0.0030053446535021067, 0.0030931569635868073, 0.003180969273671508, 0.0032687815837562084, 0.003356593893840909, 0.0034444062039256096, 0.003532218746840954, 0.0036200310569256544, 0.003707843367010355]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 6.0, 4.0, 10.0, 10.0, 10.0, 9.0, 11.0, 13.0, 17.0, 17.0, 23.0, 33.0, 28.0, 30.0, 43.0, 33.0, 40.0, 34.0, 42.0, 47.0, 35.0, 40.0, 40.0, 33.0, 41.0, 37.0, 39.0, 33.0, 28.0, 34.0, 25.0, 28.0, 22.0, 11.0, 21.0, 14.0, 8.0, 13.0, 13.0, 6.0, 4.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000335693359375, -0.0003247419372200966, -0.0003137905150651932, -0.00030283909291028976, -0.00029188767075538635, -0.00028093624860048294, -0.00026998482644557953, -0.0002590334042906761, -0.0002480819821357727, -0.0002371305599808693, -0.00022617913782596588, -0.00021522771567106247, -0.00020427629351615906, -0.00019332487136125565, -0.00018237344920635223, -0.00017142202705144882, -0.0001604706048965454, -0.000149519182741642, -0.00013856776058673859, -0.00012761633843183517, -0.00011666491627693176, -0.00010571349412202835, -9.476207196712494e-05, -8.381064981222153e-05, -7.285922765731812e-05, -6.19078055024147e-05, -5.095638334751129e-05, -4.000496119260788e-05, -2.9053539037704468e-05, -1.8102116882801056e-05, -7.150694727897644e-06, 3.800727427005768e-06, 1.475214958190918e-05, 2.570357173681259e-05, 3.6654993891716003e-05, 4.7606416046619415e-05, 5.855783820152283e-05, 6.950926035642624e-05, 8.046068251132965e-05, 9.141210466623306e-05, 0.00010236352682113647, 0.00011331494897603989, 0.0001242663711309433, 0.0001352177932858467, 0.00014616921544075012, 0.00015712063759565353, 0.00016807205975055695, 0.00017902348190546036, 0.00018997490406036377, 0.00020092632621526718, 0.0002118777483701706, 0.000222829170525074, 0.00023378059267997742, 0.00024473201483488083, 0.00025568343698978424, 0.00026663485914468765, 0.00027758628129959106, 0.0002885377034544945, 0.0002994891256093979, 0.0003104405477643013, 0.0003213919699192047, 0.0003323433920741081, 0.00034329481422901154, 0.00035424623638391495, 0.00036519765853881836]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 8.0, 12.0, 7.0, 13.0, 12.0, 12.0, 13.0, 15.0, 18.0, 25.0, 25.0, 28.0, 23.0, 26.0, 41.0, 38.0, 35.0, 37.0, 42.0, 43.0, 51.0, 38.0, 36.0, 30.0, 38.0, 44.0, 27.0, 29.0, 32.0, 30.0, 26.0, 18.0, 21.0, 14.0, 14.0, 11.0, 6.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.62109375, -4.46685791015625, -4.3126220703125, -4.15838623046875, -4.004150390625, -3.84991455078125, -3.6956787109375, -3.54144287109375, -3.38720703125, -3.23297119140625, -3.0787353515625, -2.92449951171875, -2.770263671875, -2.61602783203125, -2.4617919921875, -2.30755615234375, -2.1533203125, -1.99908447265625, -1.8448486328125, -1.69061279296875, -1.536376953125, -1.38214111328125, -1.2279052734375, -1.07366943359375, -0.91943359375, -0.76519775390625, -0.6109619140625, -0.45672607421875, -0.302490234375, -0.14825439453125, 0.0059814453125, 0.16021728515625, 0.314453125, 0.46868896484375, 0.6229248046875, 0.77716064453125, 0.931396484375, 1.08563232421875, 1.2398681640625, 1.39410400390625, 1.54833984375, 1.70257568359375, 1.8568115234375, 2.01104736328125, 2.165283203125, 2.31951904296875, 2.4737548828125, 2.62799072265625, 2.7822265625, 2.93646240234375, 3.0906982421875, 3.24493408203125, 3.399169921875, 3.55340576171875, 3.7076416015625, 3.86187744140625, 4.01611328125, 4.17034912109375, 4.3245849609375, 4.47882080078125, 4.633056640625, 4.78729248046875, 4.9415283203125, 5.09576416015625, 5.25]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 9.0, 11.0, 13.0, 18.0, 21.0, 29.0, 29.0, 47.0, 40.0, 80.0, 88.0, 134.0, 177.0, 254.0, 378.0, 604.0, 1000.0, 1737.0, 3690.0, 8814.0, 25052.0, 98952.0, 542341.0, 282807.0, 54008.0, 15715.0, 5930.0, 2650.0, 1400.0, 817.0, 529.0, 326.0, 224.0, 173.0, 112.0, 76.0, 59.0, 52.0, 36.0, 28.0, 22.0, 16.0, 12.0, 5.0, 9.0, 4.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-8.890625, -8.6019287109375, -8.313232421875, -8.0245361328125, -7.73583984375, -7.4471435546875, -7.158447265625, -6.8697509765625, -6.5810546875, -6.2923583984375, -6.003662109375, -5.7149658203125, -5.42626953125, -5.1375732421875, -4.848876953125, -4.5601806640625, -4.271484375, -3.9827880859375, -3.694091796875, -3.4053955078125, -3.11669921875, -2.8280029296875, -2.539306640625, -2.2506103515625, -1.9619140625, -1.6732177734375, -1.384521484375, -1.0958251953125, -0.80712890625, -0.5184326171875, -0.229736328125, 0.0589599609375, 0.34765625, 0.6363525390625, 0.925048828125, 1.2137451171875, 1.50244140625, 1.7911376953125, 2.079833984375, 2.3685302734375, 2.6572265625, 2.9459228515625, 3.234619140625, 3.5233154296875, 3.81201171875, 4.1007080078125, 4.389404296875, 4.6781005859375, 4.966796875, 5.2554931640625, 5.544189453125, 5.8328857421875, 6.12158203125, 6.4102783203125, 6.698974609375, 6.9876708984375, 7.2763671875, 7.5650634765625, 7.853759765625, 8.1424560546875, 8.43115234375, 8.7198486328125, 9.008544921875, 9.2972412109375, 9.5859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 3.0, 4.0, 12.0, 9.0, 18.0, 14.0, 17.0, 22.0, 39.0, 41.0, 48.0, 61.0, 64.0, 86.0, 264.0, 1801.0, 151.0, 76.0, 52.0, 46.0, 39.0, 43.0, 29.0, 29.0, 16.0, 16.0, 15.0, 7.0, 11.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.939208984375, -16.36279296875, -15.786376953125, -15.2099609375, -14.633544921875, -14.05712890625, -13.480712890625, -12.904296875, -12.327880859375, -11.75146484375, -11.175048828125, -10.5986328125, -10.022216796875, -9.44580078125, -8.869384765625, -8.29296875, -7.716552734375, -7.14013671875, -6.563720703125, -5.9873046875, -5.410888671875, -4.83447265625, -4.258056640625, -3.681640625, -3.105224609375, -2.52880859375, -1.952392578125, -1.3759765625, -0.799560546875, -0.22314453125, 0.353271484375, 0.9296875, 1.506103515625, 2.08251953125, 2.658935546875, 3.2353515625, 3.811767578125, 4.38818359375, 4.964599609375, 5.541015625, 6.117431640625, 6.69384765625, 7.270263671875, 7.8466796875, 8.423095703125, 8.99951171875, 9.575927734375, 10.15234375, 10.728759765625, 11.30517578125, 11.881591796875, 12.4580078125, 13.034423828125, 13.61083984375, 14.187255859375, 14.763671875, 15.340087890625, 15.91650390625, 16.492919921875, 17.0693359375, 17.645751953125, 18.22216796875, 18.798583984375, 19.375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 16.0, 23.0, 24.0, 41.0, 48.0, 62.0, 113.0, 241.0, 540.0, 1557.0, 3074440.0, 66520.0, 1073.0, 440.0, 195.0, 96.0, 80.0, 38.0, 29.0, 25.0, 19.0, 12.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.4775390625, -51.798828125, -50.1201171875, -48.44140625, -46.7626953125, -45.083984375, -43.4052734375, -41.7265625, -40.0478515625, -38.369140625, -36.6904296875, -35.01171875, -33.3330078125, -31.654296875, -29.9755859375, -28.296875, -26.6181640625, -24.939453125, -23.2607421875, -21.58203125, -19.9033203125, -18.224609375, -16.5458984375, -14.8671875, -13.1884765625, -11.509765625, -9.8310546875, -8.15234375, -6.4736328125, -4.794921875, -3.1162109375, -1.4375, 0.2412109375, 1.919921875, 3.5986328125, 5.27734375, 6.9560546875, 8.634765625, 10.3134765625, 11.9921875, 13.6708984375, 15.349609375, 17.0283203125, 18.70703125, 20.3857421875, 22.064453125, 23.7431640625, 25.421875, 27.1005859375, 28.779296875, 30.4580078125, 32.13671875, 33.8154296875, 35.494140625, 37.1728515625, 38.8515625, 40.5302734375, 42.208984375, 43.8876953125, 45.56640625, 47.2451171875, 48.923828125, 50.6025390625, 52.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 84.0, 550.0, 348.0, 28.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.81062316894531, -87.4964828491211, -85.18234252929688, -82.86819458007812, -80.5540542602539, -78.23991394042969, -75.92576599121094, -73.61162567138672, -71.2974853515625, -68.98334503173828, -66.66920471191406, -64.35505676269531, -62.040916442871094, -59.726776123046875, -57.41263198852539, -55.098487854003906, -52.78434753417969, -50.47020721435547, -48.156063079833984, -45.8419189453125, -43.52777862548828, -41.21363830566406, -38.89949417114258, -36.585350036621094, -34.271209716796875, -31.957067489624023, -29.642925262451172, -27.32878303527832, -25.01464080810547, -22.700498580932617, -20.386356353759766, -18.072214126586914, -15.758068084716797, -13.443925857543945, -11.129783630371094, -8.815641403198242, -6.501499176025391, -4.187356948852539, -1.8732147216796875, 0.44092750549316406, 2.7550697326660156, 5.069211959838867, 7.383354187011719, 9.69749641418457, 12.011638641357422, 14.325780868530273, 16.639923095703125, 18.954065322875977, 21.268207550048828, 23.58234977722168, 25.89649200439453, 28.210634231567383, 30.524776458740234, 32.83892059326172, 35.15306091308594, 37.467201232910156, 39.78134536743164, 42.095489501953125, 44.409629821777344, 46.72377014160156, 49.03791427612305, 51.35205841064453, 53.66619873046875, 55.98033905029297, 58.29448318481445]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 10.0, 6.0, 9.0, 26.0, 16.0, 17.0, 18.0, 24.0, 29.0, 34.0, 27.0, 23.0, 36.0, 35.0, 39.0, 34.0, 52.0, 53.0, 36.0, 51.0, 50.0, 43.0, 36.0, 29.0, 37.0, 26.0, 33.0, 25.0, 19.0, 22.0, 11.0, 13.0, 4.0, 17.0, 7.0, 4.0, 11.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.075252532958984, -32.07883834838867, -31.08242416381836, -30.086009979248047, -29.089595794677734, -28.093181610107422, -27.096765518188477, -26.100351333618164, -25.10393714904785, -24.10752296447754, -23.111108779907227, -22.114694595336914, -21.11827850341797, -20.121864318847656, -19.125450134277344, -18.12903594970703, -17.13262176513672, -16.136207580566406, -15.139793395996094, -14.143378257751465, -13.146964073181152, -12.15054988861084, -11.154134750366211, -10.157720565795898, -9.161306381225586, -8.164892196655273, -7.168477535247803, -6.172062873840332, -5.1756486892700195, -4.179234504699707, -3.1828198432922363, -2.1864051818847656, -1.1899909973144531, -0.19357657432556152, 0.8028378486633301, 1.7992522716522217, 2.7956666946411133, 3.792080879211426, 4.7884955406188965, 5.784910202026367, 6.78132438659668, 7.777738571166992, 8.774152755737305, 9.770567893981934, 10.766982078552246, 11.763396263122559, 12.759811401367188, 13.7562255859375, 14.752639770507812, 15.749053955078125, 16.745468139648438, 17.74188232421875, 18.738296508789062, 19.734710693359375, 20.73112678527832, 21.727540969848633, 22.723955154418945, 23.720369338989258, 24.71678352355957, 25.713197708129883, 26.709613800048828, 27.70602798461914, 28.702442169189453, 29.698856353759766, 30.695270538330078]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 3.0, 13.0, 7.0, 7.0, 14.0, 10.0, 9.0, 17.0, 19.0, 19.0, 26.0, 21.0, 22.0, 34.0, 38.0, 49.0, 42.0, 51.0, 37.0, 40.0, 56.0, 48.0, 39.0, 33.0, 37.0, 47.0, 32.0, 29.0, 29.0, 32.0, 22.0, 18.0, 19.0, 18.0, 8.0, 9.0, 11.0, 13.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.880859375, -5.6796875, -5.478515625, -5.27734375, -5.076171875, -4.875, -4.673828125, -4.47265625, -4.271484375, -4.0703125, -3.869140625, -3.66796875, -3.466796875, -3.265625, -3.064453125, -2.86328125, -2.662109375, -2.4609375, -2.259765625, -2.05859375, -1.857421875, -1.65625, -1.455078125, -1.25390625, -1.052734375, -0.8515625, -0.650390625, -0.44921875, -0.248046875, -0.046875, 0.154296875, 0.35546875, 0.556640625, 0.7578125, 0.958984375, 1.16015625, 1.361328125, 1.5625, 1.763671875, 1.96484375, 2.166015625, 2.3671875, 2.568359375, 2.76953125, 2.970703125, 3.171875, 3.373046875, 3.57421875, 3.775390625, 3.9765625, 4.177734375, 4.37890625, 4.580078125, 4.78125, 4.982421875, 5.18359375, 5.384765625, 5.5859375, 5.787109375, 5.98828125, 6.189453125, 6.390625, 6.591796875, 6.79296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 9.0, 12.0, 16.0, 21.0, 27.0, 34.0, 35.0, 44.0, 66.0, 54.0, 94.0, 74.0, 122.0, 175.0, 216.0, 319.0, 489.0, 900.0, 2054.0, 14125.0, 2930471.0, 1233033.0, 7681.0, 1772.0, 719.0, 436.0, 288.0, 241.0, 166.0, 119.0, 82.0, 59.0, 57.0, 46.0, 44.0, 36.0, 31.0, 19.0, 20.0, 14.0, 17.0, 12.0, 8.0, 10.0, 7.0, 0.0, 1.0, 4.0, 2.0], "bins": [-44.8125, -43.56396484375, -42.3154296875, -41.06689453125, -39.818359375, -38.56982421875, -37.3212890625, -36.07275390625, -34.82421875, -33.57568359375, -32.3271484375, -31.07861328125, -29.830078125, -28.58154296875, -27.3330078125, -26.08447265625, -24.8359375, -23.58740234375, -22.3388671875, -21.09033203125, -19.841796875, -18.59326171875, -17.3447265625, -16.09619140625, -14.84765625, -13.59912109375, -12.3505859375, -11.10205078125, -9.853515625, -8.60498046875, -7.3564453125, -6.10791015625, -4.859375, -3.61083984375, -2.3623046875, -1.11376953125, 0.134765625, 1.38330078125, 2.6318359375, 3.88037109375, 5.12890625, 6.37744140625, 7.6259765625, 8.87451171875, 10.123046875, 11.37158203125, 12.6201171875, 13.86865234375, 15.1171875, 16.36572265625, 17.6142578125, 18.86279296875, 20.111328125, 21.35986328125, 22.6083984375, 23.85693359375, 25.10546875, 26.35400390625, 27.6025390625, 28.85107421875, 30.099609375, 31.34814453125, 32.5966796875, 33.84521484375, 35.09375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 21.0, 23.0, 56.0, 82.0, 186.0, 375.0, 685.0, 951.0, 729.0, 428.0, 237.0, 114.0, 58.0, 45.0, 18.0, 10.0, 8.0, 7.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.3515625, -12.8302001953125, -12.308837890625, -11.7874755859375, -11.26611328125, -10.7447509765625, -10.223388671875, -9.7020263671875, -9.1806640625, -8.6593017578125, -8.137939453125, -7.6165771484375, -7.09521484375, -6.5738525390625, -6.052490234375, -5.5311279296875, -5.009765625, -4.4884033203125, -3.967041015625, -3.4456787109375, -2.92431640625, -2.4029541015625, -1.881591796875, -1.3602294921875, -0.8388671875, -0.3175048828125, 0.203857421875, 0.7252197265625, 1.24658203125, 1.7679443359375, 2.289306640625, 2.8106689453125, 3.33203125, 3.8533935546875, 4.374755859375, 4.8961181640625, 5.41748046875, 5.9388427734375, 6.460205078125, 6.9815673828125, 7.5029296875, 8.0242919921875, 8.545654296875, 9.0670166015625, 9.58837890625, 10.1097412109375, 10.631103515625, 11.1524658203125, 11.673828125, 12.1951904296875, 12.716552734375, 13.2379150390625, 13.75927734375, 14.2806396484375, 14.802001953125, 15.3233642578125, 15.8447265625, 16.3660888671875, 16.887451171875, 17.4088134765625, 17.93017578125, 18.4515380859375, 18.972900390625, 19.4942626953125, 20.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 17.0, 24.0, 50.0, 120.0, 186.0, 492.0, 1762.0, 10817.0, 349651.0, 3759685.0, 64873.0, 4799.0, 1037.0, 373.0, 138.0, 93.0, 63.0, 25.0, 12.0, 4.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.5625, -20.80078125, -20.0390625, -19.27734375, -18.515625, -17.75390625, -16.9921875, -16.23046875, -15.46875, -14.70703125, -13.9453125, -13.18359375, -12.421875, -11.66015625, -10.8984375, -10.13671875, -9.375, -8.61328125, -7.8515625, -7.08984375, -6.328125, -5.56640625, -4.8046875, -4.04296875, -3.28125, -2.51953125, -1.7578125, -0.99609375, -0.234375, 0.52734375, 1.2890625, 2.05078125, 2.8125, 3.57421875, 4.3359375, 5.09765625, 5.859375, 6.62109375, 7.3828125, 8.14453125, 8.90625, 9.66796875, 10.4296875, 11.19140625, 11.953125, 12.71484375, 13.4765625, 14.23828125, 15.0, 15.76171875, 16.5234375, 17.28515625, 18.046875, 18.80859375, 19.5703125, 20.33203125, 21.09375, 21.85546875, 22.6171875, 23.37890625, 24.140625, 24.90234375, 25.6640625, 26.42578125, 27.1875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 7.0, 2.0, 9.0, 13.0, 23.0, 32.0, 52.0, 106.0, 143.0, 145.0, 113.0, 135.0, 86.0, 52.0, 34.0, 26.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.99544525146484, -69.30860900878906, -66.62176513671875, -63.93492889404297, -61.24809265136719, -58.561256408691406, -55.87441635131836, -53.18757629394531, -50.50074005126953, -47.81390380859375, -45.1270637512207, -42.440223693847656, -39.753387451171875, -37.066551208496094, -34.37971115112305, -31.692873001098633, -29.00603485107422, -26.319196701049805, -23.63235855102539, -20.945520401000977, -18.258682250976562, -15.571844100952148, -12.885005950927734, -10.19816780090332, -7.511329650878906, -4.824491500854492, -2.137653350830078, 0.5491847991943359, 3.23602294921875, 5.922861099243164, 8.609699249267578, 11.296537399291992, 13.983367919921875, 16.67020606994629, 19.357044219970703, 22.043882369995117, 24.73072052001953, 27.417558670043945, 30.10439682006836, 32.791236877441406, 35.47807312011719, 38.16490936279297, 40.851749420166016, 43.53858947753906, 46.225425720214844, 48.912261962890625, 51.59910202026367, 54.28594207763672, 56.9727783203125, 59.65961456298828, 62.34645462036133, 65.03329467773438, 67.72013092041016, 70.40696716308594, 73.09381103515625, 75.78064727783203, 78.46748352050781, 81.1543197631836, 83.84115600585938, 86.52799987792969, 89.21483612060547, 91.90167236328125, 94.58851623535156, 97.27535247802734, 99.96218872070312]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 8.0, 9.0, 11.0, 16.0, 17.0, 20.0, 16.0, 21.0, 25.0, 32.0, 27.0, 41.0, 31.0, 44.0, 39.0, 40.0, 38.0, 39.0, 48.0, 41.0, 36.0, 34.0, 40.0, 33.0, 34.0, 35.0, 25.0, 28.0, 24.0, 30.0, 14.0, 17.0, 20.0, 10.0, 6.0, 6.0, 10.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.24128723144531, -31.13075065612793, -30.020212173461914, -28.90967559814453, -27.799137115478516, -26.688600540161133, -25.57806396484375, -24.467525482177734, -23.35698890686035, -22.24645233154297, -21.135913848876953, -20.02537727355957, -18.914840698242188, -17.804302215576172, -16.69376564025879, -15.58322811126709, -14.47269058227539, -13.362153053283691, -12.251615524291992, -11.14107894897461, -10.03054141998291, -8.920003890991211, -7.80946683883667, -6.698929786682129, -5.58839225769043, -4.4778547286987305, -3.3673176765441895, -2.2567803859710693, -1.1462430953979492, -0.03570556640625, 1.074831485748291, 2.185368537902832, 3.2959060668945312, 4.4064435958862305, 5.5169806480407715, 6.6275177001953125, 7.738055229187012, 8.848592758178711, 9.959129333496094, 11.069666862487793, 12.180204391479492, 13.290741920471191, 14.40127944946289, 15.511816024780273, 16.622352600097656, 17.732891082763672, 18.843427658081055, 19.953964233398438, 21.064502716064453, 22.175039291381836, 23.28557777404785, 24.396114349365234, 25.50665283203125, 26.617189407348633, 27.727725982666016, 28.83826446533203, 29.948801040649414, 31.059337615966797, 32.16987609863281, 33.28041458129883, 34.39094924926758, 35.501487731933594, 36.61202621459961, 37.72256088256836, 38.833099365234375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 23.0, 24.0, 39.0, 35.0, 38.0, 36.0, 53.0, 39.0, 50.0, 39.0, 41.0, 44.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 16.0, 28.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.60986328125, -45.8759765625, -44.14208984375, -42.408203125, -40.67431640625, -38.9404296875, -37.20654296875, -35.47265625, -33.73876953125, -32.0048828125, -30.27099609375, -28.537109375, -26.80322265625, -25.0693359375, -23.33544921875, -21.6015625, -19.86767578125, -18.1337890625, -16.39990234375, -14.666015625, -12.93212890625, -11.1982421875, -9.46435546875, -7.73046875, -5.99658203125, -4.2626953125, -2.52880859375, -0.794921875, 0.93896484375, 2.6728515625, 4.40673828125, 6.140625, 7.87451171875, 9.6083984375, 11.34228515625, 13.076171875, 14.81005859375, 16.5439453125, 18.27783203125, 20.01171875, 21.74560546875, 23.4794921875, 25.21337890625, 26.947265625, 28.68115234375, 30.4150390625, 32.14892578125, 33.8828125, 35.61669921875, 37.3505859375, 39.08447265625, 40.818359375, 42.55224609375, 44.2861328125, 46.02001953125, 47.75390625, 49.48779296875, 51.2216796875, 52.95556640625, 54.689453125, 56.42333984375, 58.1572265625, 59.89111328125, 61.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 11.0, 16.0, 21.0, 21.0, 24.0, 46.0, 80.0, 86.0, 150.0, 246.0, 498.0, 788.0, 1433.0, 2427.0, 4171.0, 7434.0, 13343.0, 25150.0, 48245.0, 95708.0, 194768.0, 303926.0, 172069.0, 84490.0, 42984.0, 22600.0, 12007.0, 6716.0, 3771.0, 2179.0, 1328.0, 691.0, 438.0, 260.0, 142.0, 96.0, 75.0, 38.0, 27.0, 11.0, 13.0, 9.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -10.120361328125, -9.76416015625, -9.407958984375, -9.0517578125, -8.695556640625, -8.33935546875, -7.983154296875, -7.626953125, -7.270751953125, -6.91455078125, -6.558349609375, -6.2021484375, -5.845947265625, -5.48974609375, -5.133544921875, -4.77734375, -4.421142578125, -4.06494140625, -3.708740234375, -3.3525390625, -2.996337890625, -2.64013671875, -2.283935546875, -1.927734375, -1.571533203125, -1.21533203125, -0.859130859375, -0.5029296875, -0.146728515625, 0.20947265625, 0.565673828125, 0.921875, 1.278076171875, 1.63427734375, 1.990478515625, 2.3466796875, 2.702880859375, 3.05908203125, 3.415283203125, 3.771484375, 4.127685546875, 4.48388671875, 4.840087890625, 5.1962890625, 5.552490234375, 5.90869140625, 6.264892578125, 6.62109375, 6.977294921875, 7.33349609375, 7.689697265625, 8.0458984375, 8.402099609375, 8.75830078125, 9.114501953125, 9.470703125, 9.826904296875, 10.18310546875, 10.539306640625, 10.8955078125, 11.251708984375, 11.60791015625, 11.964111328125, 12.3203125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 14.0, 16.0, 18.0, 12.0, 21.0, 26.0, 20.0, 31.0, 24.0, 27.0, 37.0, 40.0, 31.0, 34.0, 41.0, 39.0, 1070.0, 31.0, 46.0, 42.0, 40.0, 32.0, 32.0, 33.0, 28.0, 31.0, 21.0, 31.0, 20.0, 15.0, 17.0, 11.0, 10.0, 12.0, 7.0, 11.0, 7.0, 6.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.59375, -33.569580078125, -32.54541015625, -31.521240234375, -30.4970703125, -29.472900390625, -28.44873046875, -27.424560546875, -26.400390625, -25.376220703125, -24.35205078125, -23.327880859375, -22.3037109375, -21.279541015625, -20.25537109375, -19.231201171875, -18.20703125, -17.182861328125, -16.15869140625, -15.134521484375, -14.1103515625, -13.086181640625, -12.06201171875, -11.037841796875, -10.013671875, -8.989501953125, -7.96533203125, -6.941162109375, -5.9169921875, -4.892822265625, -3.86865234375, -2.844482421875, -1.8203125, -0.796142578125, 0.22802734375, 1.252197265625, 2.2763671875, 3.300537109375, 4.32470703125, 5.348876953125, 6.373046875, 7.397216796875, 8.42138671875, 9.445556640625, 10.4697265625, 11.493896484375, 12.51806640625, 13.542236328125, 14.56640625, 15.590576171875, 16.61474609375, 17.638916015625, 18.6630859375, 19.687255859375, 20.71142578125, 21.735595703125, 22.759765625, 23.783935546875, 24.80810546875, 25.832275390625, 26.8564453125, 27.880615234375, 28.90478515625, 29.928955078125, 30.953125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 9.0, 6.0, 13.0, 19.0, 28.0, 50.0, 69.0, 116.0, 148.0, 224.0, 368.0, 489.0, 856.0, 1244.0, 1912.0, 2789.0, 4096.0, 6190.0, 9393.0, 14672.0, 22080.0, 33854.0, 52633.0, 82189.0, 134749.0, 1268514.0, 171920.0, 103131.0, 64621.0, 41634.0, 26906.0, 17779.0, 11482.0, 7640.0, 5130.0, 3435.0, 2298.0, 1526.0, 1003.0, 657.0, 422.0, 300.0, 201.0, 112.0, 66.0, 69.0, 35.0, 20.0, 18.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.8984375, -7.664306640625, -7.43017578125, -7.196044921875, -6.9619140625, -6.727783203125, -6.49365234375, -6.259521484375, -6.025390625, -5.791259765625, -5.55712890625, -5.322998046875, -5.0888671875, -4.854736328125, -4.62060546875, -4.386474609375, -4.15234375, -3.918212890625, -3.68408203125, -3.449951171875, -3.2158203125, -2.981689453125, -2.74755859375, -2.513427734375, -2.279296875, -2.045166015625, -1.81103515625, -1.576904296875, -1.3427734375, -1.108642578125, -0.87451171875, -0.640380859375, -0.40625, -0.172119140625, 0.06201171875, 0.296142578125, 0.5302734375, 0.764404296875, 0.99853515625, 1.232666015625, 1.466796875, 1.700927734375, 1.93505859375, 2.169189453125, 2.4033203125, 2.637451171875, 2.87158203125, 3.105712890625, 3.33984375, 3.573974609375, 3.80810546875, 4.042236328125, 4.2763671875, 4.510498046875, 4.74462890625, 4.978759765625, 5.212890625, 5.447021484375, 5.68115234375, 5.915283203125, 6.1494140625, 6.383544921875, 6.61767578125, 6.851806640625, 7.0859375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 7.0, 9.0, 18.0, 15.0, 12.0, 19.0, 26.0, 31.0, 29.0, 38.0, 36.0, 36.0, 44.0, 56.0, 55.0, 72.0, 69.0, 56.0, 49.0, 38.0, 51.0, 34.0, 31.0, 30.0, 23.0, 18.0, 19.0, 22.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007305145263671875, -0.007081449031829834, -0.006857752799987793, -0.006634056568145752, -0.006410360336303711, -0.00618666410446167, -0.005962967872619629, -0.005739271640777588, -0.005515575408935547, -0.005291879177093506, -0.005068182945251465, -0.004844486713409424, -0.004620790481567383, -0.004397094249725342, -0.004173398017883301, -0.00394970178604126, -0.0037260055541992188, -0.0035023093223571777, -0.0032786130905151367, -0.0030549168586730957, -0.0028312206268310547, -0.0026075243949890137, -0.0023838281631469727, -0.0021601319313049316, -0.0019364356994628906, -0.0017127394676208496, -0.0014890432357788086, -0.0012653470039367676, -0.0010416507720947266, -0.0008179545402526855, -0.0005942583084106445, -0.0003705620765686035, -0.0001468658447265625, 7.683038711547852e-05, 0.00030052661895751953, 0.0005242228507995605, 0.0007479190826416016, 0.0009716153144836426, 0.0011953115463256836, 0.0014190077781677246, 0.0016427040100097656, 0.0018664002418518066, 0.0020900964736938477, 0.0023137927055358887, 0.0025374889373779297, 0.0027611851692199707, 0.0029848814010620117, 0.0032085776329040527, 0.0034322738647460938, 0.0036559700965881348, 0.0038796663284301758, 0.004103362560272217, 0.004327058792114258, 0.004550755023956299, 0.00477445125579834, 0.004998147487640381, 0.005221843719482422, 0.005445539951324463, 0.005669236183166504, 0.005892932415008545, 0.006116628646850586, 0.006340324878692627, 0.006564021110534668, 0.006787717342376709, 0.00701141357421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 16.0, 15.0, 13.0, 24.0, 26.0, 40.0, 66.0, 77.0, 108.0, 175.0, 252.0, 385.0, 634.0, 1109.0, 2881.0, 10136.0, 50185.0, 340683.0, 533954.0, 85041.0, 15307.0, 3879.0, 1479.0, 696.0, 402.0, 262.0, 203.0, 141.0, 100.0, 71.0, 55.0, 29.0, 23.0, 19.0, 20.0, 8.0, 6.0, 8.0, 7.0, 0.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.056182861328125, -0.05448770523071289, -0.05279254913330078, -0.05109739303588867, -0.04940223693847656, -0.04770708084106445, -0.046011924743652344, -0.044316768646240234, -0.042621612548828125, -0.040926456451416016, -0.039231300354003906, -0.0375361442565918, -0.03584098815917969, -0.03414583206176758, -0.03245067596435547, -0.03075551986694336, -0.02906036376953125, -0.02736520767211914, -0.02567005157470703, -0.023974895477294922, -0.022279739379882812, -0.020584583282470703, -0.018889427185058594, -0.017194271087646484, -0.015499114990234375, -0.013803958892822266, -0.012108802795410156, -0.010413646697998047, -0.008718490600585938, -0.007023334503173828, -0.005328178405761719, -0.0036330223083496094, -0.0019378662109375, -0.00024271011352539062, 0.0014524459838867188, 0.003147602081298828, 0.0048427581787109375, 0.006537914276123047, 0.008233070373535156, 0.009928226470947266, 0.011623382568359375, 0.013318538665771484, 0.015013694763183594, 0.016708850860595703, 0.018404006958007812, 0.020099163055419922, 0.02179431915283203, 0.02348947525024414, 0.02518463134765625, 0.02687978744506836, 0.02857494354248047, 0.030270099639892578, 0.03196525573730469, 0.0336604118347168, 0.035355567932128906, 0.037050724029541016, 0.038745880126953125, 0.040441036224365234, 0.042136192321777344, 0.04383134841918945, 0.04552650451660156, 0.04722166061401367, 0.04891681671142578, 0.05061197280883789, 0.05230712890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 14.0, 16.0, 25.0, 51.0, 95.0, 139.0, 170.0, 173.0, 139.0, 74.0, 56.0, 28.0, 13.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.014539824798703194, -0.014208639971911907, -0.013877456076443195, -0.013546271249651909, -0.013215087354183197, -0.01288390252739191, -0.012552717700600624, -0.012221533805131912, -0.0118903499096632, -0.011559165082871914, -0.011227981187403202, -0.010896796360611916, -0.010565612465143204, -0.010234427638351917, -0.00990324281156063, -0.009572058916091919, -0.009240874089300632, -0.008909689262509346, -0.008578505367040634, -0.008247320540249348, -0.007916136644780636, -0.007584951817989349, -0.00725376745685935, -0.006922583095729351, -0.006591398734599352, -0.006260214373469353, -0.0059290300123393536, -0.005597845651209354, -0.005266660824418068, -0.004935476928949356, -0.00460429210215807, -0.0042731077410280704, -0.003941923845559359, -0.0036107394844293594, -0.0032795551232993603, -0.0029483705293387175, -0.0026171861682087183, -0.002286001807078719, -0.0019548172131180763, -0.0016236328519880772, -0.001292448490858078, -0.0009612640715204179, -0.0006300796521827579, -0.00029889517463743687, 3.2289186492562294e-05, 0.00036347354762256145, 0.0006946581415832043, 0.0010258425027132034, 0.0013570268638432026, 0.0016882112249732018, 0.002019395586103201, 0.0023505801800638437, 0.002681764541193843, 0.003012948902323842, 0.003344133496284485, 0.003675317857414484, 0.004006502218544483, 0.004337686579674482, 0.0046688709408044815, 0.005000055767595768, 0.00533123966306448, 0.005662424489855766, 0.0059936088509857655, 0.006324793212115765, 0.006655977573245764]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 4.0, 5.0, 10.0, 9.0, 13.0, 11.0, 20.0, 20.0, 22.0, 26.0, 29.0, 19.0, 30.0, 25.0, 40.0, 23.0, 33.0, 31.0, 40.0, 53.0, 41.0, 40.0, 46.0, 28.0, 37.0, 28.0, 31.0, 32.0, 31.0, 29.0, 20.0, 28.0, 19.0, 20.0, 14.0, 17.0, 10.0, 17.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.003273904323577881, -0.003166566602885723, -0.0030592288821935654, -0.0029518911615014076, -0.00284455344080925, -0.002737215720117092, -0.0026298779994249344, -0.0025225402787327766, -0.002415202558040619, -0.002307864837348461, -0.0022005271166563034, -0.0020931893959641457, -0.001985851675271988, -0.0018785139545798302, -0.0017711762338876724, -0.0016638385131955147, -0.001556500792503357, -0.0014491630718111992, -0.0013418253511190414, -0.0012344876304268837, -0.001127149909734726, -0.0010198121890425682, -0.0009124744683504105, -0.0008051367476582527, -0.000697799026966095, -0.0005904613062739372, -0.0004831235855817795, -0.00037578586488962173, -0.000268448144197464, -0.00016111042350530624, -5.37727028131485e-05, 5.356501787900925e-05, 0.000160902738571167, 0.00026824045926332474, 0.0003755781799554825, 0.00048291590064764023, 0.000590253621339798, 0.0006975913420319557, 0.0008049290627241135, 0.0009122667834162712, 0.001019604504108429, 0.0011269422248005867, 0.0012342799454927444, 0.0013416176661849022, 0.00144895538687706, 0.0015562931075692177, 0.0016636308282613754, 0.0017709685489535332, 0.001878306269645691, 0.0019856439903378487, 0.0020929817110300064, 0.002200319431722164, 0.002307657152414322, 0.0024149948731064796, 0.0025223325937986374, 0.002629670314490795, 0.002737008035182953, 0.0028443457558751106, 0.0029516834765672684, 0.003059021197259426, 0.003166358917951584, 0.0032736966386437416, 0.0033810343593358994, 0.003488372080028057, 0.003595709800720215]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 9.0, 11.0, 22.0, 16.0, 23.0, 30.0, 24.0, 23.0, 39.0, 34.0, 39.0, 36.0, 53.0, 40.0, 49.0, 39.0, 44.0, 41.0, 40.0, 40.0, 28.0, 43.0, 30.0, 34.0, 29.0, 23.0, 18.0, 26.0, 12.0, 15.0, 11.0, 8.0, 10.0, 10.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.609375, -45.875, -44.140625, -42.40625, -40.671875, -38.9375, -37.203125, -35.46875, -33.734375, -32.0, -30.265625, -28.53125, -26.796875, -25.0625, -23.328125, -21.59375, -19.859375, -18.125, -16.390625, -14.65625, -12.921875, -11.1875, -9.453125, -7.71875, -5.984375, -4.25, -2.515625, -0.78125, 0.953125, 2.6875, 4.421875, 6.15625, 7.890625, 9.625, 11.359375, 13.09375, 14.828125, 16.5625, 18.296875, 20.03125, 21.765625, 23.5, 25.234375, 26.96875, 28.703125, 30.4375, 32.171875, 33.90625, 35.640625, 37.375, 39.109375, 40.84375, 42.578125, 44.3125, 46.046875, 47.78125, 49.515625, 51.25, 52.984375, 54.71875, 56.453125, 58.1875, 59.921875, 61.65625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 10.0, 11.0, 21.0, 22.0, 18.0, 33.0, 48.0, 76.0, 107.0, 167.0, 266.0, 498.0, 890.0, 1829.0, 3895.0, 9665.0, 35704.0, 241512.0, 621348.0, 100866.0, 19355.0, 6368.0, 2755.0, 1337.0, 704.0, 411.0, 196.0, 132.0, 88.0, 52.0, 45.0, 34.0, 22.0, 22.0, 18.0, 4.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.8828125, -13.3338623046875, -12.784912109375, -12.2359619140625, -11.68701171875, -11.1380615234375, -10.589111328125, -10.0401611328125, -9.4912109375, -8.9422607421875, -8.393310546875, -7.8443603515625, -7.29541015625, -6.7464599609375, -6.197509765625, -5.6485595703125, -5.099609375, -4.5506591796875, -4.001708984375, -3.4527587890625, -2.90380859375, -2.3548583984375, -1.805908203125, -1.2569580078125, -0.7080078125, -0.1590576171875, 0.389892578125, 0.9388427734375, 1.48779296875, 2.0367431640625, 2.585693359375, 3.1346435546875, 3.68359375, 4.2325439453125, 4.781494140625, 5.3304443359375, 5.87939453125, 6.4283447265625, 6.977294921875, 7.5262451171875, 8.0751953125, 8.6241455078125, 9.173095703125, 9.7220458984375, 10.27099609375, 10.8199462890625, 11.368896484375, 11.9178466796875, 12.466796875, 13.0157470703125, 13.564697265625, 14.1136474609375, 14.66259765625, 15.2115478515625, 15.760498046875, 16.3094482421875, 16.8583984375, 17.4073486328125, 17.956298828125, 18.5052490234375, 19.05419921875, 19.6031494140625, 20.152099609375, 20.7010498046875, 21.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 11.0, 14.0, 28.0, 28.0, 36.0, 48.0, 70.0, 103.0, 101.0, 2147.0, 107.0, 80.0, 84.0, 54.0, 41.0, 32.0, 24.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-162.5, -157.533203125, -152.56640625, -147.599609375, -142.6328125, -137.666015625, -132.69921875, -127.732421875, -122.765625, -117.798828125, -112.83203125, -107.865234375, -102.8984375, -97.931640625, -92.96484375, -87.998046875, -83.03125, -78.064453125, -73.09765625, -68.130859375, -63.1640625, -58.197265625, -53.23046875, -48.263671875, -43.296875, -38.330078125, -33.36328125, -28.396484375, -23.4296875, -18.462890625, -13.49609375, -8.529296875, -3.5625, 1.404296875, 6.37109375, 11.337890625, 16.3046875, 21.271484375, 26.23828125, 31.205078125, 36.171875, 41.138671875, 46.10546875, 51.072265625, 56.0390625, 61.005859375, 65.97265625, 70.939453125, 75.90625, 80.873046875, 85.83984375, 90.806640625, 95.7734375, 100.740234375, 105.70703125, 110.673828125, 115.640625, 120.607421875, 125.57421875, 130.541015625, 135.5078125, 140.474609375, 145.44140625, 150.408203125, 155.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 7.0, 12.0, 23.0, 33.0, 53.0, 72.0, 104.0, 248.0, 590.0, 1407.0, 5013.0, 162847.0, 2955788.0, 15637.0, 2225.0, 850.0, 357.0, 156.0, 91.0, 60.0, 37.0, 32.0, 18.0, 9.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.84375, -39.6142578125, -38.384765625, -37.1552734375, -35.92578125, -34.6962890625, -33.466796875, -32.2373046875, -31.0078125, -29.7783203125, -28.548828125, -27.3193359375, -26.08984375, -24.8603515625, -23.630859375, -22.4013671875, -21.171875, -19.9423828125, -18.712890625, -17.4833984375, -16.25390625, -15.0244140625, -13.794921875, -12.5654296875, -11.3359375, -10.1064453125, -8.876953125, -7.6474609375, -6.41796875, -5.1884765625, -3.958984375, -2.7294921875, -1.5, -0.2705078125, 0.958984375, 2.1884765625, 3.41796875, 4.6474609375, 5.876953125, 7.1064453125, 8.3359375, 9.5654296875, 10.794921875, 12.0244140625, 13.25390625, 14.4833984375, 15.712890625, 16.9423828125, 18.171875, 19.4013671875, 20.630859375, 21.8603515625, 23.08984375, 24.3193359375, 25.548828125, 26.7783203125, 28.0078125, 29.2373046875, 30.466796875, 31.6962890625, 32.92578125, 34.1552734375, 35.384765625, 36.6142578125, 37.84375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 16.0, 37.0, 70.0, 194.0, 354.0, 196.0, 67.0, 32.0, 10.0, 12.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.33833312988281, -79.69783020019531, -72.05732727050781, -64.41683197021484, -56.776329040527344, -49.135826110839844, -41.49532699584961, -33.854827880859375, -26.214324951171875, -18.573823928833008, -10.93332290649414, -3.2928218841552734, 4.347679138183594, 11.988182067871094, 19.628681182861328, 27.269180297851562, 34.90968322753906, 42.55018615722656, 50.1906852722168, 57.83118438720703, 65.47168731689453, 73.11219024658203, 80.752685546875, 88.3931884765625, 96.03369140625, 103.6741943359375, 111.314697265625, 118.95519256591797, 126.59569549560547, 134.2362060546875, 141.87669372558594, 149.51719665527344, 157.15768432617188, 164.79818725585938, 172.43869018554688, 180.07919311523438, 187.71969604492188, 195.36019897460938, 203.0006866455078, 210.6411895751953, 218.2816925048828, 225.9221954345703, 233.5626983642578, 241.2032012939453, 248.84368896484375, 256.48419189453125, 264.12469482421875, 271.76519775390625, 279.40570068359375, 287.04620361328125, 294.68670654296875, 302.32720947265625, 309.96771240234375, 317.60821533203125, 325.24871826171875, 332.88922119140625, 340.52972412109375, 348.17022705078125, 355.81072998046875, 363.45123291015625, 371.09173583984375, 378.73223876953125, 386.37274169921875, 394.01324462890625, 401.6537170410156]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 5.0, 7.0, 14.0, 16.0, 17.0, 17.0, 18.0, 22.0, 17.0, 37.0, 40.0, 39.0, 52.0, 50.0, 40.0, 52.0, 54.0, 49.0, 33.0, 37.0, 47.0, 52.0, 34.0, 28.0, 32.0, 27.0, 20.0, 20.0, 17.0, 14.0, 10.0, 7.0, 9.0, 11.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-96.98023986816406, -93.855224609375, -90.73020935058594, -87.60519409179688, -84.48017120361328, -81.35515594482422, -78.23014068603516, -75.1051254272461, -71.98011016845703, -68.85509490966797, -65.7300796508789, -62.60506057739258, -59.480045318603516, -56.35502624511719, -53.230010986328125, -50.10499572753906, -46.979976654052734, -43.85496139526367, -40.729942321777344, -37.60492706298828, -34.47991180419922, -31.354894638061523, -28.229877471923828, -25.104862213134766, -21.97984504699707, -18.854827880859375, -15.729812622070312, -12.604795455932617, -9.479779243469238, -6.354763031005859, -3.229745864868164, -0.10473060607910156, 3.0202865600585938, 6.145302772521973, 9.270318984985352, 12.395336151123047, 15.520352363586426, 18.645368576049805, 21.7703857421875, 24.895401000976562, 28.020418167114258, 31.145435333251953, 34.270450592041016, 37.395469665527344, 40.520484924316406, 43.64550018310547, 46.77051544189453, 49.895530700683594, 53.02054977416992, 56.145565032958984, 59.27058410644531, 62.395599365234375, 65.52061462402344, 68.6456298828125, 71.77064514160156, 74.89566040039062, 78.02068328857422, 81.14569854736328, 84.27071380615234, 87.39573669433594, 90.520751953125, 93.64576721191406, 96.77078247070312, 99.89579772949219, 103.02081298828125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 8.0, 9.0, 18.0, 30.0, 50.0, 57.0, 97.0, 160.0, 231.0, 346.0, 496.0, 721.0, 1221.0, 1041009.0, 1458.0, 876.0, 593.0, 392.0, 259.0, 180.0, 136.0, 76.0, 48.0, 33.0, 16.0, 14.0, 9.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.42410659790039, -38.71892547607422, -37.01374816894531, -35.30856704711914, -33.603389739990234, -31.898208618164062, -30.193029403686523, -28.487850189208984, -26.782670974731445, -25.077491760253906, -23.372312545776367, -21.667133331298828, -19.961952209472656, -18.25677490234375, -16.551593780517578, -14.846414566040039, -13.1412353515625, -11.436056137084961, -9.730876922607422, -8.025696754455566, -6.320517539978027, -4.615338325500488, -2.910158157348633, -1.2049789428710938, 0.5002002716064453, 2.2053797245025635, 3.9105591773986816, 5.615738868713379, 7.320918083190918, 9.026097297668457, 10.731277465820312, 12.436456680297852, 14.141632080078125, 15.846811294555664, 17.551990509033203, 19.257171630859375, 20.96234893798828, 22.667530059814453, 24.372709274291992, 26.07788848876953, 27.78306770324707, 29.48824691772461, 31.19342613220215, 32.89860534667969, 34.60378646850586, 36.308963775634766, 38.01414489746094, 39.719322204589844, 41.424503326416016, 43.12968444824219, 44.834861755371094, 46.540042877197266, 48.24522018432617, 49.950401306152344, 51.65557861328125, 53.36075973510742, 55.065940856933594, 56.771121978759766, 58.47629928588867, 60.181480407714844, 61.88665771484375, 63.59183883666992, 65.2970199584961, 67.002197265625, 68.7073745727539]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 12.0, 7.0, 9.0, 13.0, 29.0, 54.0, 425.0, 51462200.0, 191.0, 64.0, 27.0, 19.0, 7.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4720.0, -4518.69091796875, -4317.3818359375, -4116.07275390625, -3914.763671875, -3713.45458984375, -3512.1455078125, -3310.83642578125, -3109.52734375, -2908.21826171875, -2706.9091796875, -2505.60009765625, -2304.291015625, -2102.98193359375, -1901.6729736328125, -1700.3638916015625, -1499.054931640625, -1297.745849609375, -1096.436767578125, -895.1277465820312, -693.8186645507812, -492.50958251953125, -291.2005615234375, -89.8914794921875, 111.4176025390625, 312.7266845703125, 514.0357666015625, 715.3447875976562, 916.6538696289062, 1117.962890625, 1319.27197265625, 1520.5810546875, 1721.89013671875, 1923.19921875, 2124.50830078125, 2325.8173828125, 2527.12646484375, 2728.435546875, 2929.74462890625, 3131.0537109375, 3332.36279296875, 3533.671875, 3734.98095703125, 3936.2900390625, 4137.59912109375, 4338.908203125, 4540.21728515625, 4741.5263671875, 4942.8349609375, 5144.14404296875, 5345.453125, 5546.76220703125, 5748.0712890625, 5949.38037109375, 6150.689453125, 6351.99853515625, 6553.3076171875, 6754.61669921875, 6955.92578125, 7157.23486328125, 7358.5439453125, 7559.85302734375, 7761.162109375, 7962.47119140625, 8163.7802734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 12.0, 6.0, 13.0, 20.0, 21.0, 34.0, 51.0, 94.0, 121.0, 172.0, 271.0, 365.0, 599.0, 845.0, 1368.0, 2096.0, 3248.0, 5217.0, 8273.0, 13101.0, 21116.0, 34397.0, 57158.0, 98917.0, 175744.0, 340485.0, 1365169.0, 3323656.0, 378720.0, 193464.0, 106601.0, 62497.0, 37086.0, 22284.0, 13949.0, 8834.0, 5599.0, 3397.0, 2212.0, 1386.0, 915.0, 616.0, 424.0, 281.0, 202.0, 121.0, 72.0, 74.0, 55.0, 27.0, 14.0, 14.0, 12.0, 7.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.06640625, -4.9132080078125, -4.760009765625, -4.6068115234375, -4.45361328125, -4.3004150390625, -4.147216796875, -3.9940185546875, -3.8408203125, -3.6876220703125, -3.534423828125, -3.3812255859375, -3.22802734375, -3.0748291015625, -2.921630859375, -2.7684326171875, -2.615234375, -2.4620361328125, -2.308837890625, -2.1556396484375, -2.00244140625, -1.8492431640625, -1.696044921875, -1.5428466796875, -1.3896484375, -1.2364501953125, -1.083251953125, -0.9300537109375, -0.77685546875, -0.6236572265625, -0.470458984375, -0.3172607421875, -0.1640625, -0.0108642578125, 0.142333984375, 0.2955322265625, 0.44873046875, 0.6019287109375, 0.755126953125, 0.9083251953125, 1.0615234375, 1.2147216796875, 1.367919921875, 1.5211181640625, 1.67431640625, 1.8275146484375, 1.980712890625, 2.1339111328125, 2.287109375, 2.4403076171875, 2.593505859375, 2.7467041015625, 2.89990234375, 3.0531005859375, 3.206298828125, 3.3594970703125, 3.5126953125, 3.6658935546875, 3.819091796875, 3.9722900390625, 4.12548828125, 4.2786865234375, 4.431884765625, 4.5850830078125, 4.73828125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 9.0, 2.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 9.0, 20.0, 17.0, 27.0, 23.0, 29.0, 28.0, 31.0, 44.0, 34.0, 39.0, 50.0, 117.0, 355.0, 600.0, 101.0, 55.0, 40.0, 30.0, 34.0, 29.0, 37.0, 27.0, 27.0, 22.0, 18.0, 20.0, 17.0, 9.0, 12.0, 11.0, 8.0, 10.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.5703125, -11.1998291015625, -10.829345703125, -10.4588623046875, -10.08837890625, -9.7178955078125, -9.347412109375, -8.9769287109375, -8.6064453125, -8.2359619140625, -7.865478515625, -7.4949951171875, -7.12451171875, -6.7540283203125, -6.383544921875, -6.0130615234375, -5.642578125, -5.2720947265625, -4.901611328125, -4.5311279296875, -4.16064453125, -3.7901611328125, -3.419677734375, -3.0491943359375, -2.6787109375, -2.3082275390625, -1.937744140625, -1.5672607421875, -1.19677734375, -0.8262939453125, -0.455810546875, -0.0853271484375, 0.28515625, 0.6556396484375, 1.026123046875, 1.3966064453125, 1.76708984375, 2.1375732421875, 2.508056640625, 2.8785400390625, 3.2490234375, 3.6195068359375, 3.989990234375, 4.3604736328125, 4.73095703125, 5.1014404296875, 5.471923828125, 5.8424072265625, 6.212890625, 6.5833740234375, 6.953857421875, 7.3243408203125, 7.69482421875, 8.0653076171875, 8.435791015625, 8.8062744140625, 9.1767578125, 9.5472412109375, 9.917724609375, 10.2882080078125, 10.65869140625, 11.0291748046875, 11.399658203125, 11.7701416015625, 12.140625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 6.0, 11.0, 13.0, 22.0, 21.0, 55.0, 53.0, 120.0, 159.0, 326.0, 477.0, 773.0, 1331.0, 2328.0, 4158.0, 7435.0, 13803.0, 25708.0, 48981.0, 97003.0, 197367.0, 487541.0, 4177988.0, 730017.0, 250647.0, 118100.0, 58908.0, 30915.0, 16659.0, 8923.0, 4864.0, 2681.0, 1609.0, 913.0, 600.0, 342.0, 227.0, 132.0, 82.0, 40.0, 18.0, 19.0, 25.0, 16.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0], "bins": [-7.53515625, -7.31121826171875, -7.0872802734375, -6.86334228515625, -6.639404296875, -6.41546630859375, -6.1915283203125, -5.96759033203125, -5.74365234375, -5.51971435546875, -5.2957763671875, -5.07183837890625, -4.847900390625, -4.62396240234375, -4.4000244140625, -4.17608642578125, -3.9521484375, -3.72821044921875, -3.5042724609375, -3.28033447265625, -3.056396484375, -2.83245849609375, -2.6085205078125, -2.38458251953125, -2.16064453125, -1.93670654296875, -1.7127685546875, -1.48883056640625, -1.264892578125, -1.04095458984375, -0.8170166015625, -0.59307861328125, -0.369140625, -0.14520263671875, 0.0787353515625, 0.30267333984375, 0.526611328125, 0.75054931640625, 0.9744873046875, 1.19842529296875, 1.42236328125, 1.64630126953125, 1.8702392578125, 2.09417724609375, 2.318115234375, 2.54205322265625, 2.7659912109375, 2.98992919921875, 3.2138671875, 3.43780517578125, 3.6617431640625, 3.88568115234375, 4.109619140625, 4.33355712890625, 4.5574951171875, 4.78143310546875, 5.00537109375, 5.22930908203125, 5.4532470703125, 5.67718505859375, 5.901123046875, 6.12506103515625, 6.3489990234375, 6.57293701171875, 6.796875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 12.0, 10.0, 12.0, 10.0, 19.0, 21.0, 24.0, 26.0, 26.0, 29.0, 44.0, 36.0, 42.0, 62.0, 67.0, 215.0, 624.0, 220.0, 81.0, 65.0, 46.0, 43.0, 28.0, 36.0, 32.0, 27.0, 29.0, 24.0, 19.0, 20.0, 14.0, 17.0, 10.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5546875, -9.2708740234375, -8.987060546875, -8.7032470703125, -8.41943359375, -8.1356201171875, -7.851806640625, -7.5679931640625, -7.2841796875, -7.0003662109375, -6.716552734375, -6.4327392578125, -6.14892578125, -5.8651123046875, -5.581298828125, -5.2974853515625, -5.013671875, -4.7298583984375, -4.446044921875, -4.1622314453125, -3.87841796875, -3.5946044921875, -3.310791015625, -3.0269775390625, -2.7431640625, -2.4593505859375, -2.175537109375, -1.8917236328125, -1.60791015625, -1.3240966796875, -1.040283203125, -0.7564697265625, -0.47265625, -0.1888427734375, 0.094970703125, 0.3787841796875, 0.66259765625, 0.9464111328125, 1.230224609375, 1.5140380859375, 1.7978515625, 2.0816650390625, 2.365478515625, 2.6492919921875, 2.93310546875, 3.2169189453125, 3.500732421875, 3.7845458984375, 4.068359375, 4.3521728515625, 4.635986328125, 4.9197998046875, 5.20361328125, 5.4874267578125, 5.771240234375, 6.0550537109375, 6.3388671875, 6.6226806640625, 6.906494140625, 7.1903076171875, 7.47412109375, 7.7579345703125, 8.041748046875, 8.3255615234375, 8.609375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 7.0, 5.0, 7.0, 18.0, 1.0, 5.0, 34.0, 33.0, 31.0, 30.0, 64.0, 66.0, 89.0, 118.0, 146.0, 196.0, 250.0, 299.0, 443.0, 562.0, 860.0, 1045.0, 1550.0, 2413.0, 3574.0, 6380.0, 12575.0, 28197.0, 86109.0, 5842378.0, 215349.0, 46719.0, 18404.0, 8920.0, 4907.0, 2859.0, 1835.0, 1389.0, 847.0, 685.0, 450.0, 382.0, 247.0, 220.0, 165.0, 129.0, 104.0, 89.0, 49.0, 48.0, 46.0, 13.0, 14.0, 26.0, 21.0, 23.0, 14.0, 1.0, 3.0, 9.0], "bins": [-16.90625, -16.4053955078125, -15.904541015625, -15.4036865234375, -14.90283203125, -14.4019775390625, -13.901123046875, -13.4002685546875, -12.8994140625, -12.3985595703125, -11.897705078125, -11.3968505859375, -10.89599609375, -10.3951416015625, -9.894287109375, -9.3934326171875, -8.892578125, -8.3917236328125, -7.890869140625, -7.3900146484375, -6.88916015625, -6.3883056640625, -5.887451171875, -5.3865966796875, -4.8857421875, -4.3848876953125, -3.884033203125, -3.3831787109375, -2.88232421875, -2.3814697265625, -1.880615234375, -1.3797607421875, -0.87890625, -0.3780517578125, 0.122802734375, 0.6236572265625, 1.12451171875, 1.6253662109375, 2.126220703125, 2.6270751953125, 3.1279296875, 3.6287841796875, 4.129638671875, 4.6304931640625, 5.13134765625, 5.6322021484375, 6.133056640625, 6.6339111328125, 7.134765625, 7.6356201171875, 8.136474609375, 8.6373291015625, 9.13818359375, 9.6390380859375, 10.139892578125, 10.6407470703125, 11.1416015625, 11.6424560546875, 12.143310546875, 12.6441650390625, 13.14501953125, 13.6458740234375, 14.146728515625, 14.6475830078125, 15.1484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 6.0, 9.0, 7.0, 7.0, 17.0, 7.0, 12.0, 15.0, 18.0, 18.0, 19.0, 27.0, 36.0, 31.0, 36.0, 52.0, 53.0, 70.0, 114.0, 212.0, 443.0, 236.0, 107.0, 72.0, 54.0, 42.0, 30.0, 34.0, 39.0, 25.0, 25.0, 24.0, 14.0, 21.0, 10.0, 13.0, 16.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.94140625, -5.76544189453125, -5.5894775390625, -5.41351318359375, -5.237548828125, -5.06158447265625, -4.8856201171875, -4.70965576171875, -4.53369140625, -4.35772705078125, -4.1817626953125, -4.00579833984375, -3.829833984375, -3.65386962890625, -3.4779052734375, -3.30194091796875, -3.1259765625, -2.95001220703125, -2.7740478515625, -2.59808349609375, -2.422119140625, -2.24615478515625, -2.0701904296875, -1.89422607421875, -1.71826171875, -1.54229736328125, -1.3663330078125, -1.19036865234375, -1.014404296875, -0.83843994140625, -0.6624755859375, -0.48651123046875, -0.310546875, -0.13458251953125, 0.0413818359375, 0.21734619140625, 0.393310546875, 0.56927490234375, 0.7452392578125, 0.92120361328125, 1.09716796875, 1.27313232421875, 1.4490966796875, 1.62506103515625, 1.801025390625, 1.97698974609375, 2.1529541015625, 2.32891845703125, 2.5048828125, 2.68084716796875, 2.8568115234375, 3.03277587890625, 3.208740234375, 3.38470458984375, 3.5606689453125, 3.73663330078125, 3.91259765625, 4.08856201171875, 4.2645263671875, 4.44049072265625, 4.616455078125, 4.79241943359375, 4.9683837890625, 5.14434814453125, 5.3203125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 9.0, 16.0, 72.0, 251.0, 535.0, 92.0, 23.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-100.04877471923828, -98.23719787597656, -96.42562103271484, -94.6140365600586, -92.80245971679688, -90.99088287353516, -89.17930603027344, -87.36772918701172, -85.55615234375, -83.74457550048828, -81.93299865722656, -80.12141418457031, -78.3098373413086, -76.49826049804688, -74.68668365478516, -72.87510681152344, -71.06352233886719, -69.25194549560547, -67.44036865234375, -65.6287841796875, -63.81720733642578, -62.00563049316406, -60.194053649902344, -58.382476806640625, -56.57089614868164, -54.75931930541992, -52.94773864746094, -51.13616180419922, -49.3245849609375, -47.513004302978516, -45.7014274597168, -43.88984680175781, -42.07827377319336, -40.26669692993164, -38.455116271972656, -36.64353942871094, -34.83196258544922, -33.020381927490234, -31.208805084228516, -29.397226333618164, -27.585647583007812, -25.77406883239746, -23.96249008178711, -22.15091323852539, -20.33933448791504, -18.527755737304688, -16.71617889404297, -14.904600143432617, -13.093021392822266, -11.281442642211914, -9.469864845275879, -7.6582865715026855, -5.846708297729492, -4.035129547119141, -2.2235517501831055, -0.4119739532470703, 1.3996047973632812, 3.2111830711364746, 5.022761344909668, 6.834339618682861, 8.645917892456055, 10.457496643066406, 12.269074440002441, 14.080652236938477, 15.892230987548828]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 5.0, 5.0, 7.0, 13.0, 22.0, 14.0, 19.0, 32.0, 27.0, 29.0, 27.0, 38.0, 45.0, 43.0, 38.0, 41.0, 54.0, 49.0, 46.0, 33.0, 59.0, 43.0, 37.0, 41.0, 44.0, 22.0, 28.0, 26.0, 22.0, 28.0, 17.0, 14.0, 9.0, 8.0, 7.0, 3.0, 1.0, 8.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.205036163330078, -8.905710220336914, -8.60638427734375, -8.307058334350586, -8.007732391357422, -7.708406925201416, -7.409080982208252, -7.109755516052246, -6.810429573059082, -6.511103630065918, -6.211777687072754, -5.91245174407959, -5.613126277923584, -5.31380033493042, -5.014474391937256, -4.71514892578125, -4.415822505950928, -4.116496562957764, -3.8171708583831787, -3.5178449153900146, -3.2185192108154297, -2.9191932678222656, -2.6198673248291016, -2.3205416202545166, -2.0212156772613525, -1.721889853477478, -1.4225640296936035, -1.1232380867004395, -0.8239122629165649, -0.5245864391326904, -0.22526049613952637, 0.0740652084350586, 0.37339115142822266, 0.6727169752120972, 0.9720428586006165, 1.2713687419891357, 1.5706945657730103, 1.8700203895568848, 2.169346332550049, 2.468672037124634, 2.767997980117798, 3.067323923110962, 3.366649627685547, 3.665975570678711, 3.965301513671875, 4.264627456665039, 4.563953399658203, 4.863278865814209, 5.162604808807373, 5.461930751800537, 5.761256694793701, 6.060582160949707, 6.359908103942871, 6.659234046936035, 6.958559989929199, 7.257885932922363, 7.557211875915527, 7.856537818908691, 8.155863761901855, 8.45518970489502, 8.754515647888184, 9.053840637207031, 9.353166580200195, 9.65249252319336, 9.951818466186523]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 5.0, 8.0, 14.0, 19.0, 23.0, 26.0, 45.0, 59.0, 79.0, 144.0, 223.0, 348.0, 572.0, 959.0, 1741.0, 3219.0, 7224.0, 21686.0, 3264130.0, 858073.0, 22007.0, 7435.0, 3115.0, 1447.0, 696.0, 360.0, 210.0, 139.0, 74.0, 51.0, 33.0, 28.0, 21.0, 14.0, 9.0, 4.0, 6.0, 5.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.035125732421875, -0.03412199020385742, -0.033118247985839844, -0.032114505767822266, -0.031110763549804688, -0.03010702133178711, -0.02910327911376953, -0.028099536895751953, -0.027095794677734375, -0.026092052459716797, -0.02508831024169922, -0.02408456802368164, -0.023080825805664062, -0.022077083587646484, -0.021073341369628906, -0.020069599151611328, -0.01906585693359375, -0.018062114715576172, -0.017058372497558594, -0.016054630279541016, -0.015050888061523438, -0.01404714584350586, -0.013043403625488281, -0.012039661407470703, -0.011035919189453125, -0.010032176971435547, -0.009028434753417969, -0.00802469253540039, -0.0070209503173828125, -0.006017208099365234, -0.005013465881347656, -0.004009723663330078, -0.0030059814453125, -0.002002239227294922, -0.0009984970092773438, 5.245208740234375e-06, 0.0010089874267578125, 0.0020127296447753906, 0.0030164718627929688, 0.004020214080810547, 0.005023956298828125, 0.006027698516845703, 0.007031440734863281, 0.00803518295288086, 0.009038925170898438, 0.010042667388916016, 0.011046409606933594, 0.012050151824951172, 0.01305389404296875, 0.014057636260986328, 0.015061378479003906, 0.016065120697021484, 0.017068862915039062, 0.01807260513305664, 0.01907634735107422, 0.020080089569091797, 0.021083831787109375, 0.022087574005126953, 0.02309131622314453, 0.02409505844116211, 0.025098800659179688, 0.026102542877197266, 0.027106285095214844, 0.028110027313232422, 0.02911376953125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 6.0, 10.0, 6.0, 10.0, 6.0, 11.0, 14.0, 79.0, 499.0, 223.0, 23.0, 8.0, 9.0, 8.0, 10.0, 5.0, 11.0, 8.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0016803741455078125, -0.0016288608312606812, -0.0015773475170135498, -0.0015258342027664185, -0.0014743208885192871, -0.0014228075742721558, -0.0013712942600250244, -0.001319780945777893, -0.0012682676315307617, -0.0012167543172836304, -0.001165241003036499, -0.0011137276887893677, -0.0010622143745422363, -0.001010701060295105, -0.0009591877460479736, -0.0009076744318008423, -0.0008561611175537109, -0.0008046478033065796, -0.0007531344890594482, -0.0007016211748123169, -0.0006501078605651855, -0.0005985945463180542, -0.0005470812320709229, -0.0004955679178237915, -0.00044405460357666016, -0.0003925412893295288, -0.00034102797508239746, -0.0002895146608352661, -0.00023800134658813477, -0.00018648803234100342, -0.00013497471809387207, -8.346140384674072e-05, -3.1948089599609375e-05, 1.9565224647521973e-05, 7.107853889465332e-05, 0.00012259185314178467, 0.00017410516738891602, 0.00022561848163604736, 0.0002771317958831787, 0.00032864511013031006, 0.0003801584243774414, 0.00043167173862457275, 0.0004831850528717041, 0.0005346983671188354, 0.0005862116813659668, 0.0006377249956130981, 0.0006892383098602295, 0.0007407516241073608, 0.0007922649383544922, 0.0008437782526016235, 0.0008952915668487549, 0.0009468048810958862, 0.0009983181953430176, 0.001049831509590149, 0.0011013448238372803, 0.0011528581380844116, 0.001204371452331543, 0.0012558847665786743, 0.0013073980808258057, 0.001358911395072937, 0.0014104247093200684, 0.0014619380235671997, 0.001513451337814331, 0.0015649646520614624, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 14.0, 11.0, 9.0, 11.0, 19.0, 20.0, 31.0, 48.0, 78.0, 144.0, 213.0, 374.0, 689.0, 1334.0, 3684.0, 16811.0, 771253.0, 3372090.0, 20338.0, 3981.0, 1446.0, 680.0, 393.0, 217.0, 129.0, 75.0, 64.0, 34.0, 31.0, 13.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043060302734375, -0.041407108306884766, -0.03975391387939453, -0.0381007194519043, -0.03644752502441406, -0.03479433059692383, -0.033141136169433594, -0.03148794174194336, -0.029834747314453125, -0.02818155288696289, -0.026528358459472656, -0.024875164031982422, -0.023221969604492188, -0.021568775177001953, -0.01991558074951172, -0.018262386322021484, -0.01660919189453125, -0.014955997467041016, -0.013302803039550781, -0.011649608612060547, -0.009996414184570312, -0.008343219757080078, -0.006690025329589844, -0.005036830902099609, -0.003383636474609375, -0.0017304420471191406, -7.724761962890625e-05, 0.0015759468078613281, 0.0032291412353515625, 0.004882335662841797, 0.006535530090332031, 0.008188724517822266, 0.0098419189453125, 0.011495113372802734, 0.013148307800292969, 0.014801502227783203, 0.016454696655273438, 0.018107891082763672, 0.019761085510253906, 0.02141427993774414, 0.023067474365234375, 0.02472066879272461, 0.026373863220214844, 0.028027057647705078, 0.029680252075195312, 0.03133344650268555, 0.03298664093017578, 0.034639835357666016, 0.03629302978515625, 0.037946224212646484, 0.03959941864013672, 0.04125261306762695, 0.04290580749511719, 0.04455900192260742, 0.046212196350097656, 0.04786539077758789, 0.049518585205078125, 0.05117177963256836, 0.052824974060058594, 0.05447816848754883, 0.05613136291503906, 0.0577845573425293, 0.05943775177001953, 0.061090946197509766, 0.062744140625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 11.0, 15.0, 20.0, 24.0, 23.0, 41.0, 44.0, 54.0, 68.0, 99.0, 128.0, 175.0, 298.0, 1478.0, 699.0, 233.0, 166.0, 122.0, 71.0, 66.0, 59.0, 33.0, 29.0, 28.0, 16.0, 12.0, 17.0, 9.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0033664703369140625, -0.0032411515712738037, -0.003115832805633545, -0.002990514039993286, -0.0028651952743530273, -0.0027398765087127686, -0.0026145577430725098, -0.002489238977432251, -0.002363920211791992, -0.0022386014461517334, -0.0021132826805114746, -0.001987963914871216, -0.001862645149230957, -0.0017373263835906982, -0.0016120076179504395, -0.0014866888523101807, -0.0013613700866699219, -0.001236051321029663, -0.0011107325553894043, -0.0009854137897491455, -0.0008600950241088867, -0.0007347762584686279, -0.0006094574928283691, -0.00048413872718811035, -0.00035881996154785156, -0.00023350119590759277, -0.00010818243026733398, 1.7136335372924805e-05, 0.0001424551010131836, 0.0002677738666534424, 0.00039309263229370117, 0.00051841139793396, 0.0006437301635742188, 0.0007690489292144775, 0.0008943676948547363, 0.0010196864604949951, 0.001145005226135254, 0.0012703239917755127, 0.0013956427574157715, 0.0015209615230560303, 0.001646280288696289, 0.0017715990543365479, 0.0018969178199768066, 0.0020222365856170654, 0.0021475553512573242, 0.002272874116897583, 0.002398192882537842, 0.0025235116481781006, 0.0026488304138183594, 0.002774149179458618, 0.002899467945098877, 0.0030247867107391357, 0.0031501054763793945, 0.0032754242420196533, 0.003400743007659912, 0.003526061773300171, 0.0036513805389404297, 0.0037766993045806885, 0.0039020180702209473, 0.004027336835861206, 0.004152655601501465, 0.004277974367141724, 0.004403293132781982, 0.004528611898422241, 0.0046539306640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 10.0, 18.0, 66.0, 231.0, 472.0, 136.0, 39.0, 13.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0440877303481102, -0.04168759286403656, -0.03928745537996292, -0.03688731789588928, -0.03448718041181564, -0.032087042927742004, -0.029686905443668365, -0.027286767959594727, -0.024886630475521088, -0.02248649299144745, -0.02008635550737381, -0.01768621802330017, -0.015286080539226532, -0.012885943055152893, -0.010485805571079254, -0.008085668087005615, -0.005685530602931976, -0.0032853931188583374, -0.0008852556347846985, 0.0015148818492889404, 0.003915019333362579, 0.006315156817436218, 0.008715294301509857, 0.011115431785583496, 0.013515569269657135, 0.015915706753730774, 0.018315844237804413, 0.020715981721878052, 0.02311611920595169, 0.02551625669002533, 0.02791639417409897, 0.030316531658172607, 0.03271667659282684, 0.03511681407690048, 0.03751695156097412, 0.03991708904504776, 0.0423172265291214, 0.04471736401319504, 0.04711750149726868, 0.049517638981342316, 0.051917776465415955, 0.054317913949489594, 0.05671805143356323, 0.05911818891763687, 0.06151832640171051, 0.06391846388578415, 0.06631860136985779, 0.06871873885393143, 0.07111887633800507, 0.0735190138220787, 0.07591915130615234, 0.07831928879022598, 0.08071942627429962, 0.08311956375837326, 0.0855197012424469, 0.08791983872652054, 0.09031997621059418, 0.09272011369466782, 0.09512025117874146, 0.0975203886628151, 0.09992052614688873, 0.10232066363096237, 0.10472080111503601, 0.10712093859910965, 0.10952107608318329]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 13.0, 9.0, 21.0, 24.0, 33.0, 25.0, 35.0, 37.0, 53.0, 45.0, 47.0, 54.0, 61.0, 43.0, 60.0, 36.0, 48.0, 45.0, 55.0, 44.0, 29.0, 31.0, 28.0, 20.0, 21.0, 12.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.013874709606170654, -0.013360245153307915, -0.012845780700445175, -0.012331316247582436, -0.011816851794719696, -0.011302387341856956, -0.010787922888994217, -0.010273458436131477, -0.009758993983268738, -0.009244529530405998, -0.008730065077543259, -0.008215600624680519, -0.0077011361718177795, -0.00718667171895504, -0.0066722072660923, -0.006157742813229561, -0.005643278360366821, -0.005128813907504082, -0.004614349454641342, -0.004099885001778603, -0.003585420548915863, -0.0030709560960531235, -0.002556491643190384, -0.0020420271903276443, -0.0015275627374649048, -0.0010130982846021652, -0.0004986338317394257, 1.5830621123313904e-05, 0.0005302950739860535, 0.001044759526848793, 0.0015592239797115326, 0.002073688432574272, 0.0025881528854370117, 0.0031026173382997513, 0.003617081791162491, 0.00413154624402523, 0.00464601069688797, 0.0051604751497507095, 0.005674939602613449, 0.006189404055476189, 0.006703868508338928, 0.007218332961201668, 0.007732797414064407, 0.008247261866927147, 0.008761726319789886, 0.009276190772652626, 0.009790655225515366, 0.010305119678378105, 0.010819584131240845, 0.011334048584103584, 0.011848513036966324, 0.012362977489829063, 0.012877441942691803, 0.013391906395554543, 0.013906370848417282, 0.014420835301280022, 0.014935299754142761, 0.0154497642070055, 0.01596422865986824, 0.01647869311273098, 0.01699315756559372, 0.01750762201845646, 0.0180220864713192, 0.018536550924181938, 0.019051015377044678]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 6.0, 6.0, 12.0, 20.0, 23.0, 19.0, 32.0, 43.0, 57.0, 80.0, 89.0, 141.0, 195.0, 277.0, 333.0, 544.0, 732.0, 1039.0, 1465.0, 2224.0, 3380.0, 5384.0, 8461.0, 15292.0, 34971.0, 819884.0, 100946.0, 21920.0, 11352.0, 6620.0, 4237.0, 2709.0, 1807.0, 1241.0, 843.0, 604.0, 420.0, 284.0, 232.0, 166.0, 138.0, 95.0, 62.0, 36.0, 38.0, 24.0, 17.0, 17.0, 9.0, 7.0, 8.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0], "bins": [-0.01934814453125, -0.018757343292236328, -0.018166542053222656, -0.017575740814208984, -0.016984939575195312, -0.01639413833618164, -0.01580333709716797, -0.015212535858154297, -0.014621734619140625, -0.014030933380126953, -0.013440132141113281, -0.01284933090209961, -0.012258529663085938, -0.011667728424072266, -0.011076927185058594, -0.010486125946044922, -0.00989532470703125, -0.009304523468017578, -0.008713722229003906, -0.008122920989990234, -0.0075321197509765625, -0.006941318511962891, -0.006350517272949219, -0.005759716033935547, -0.005168914794921875, -0.004578113555908203, -0.003987312316894531, -0.0033965110778808594, -0.0028057098388671875, -0.0022149085998535156, -0.0016241073608398438, -0.0010333061218261719, -0.0004425048828125, 0.00014829635620117188, 0.0007390975952148438, 0.0013298988342285156, 0.0019207000732421875, 0.0025115013122558594, 0.0031023025512695312, 0.003693103790283203, 0.004283905029296875, 0.004874706268310547, 0.005465507507324219, 0.006056308746337891, 0.0066471099853515625, 0.007237911224365234, 0.007828712463378906, 0.008419513702392578, 0.00901031494140625, 0.009601116180419922, 0.010191917419433594, 0.010782718658447266, 0.011373519897460938, 0.01196432113647461, 0.012555122375488281, 0.013145923614501953, 0.013736724853515625, 0.014327526092529297, 0.014918327331542969, 0.01550912857055664, 0.016099929809570312, 0.016690731048583984, 0.017281532287597656, 0.017872333526611328, 0.018463134765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 9.0, 7.0, 9.0, 13.0, 11.0, 65.0, 333.0, 341.0, 72.0, 19.0, 7.0, 11.0, 7.0, 9.0, 12.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0017604827880859375, -0.001710057258605957, -0.0016596317291259766, -0.001609206199645996, -0.0015587806701660156, -0.0015083551406860352, -0.0014579296112060547, -0.0014075040817260742, -0.0013570785522460938, -0.0013066530227661133, -0.0012562274932861328, -0.0012058019638061523, -0.0011553764343261719, -0.0011049509048461914, -0.001054525375366211, -0.0010040998458862305, -0.00095367431640625, -0.0009032487869262695, -0.0008528232574462891, -0.0008023977279663086, -0.0007519721984863281, -0.0007015466690063477, -0.0006511211395263672, -0.0006006956100463867, -0.0005502700805664062, -0.0004998445510864258, -0.0004494190216064453, -0.00039899349212646484, -0.0003485679626464844, -0.0002981424331665039, -0.00024771690368652344, -0.00019729137420654297, -0.0001468658447265625, -9.644031524658203e-05, -4.601478576660156e-05, 4.410743713378906e-06, 5.4836273193359375e-05, 0.00010526180267333984, 0.0001556873321533203, 0.00020611286163330078, 0.00025653839111328125, 0.0003069639205932617, 0.0003573894500732422, 0.00040781497955322266, 0.0004582405090332031, 0.0005086660385131836, 0.0005590915679931641, 0.0006095170974731445, 0.000659942626953125, 0.0007103681564331055, 0.0007607936859130859, 0.0008112192153930664, 0.0008616447448730469, 0.0009120702743530273, 0.0009624958038330078, 0.0010129213333129883, 0.0010633468627929688, 0.0011137723922729492, 0.0011641979217529297, 0.0012146234512329102, 0.0012650489807128906, 0.001315474510192871, 0.0013659000396728516, 0.001416325569152832, 0.0014667510986328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 16.0, 9.0, 19.0, 25.0, 24.0, 40.0, 39.0, 67.0, 66.0, 107.0, 188.0, 253.0, 307.0, 511.0, 791.0, 1293.0, 2166.0, 4475.0, 11437.0, 57456.0, 854643.0, 88800.0, 14125.0, 5240.0, 2424.0, 1380.0, 849.0, 517.0, 331.0, 233.0, 206.0, 133.0, 79.0, 71.0, 53.0, 43.0, 29.0, 19.0, 19.0, 10.0, 15.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.0357666015625, -0.034668922424316406, -0.03357124328613281, -0.03247356414794922, -0.031375885009765625, -0.03027820587158203, -0.029180526733398438, -0.028082847595214844, -0.02698516845703125, -0.025887489318847656, -0.024789810180664062, -0.02369213104248047, -0.022594451904296875, -0.02149677276611328, -0.020399093627929688, -0.019301414489746094, -0.0182037353515625, -0.017106056213378906, -0.016008377075195312, -0.014910697937011719, -0.013813018798828125, -0.012715339660644531, -0.011617660522460938, -0.010519981384277344, -0.00942230224609375, -0.008324623107910156, -0.0072269439697265625, -0.006129264831542969, -0.005031585693359375, -0.003933906555175781, -0.0028362274169921875, -0.0017385482788085938, -0.000640869140625, 0.00045680999755859375, 0.0015544891357421875, 0.0026521682739257812, 0.003749847412109375, 0.004847526550292969, 0.0059452056884765625, 0.007042884826660156, 0.00814056396484375, 0.009238243103027344, 0.010335922241210938, 0.011433601379394531, 0.012531280517578125, 0.013628959655761719, 0.014726638793945312, 0.015824317932128906, 0.0169219970703125, 0.018019676208496094, 0.019117355346679688, 0.02021503448486328, 0.021312713623046875, 0.02241039276123047, 0.023508071899414062, 0.024605751037597656, 0.02570343017578125, 0.026801109313964844, 0.027898788452148438, 0.02899646759033203, 0.030094146728515625, 0.03119182586669922, 0.03228950500488281, 0.033387184143066406, 0.03448486328125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 6.0, 14.0, 11.0, 9.0, 12.0, 11.0, 18.0, 21.0, 28.0, 26.0, 30.0, 23.0, 41.0, 39.0, 37.0, 40.0, 46.0, 42.0, 39.0, 40.0, 37.0, 34.0, 47.0, 42.0, 41.0, 30.0, 26.0, 31.0, 40.0, 21.0, 18.0, 15.0, 17.0, 13.0, 7.0, 10.0, 6.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007640838623046875, -0.00741344690322876, -0.0071860551834106445, -0.006958663463592529, -0.006731271743774414, -0.006503880023956299, -0.006276488304138184, -0.006049096584320068, -0.005821704864501953, -0.005594313144683838, -0.005366921424865723, -0.005139529705047607, -0.004912137985229492, -0.004684746265411377, -0.004457354545593262, -0.0042299628257751465, -0.004002571105957031, -0.003775179386138916, -0.0035477876663208008, -0.0033203959465026855, -0.0030930042266845703, -0.002865612506866455, -0.00263822078704834, -0.0024108290672302246, -0.0021834373474121094, -0.001956045627593994, -0.001728653907775879, -0.0015012621879577637, -0.0012738704681396484, -0.0010464787483215332, -0.000819087028503418, -0.0005916953086853027, -0.0003643035888671875, -0.00013691186904907227, 9.047985076904297e-05, 0.0003178715705871582, 0.0005452632904052734, 0.0007726550102233887, 0.001000046730041504, 0.0012274384498596191, 0.0014548301696777344, 0.0016822218894958496, 0.0019096136093139648, 0.00213700532913208, 0.0023643970489501953, 0.0025917887687683105, 0.0028191804885864258, 0.003046572208404541, 0.0032739639282226562, 0.0035013556480407715, 0.0037287473678588867, 0.003956139087677002, 0.004183530807495117, 0.004410922527313232, 0.004638314247131348, 0.004865705966949463, 0.005093097686767578, 0.005320489406585693, 0.005547881126403809, 0.005775272846221924, 0.006002664566040039, 0.006230056285858154, 0.0064574480056762695, 0.006684839725494385, 0.0069122314453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 4.0, 9.0, 10.0, 8.0, 21.0, 42.0, 44.0, 86.0, 208.0, 671.0, 4318.0, 896820.0, 142225.0, 3062.0, 609.0, 164.0, 86.0, 39.0, 23.0, 12.0, 20.0, 12.0, 5.0, 10.0, 11.0, 1.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0294189453125, -0.02868199348449707, -0.02794504165649414, -0.02720808982849121, -0.02647113800048828, -0.02573418617248535, -0.024997234344482422, -0.024260282516479492, -0.023523330688476562, -0.022786378860473633, -0.022049427032470703, -0.021312475204467773, -0.020575523376464844, -0.019838571548461914, -0.019101619720458984, -0.018364667892456055, -0.017627716064453125, -0.016890764236450195, -0.016153812408447266, -0.015416860580444336, -0.014679908752441406, -0.013942956924438477, -0.013206005096435547, -0.012469053268432617, -0.011732101440429688, -0.010995149612426758, -0.010258197784423828, -0.009521245956420898, -0.008784294128417969, -0.008047342300415039, -0.007310390472412109, -0.00657343864440918, -0.00583648681640625, -0.00509953498840332, -0.004362583160400391, -0.003625631332397461, -0.0028886795043945312, -0.0021517276763916016, -0.0014147758483886719, -0.0006778240203857422, 5.91278076171875e-05, 0.0007960796356201172, 0.0015330314636230469, 0.0022699832916259766, 0.0030069351196289062, 0.003743886947631836, 0.004480838775634766, 0.005217790603637695, 0.005954742431640625, 0.006691694259643555, 0.007428646087646484, 0.008165597915649414, 0.008902549743652344, 0.009639501571655273, 0.010376453399658203, 0.011113405227661133, 0.011850357055664062, 0.012587308883666992, 0.013324260711669922, 0.014061212539672852, 0.014798164367675781, 0.015535116195678711, 0.01627206802368164, 0.01700901985168457, 0.0177459716796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 14.0, 10.0, 16.0, 24.0, 37.0, 57.0, 89.0, 110.0, 125.0, 124.0, 114.0, 77.0, 63.0, 30.0, 35.0, 22.0, 7.0, 10.0, 13.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0471553802490234e-05, -3.940518945455551e-05, -3.833882510662079e-05, -3.7272460758686066e-05, -3.620609641075134e-05, -3.513973206281662e-05, -3.40733677148819e-05, -3.3007003366947174e-05, -3.194063901901245e-05, -3.087427467107773e-05, -2.9807910323143005e-05, -2.8741545975208282e-05, -2.767518162727356e-05, -2.6608817279338837e-05, -2.5542452931404114e-05, -2.447608858346939e-05, -2.3409724235534668e-05, -2.2343359887599945e-05, -2.1276995539665222e-05, -2.02106311917305e-05, -1.9144266843795776e-05, -1.8077902495861053e-05, -1.701153814792633e-05, -1.5945173799991608e-05, -1.4878809452056885e-05, -1.3812445104122162e-05, -1.2746080756187439e-05, -1.1679716408252716e-05, -1.0613352060317993e-05, -9.54698771238327e-06, -8.480623364448547e-06, -7.4142590165138245e-06, -6.3478946685791016e-06, -5.281530320644379e-06, -4.215165972709656e-06, -3.148801624774933e-06, -2.08243727684021e-06, -1.016072928905487e-06, 5.029141902923584e-08, 1.1166557669639587e-06, 2.1830201148986816e-06, 3.2493844628334045e-06, 4.3157488107681274e-06, 5.38211315870285e-06, 6.448477506637573e-06, 7.514841854572296e-06, 8.581206202507019e-06, 9.647570550441742e-06, 1.0713934898376465e-05, 1.1780299246311188e-05, 1.284666359424591e-05, 1.3913027942180634e-05, 1.4979392290115356e-05, 1.604575663805008e-05, 1.7112120985984802e-05, 1.8178485333919525e-05, 1.9244849681854248e-05, 2.031121402978897e-05, 2.1377578377723694e-05, 2.2443942725658417e-05, 2.351030707359314e-05, 2.4576671421527863e-05, 2.5643035769462585e-05, 2.670940011739731e-05, 2.777576446533203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 4.0, 6.0, 11.0, 12.0, 15.0, 44.0, 57.0, 81.0, 111.0, 179.0, 293.0, 496.0, 993.0, 2428.0, 9335.0, 769458.0, 252584.0, 8059.0, 2137.0, 934.0, 508.0, 288.0, 157.0, 92.0, 69.0, 51.0, 42.0, 31.0, 13.0, 18.0, 7.0, 8.0, 4.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0278778076171875, -0.027005434036254883, -0.026133060455322266, -0.02526068687438965, -0.02438831329345703, -0.023515939712524414, -0.022643566131591797, -0.02177119255065918, -0.020898818969726562, -0.020026445388793945, -0.019154071807861328, -0.01828169822692871, -0.017409324645996094, -0.016536951065063477, -0.01566457748413086, -0.014792203903198242, -0.013919830322265625, -0.013047456741333008, -0.01217508316040039, -0.011302709579467773, -0.010430335998535156, -0.009557962417602539, -0.008685588836669922, -0.007813215255737305, -0.0069408416748046875, -0.00606846809387207, -0.005196094512939453, -0.004323720932006836, -0.0034513473510742188, -0.0025789737701416016, -0.0017066001892089844, -0.0008342266082763672, 3.814697265625e-05, 0.0009105205535888672, 0.0017828941345214844, 0.0026552677154541016, 0.0035276412963867188, 0.004400014877319336, 0.005272388458251953, 0.00614476203918457, 0.0070171356201171875, 0.007889509201049805, 0.008761882781982422, 0.009634256362915039, 0.010506629943847656, 0.011379003524780273, 0.01225137710571289, 0.013123750686645508, 0.013996124267578125, 0.014868497848510742, 0.01574087142944336, 0.016613245010375977, 0.017485618591308594, 0.01835799217224121, 0.019230365753173828, 0.020102739334106445, 0.020975112915039062, 0.02184748649597168, 0.022719860076904297, 0.023592233657836914, 0.02446460723876953, 0.02533698081970215, 0.026209354400634766, 0.027081727981567383, 0.0279541015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 3.0, 4.0, 2.0, 5.0, 2.0, 4.0, 4.0, 12.0, 12.0, 14.0, 22.0, 23.0, 34.0, 51.0, 74.0, 141.0, 195.0, 162.0, 81.0, 33.0, 32.0, 28.0, 17.0, 11.0, 7.0, 7.0, 6.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00684356689453125, -0.006638944149017334, -0.006434321403503418, -0.006229698657989502, -0.006025075912475586, -0.00582045316696167, -0.005615830421447754, -0.005411207675933838, -0.005206584930419922, -0.005001962184906006, -0.00479733943939209, -0.004592716693878174, -0.004388093948364258, -0.004183471202850342, -0.003978848457336426, -0.0037742257118225098, -0.0035696029663085938, -0.0033649802207946777, -0.0031603574752807617, -0.0029557347297668457, -0.0027511119842529297, -0.0025464892387390137, -0.0023418664932250977, -0.0021372437477111816, -0.0019326210021972656, -0.0017279982566833496, -0.0015233755111694336, -0.0013187527656555176, -0.0011141300201416016, -0.0009095072746276855, -0.0007048845291137695, -0.0005002617835998535, -0.0002956390380859375, -9.101629257202148e-05, 0.00011360645294189453, 0.00031822919845581055, 0.0005228519439697266, 0.0007274746894836426, 0.0009320974349975586, 0.0011367201805114746, 0.0013413429260253906, 0.0015459656715393066, 0.0017505884170532227, 0.0019552111625671387, 0.0021598339080810547, 0.0023644566535949707, 0.0025690793991088867, 0.0027737021446228027, 0.0029783248901367188, 0.0031829476356506348, 0.0033875703811645508, 0.003592193126678467, 0.003796815872192383, 0.004001438617706299, 0.004206061363220215, 0.004410684108734131, 0.004615306854248047, 0.004819929599761963, 0.005024552345275879, 0.005229175090789795, 0.005433797836303711, 0.005638420581817627, 0.005843043327331543, 0.006047666072845459, 0.006252288818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 8.0, 9.0, 8.0, 23.0, 154.0, 666.0, 63.0, 23.0, 21.0, 13.0, 3.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3244737386703491, -0.3105740547180176, -0.29667437076568604, -0.2827746570110321, -0.26887497305870056, -0.254975289106369, -0.24107559025287628, -0.22717589139938354, -0.213276207447052, -0.19937652349472046, -0.18547682464122772, -0.17157712578773499, -0.15767744183540344, -0.1437777578830719, -0.12987805902957916, -0.11597836762666702, -0.10207867622375488, -0.08817898482084274, -0.0742792934179306, -0.06037960201501846, -0.04647991061210632, -0.03258021920919418, -0.018680527806282043, -0.0047808364033699036, 0.009118854999542236, 0.023018546402454376, 0.036918237805366516, 0.050817929208278656, 0.0647176206111908, 0.07861731201410294, 0.09251700341701508, 0.10641669481992722, 0.12031638622283936, 0.1342160701751709, 0.14811576902866364, 0.16201546788215637, 0.17591515183448792, 0.18981483578681946, 0.2037145346403122, 0.21761423349380493, 0.23151391744613647, 0.24541360139846802, 0.25931328535079956, 0.2732129991054535, 0.28711268305778503, 0.3010123670101166, 0.3149120807647705, 0.32881176471710205, 0.3427114486694336, 0.35661113262176514, 0.3705108165740967, 0.3844105303287506, 0.39831021428108215, 0.4122098982334137, 0.4261096119880676, 0.44000929594039917, 0.4539089798927307, 0.46780866384506226, 0.4817083477973938, 0.49560806155204773, 0.5095077753067017, 0.5234074592590332, 0.5373071432113647, 0.5512068271636963, 0.5651065111160278]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 3.0, 5.0, 8.0, 7.0, 7.0, 9.0, 20.0, 30.0, 53.0, 107.0, 126.0, 179.0, 150.0, 108.0, 60.0, 32.0, 18.0, 14.0, 11.0, 6.0, 5.0, 5.0, 9.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12328165769577026, -0.11845885217189789, -0.11363604664802551, -0.10881324112415314, -0.10399043560028076, -0.09916763007640839, -0.09434483200311661, -0.08952202647924423, -0.08469922095537186, -0.07987641543149948, -0.0750536099076271, -0.07023080438375473, -0.06540800631046295, -0.06058519706130028, -0.0557623952627182, -0.050939589738845825, -0.04611678421497345, -0.041293978691101074, -0.0364711731672287, -0.03164837136864662, -0.026825565844774246, -0.02200276032090187, -0.017179956659674644, -0.012357152998447418, -0.007534347474575043, -0.002711542882025242, 0.002111261710524559, 0.00693406630307436, 0.01175687089562416, 0.016579676419496536, 0.021402480080723763, 0.02622528374195099, 0.031048089265823364, 0.03587089478969574, 0.040693700313568115, 0.04551650211215019, 0.05033930763602257, 0.05516211315989494, 0.05998491495847702, 0.0648077204823494, 0.06963052600622177, 0.07445333153009415, 0.07927613705396652, 0.0840989425778389, 0.08892174065113068, 0.09374454617500305, 0.09856735169887543, 0.1033901572227478, 0.10821296274662018, 0.11303576827049255, 0.11785857379436493, 0.1226813793182373, 0.12750418484210968, 0.13232699036598206, 0.13714979588985443, 0.1419726014137268, 0.146795392036438, 0.15161819756031036, 0.15644100308418274, 0.16126380860805511, 0.1660866141319275, 0.17090941965579987, 0.17573222517967224, 0.18055501580238342, 0.185377836227417]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 10.0, 14.0, 18.0, 17.0, 20.0, 34.0, 58.0, 147.0, 1190.0, 50004.0, 4139548.0, 2817.0, 150.0, 50.0, 38.0, 26.0, 23.0, 21.0, 14.0, 13.0, 6.0, 3.0, 5.0, 10.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.90625, -2.8321075439453125, -2.757965087890625, -2.6838226318359375, -2.60968017578125, -2.5355377197265625, -2.461395263671875, -2.3872528076171875, -2.3131103515625, -2.2389678955078125, -2.164825439453125, -2.0906829833984375, -2.01654052734375, -1.9423980712890625, -1.868255615234375, -1.7941131591796875, -1.719970703125, -1.6458282470703125, -1.571685791015625, -1.4975433349609375, -1.42340087890625, -1.3492584228515625, -1.275115966796875, -1.2009735107421875, -1.1268310546875, -1.0526885986328125, -0.978546142578125, -0.9044036865234375, -0.83026123046875, -0.7561187744140625, -0.681976318359375, -0.6078338623046875, -0.53369140625, -0.4595489501953125, -0.385406494140625, -0.3112640380859375, -0.23712158203125, -0.1629791259765625, -0.088836669921875, -0.0146942138671875, 0.0594482421875, 0.1335906982421875, 0.207733154296875, 0.2818756103515625, 0.35601806640625, 0.4301605224609375, 0.504302978515625, 0.5784454345703125, 0.652587890625, 0.7267303466796875, 0.800872802734375, 0.8750152587890625, 0.94915771484375, 1.0233001708984375, 1.097442626953125, 1.1715850830078125, 1.2457275390625, 1.3198699951171875, 1.394012451171875, 1.4681549072265625, 1.54229736328125, 1.6164398193359375, 1.690582275390625, 1.7647247314453125, 1.8388671875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 4.0, 9.0, 7.0, 9.0, 9.0, 24.0, 84.0, 283.0, 323.0, 97.0, 24.0, 15.0, 7.0, 7.0, 11.0, 7.0, 9.0, 7.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0014324188232421875, -0.0013889670372009277, -0.001345515251159668, -0.0013020634651184082, -0.0012586116790771484, -0.0012151598930358887, -0.001171708106994629, -0.0011282563209533691, -0.0010848045349121094, -0.0010413527488708496, -0.0009979009628295898, -0.0009544491767883301, -0.0009109973907470703, -0.0008675456047058105, -0.0008240938186645508, -0.000780642032623291, -0.0007371902465820312, -0.0006937384605407715, -0.0006502866744995117, -0.000606834888458252, -0.0005633831024169922, -0.0005199313163757324, -0.00047647953033447266, -0.0004330277442932129, -0.0003895759582519531, -0.00034612417221069336, -0.0003026723861694336, -0.00025922060012817383, -0.00021576881408691406, -0.0001723170280456543, -0.00012886524200439453, -8.541345596313477e-05, -4.1961669921875e-05, 1.4901161193847656e-06, 4.494190216064453e-05, 8.83936882019043e-05, 0.00013184547424316406, 0.00017529726028442383, 0.0002187490463256836, 0.00026220083236694336, 0.0003056526184082031, 0.0003491044044494629, 0.00039255619049072266, 0.0004360079765319824, 0.0004794597625732422, 0.000522911548614502, 0.0005663633346557617, 0.0006098151206970215, 0.0006532669067382812, 0.000696718692779541, 0.0007401704788208008, 0.0007836222648620605, 0.0008270740509033203, 0.0008705258369445801, 0.0009139776229858398, 0.0009574294090270996, 0.0010008811950683594, 0.0010443329811096191, 0.001087784767150879, 0.0011312365531921387, 0.0011746883392333984, 0.0012181401252746582, 0.001261591911315918, 0.0013050436973571777, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 1.0, 18.0, 14.0, 36.0, 45.0, 78.0, 128.0, 208.0, 350.0, 106355.0, 4085870.0, 459.0, 233.0, 184.0, 120.0, 75.0, 49.0, 30.0, 22.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.394775390625, -0.3667106628417969, -0.33864593505859375, -0.3105812072753906, -0.2825164794921875, -0.2544517517089844, -0.22638702392578125, -0.19832229614257812, -0.170257568359375, -0.14219284057617188, -0.11412811279296875, -0.08606338500976562, -0.0579986572265625, -0.029933929443359375, -0.00186920166015625, 0.026195526123046875, 0.05426025390625, 0.08232498168945312, 0.11038970947265625, 0.13845443725585938, 0.1665191650390625, 0.19458389282226562, 0.22264862060546875, 0.2507133483886719, 0.278778076171875, 0.3068428039550781, 0.33490753173828125, 0.3629722595214844, 0.3910369873046875, 0.4191017150878906, 0.44716644287109375, 0.4752311706542969, 0.5032958984375, 0.5313606262207031, 0.5594253540039062, 0.5874900817871094, 0.6155548095703125, 0.6436195373535156, 0.6716842651367188, 0.6997489929199219, 0.727813720703125, 0.7558784484863281, 0.7839431762695312, 0.8120079040527344, 0.8400726318359375, 0.8681373596191406, 0.8962020874023438, 0.9242668151855469, 0.95233154296875, 0.9803962707519531, 1.0084609985351562, 1.0365257263183594, 1.0645904541015625, 1.0926551818847656, 1.1207199096679688, 1.1487846374511719, 1.176849365234375, 1.2049140930175781, 1.2329788208007812, 1.2610435485839844, 1.2891082763671875, 1.3171730041503906, 1.3452377319335938, 1.3733024597167969, 1.4013671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 4.0, 8.0, 15.0, 22.0, 36.0, 48.0, 100.0, 144.0, 236.0, 380.0, 1459.0, 581.0, 321.0, 234.0, 188.0, 111.0, 82.0, 48.0, 29.0, 21.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027332305908203125, -0.002521008253097534, -0.002308785915374756, -0.0020965635776519775, -0.0018843412399291992, -0.001672118902206421, -0.0014598965644836426, -0.0012476742267608643, -0.001035451889038086, -0.0008232295513153076, -0.0006110072135925293, -0.000398784875869751, -0.00018656253814697266, 2.5659799575805664e-05, 0.00023788213729858398, 0.0004501044750213623, 0.0006623268127441406, 0.0008745491504669189, 0.0010867714881896973, 0.0012989938259124756, 0.001511216163635254, 0.0017234385013580322, 0.0019356608390808105, 0.002147883176803589, 0.002360105514526367, 0.0025723278522491455, 0.002784550189971924, 0.002996772527694702, 0.0032089948654174805, 0.003421217203140259, 0.003633439540863037, 0.0038456618785858154, 0.004057884216308594, 0.004270106554031372, 0.00448232889175415, 0.004694551229476929, 0.004906773567199707, 0.005118995904922485, 0.005331218242645264, 0.005543440580368042, 0.00575566291809082, 0.005967885255813599, 0.006180107593536377, 0.006392329931259155, 0.006604552268981934, 0.006816774606704712, 0.00702899694442749, 0.0072412192821502686, 0.007453441619873047, 0.007665663957595825, 0.007877886295318604, 0.008090108633041382, 0.00830233097076416, 0.008514553308486938, 0.008726775646209717, 0.008938997983932495, 0.009151220321655273, 0.009363442659378052, 0.00957566499710083, 0.009787887334823608, 0.010000109672546387, 0.010212332010269165, 0.010424554347991943, 0.010636776685714722, 0.0108489990234375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [616.0, 389.0, 17.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0585235059261322, 0.003385651856660843, 0.06529480963945389, 0.12720397114753723, 0.18911312520503998, 0.2510222792625427, 0.31293144822120667, 0.3748405873775482, 0.43674975633621216, 0.4986589252948761, 0.56056809425354, 0.6224772334098816, 0.6843863725662231, 0.7462955713272095, 0.808204710483551, 0.8701138496398926, 0.9320230484008789, 0.9939321875572205, 1.055841326713562, 1.1177505254745483, 1.1796597242355347, 1.2415688037872314, 1.3034780025482178, 1.365387201309204, 1.4272962808609009, 1.4892054796218872, 1.551114559173584, 1.6130237579345703, 1.6749329566955566, 1.7368420362472534, 1.7987512350082397, 1.8606603145599365, 1.9225696325302124, 1.9844788312911987, 2.0463879108428955, 2.108297109603882, 2.170206308364868, 2.2321155071258545, 2.2940244674682617, 2.355933666229248, 2.4178428649902344, 2.4797520637512207, 2.541661262512207, 2.6035704612731934, 2.6654794216156006, 2.727388620376587, 2.7892978191375732, 2.8512070178985596, 2.913116216659546, 2.9750254154205322, 3.0369346141815186, 3.098843574523926, 3.160752773284912, 3.2226619720458984, 3.2845711708068848, 3.346480369567871, 3.4083893299102783, 3.4702985286712646, 3.532207727432251, 3.594116687774658, 3.6560258865356445, 3.717935085296631, 3.779844284057617, 3.8417534828186035, 3.90366268157959]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 40.0, 84.0, 118.0, 157.0, 179.0, 160.0, 119.0, 59.0, 35.0, 13.0, 12.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05067789554595947, -0.04592546075582504, -0.04117302596569061, -0.03642059490084648, -0.03166816011071205, -0.02691572532057762, -0.02216329239308834, -0.01741085946559906, -0.01265842467546463, -0.007905990816652775, -0.0031535569578409195, 0.0015988769009709358, 0.006351310759782791, 0.011103745549917221, 0.015856178477406502, 0.020608611404895782, 0.025361046195030212, 0.030113480985164642, 0.03486591577529907, 0.039618346840143204, 0.044370781630277634, 0.049123216420412064, 0.053875647485256195, 0.058628082275390625, 0.06338051706552505, 0.06813295185565948, 0.07288538664579391, 0.07763782143592834, 0.08239024877548218, 0.0871426910161972, 0.09189511835575104, 0.09664755314588547, 0.1013999879360199, 0.10615242272615433, 0.11090485751628876, 0.11565729230642319, 0.12040972709655762, 0.12516215443611145, 0.12991459667682648, 0.1346670240163803, 0.13941946625709534, 0.14417189359664917, 0.1489243358373642, 0.15367676317691803, 0.15842920541763306, 0.1631816327571869, 0.16793407499790192, 0.17268650233745575, 0.17743892967700958, 0.18219135701656342, 0.18694379925727844, 0.19169622659683228, 0.1964486688375473, 0.20120109617710114, 0.20595353841781616, 0.21070596575737, 0.21545839309692383, 0.22021082043647766, 0.2249632626771927, 0.22971569001674652, 0.23446813225746155, 0.23922055959701538, 0.2439730018377304, 0.24872542917728424, 0.25347787141799927]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 9.0, 10.0, 24.0, 21.0, 46.0, 57.0, 86.0, 91.0, 131.0, 150.0, 206.0, 313.0, 452.0, 593.0, 799.0, 1159.0, 1507.0, 2261.0, 3063.0, 4583.0, 6814.0, 10889.0, 20465.0, 87547.0, 771677.0, 82316.0, 20096.0, 10755.0, 6754.0, 4612.0, 3134.0, 2187.0, 1515.0, 1180.0, 817.0, 567.0, 478.0, 283.0, 226.0, 173.0, 123.0, 97.0, 85.0, 51.0, 41.0, 26.0, 28.0, 18.0, 9.0, 15.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.023101806640625, -0.022368192672729492, -0.021634578704833984, -0.020900964736938477, -0.02016735076904297, -0.01943373680114746, -0.018700122833251953, -0.017966508865356445, -0.017232894897460938, -0.01649928092956543, -0.015765666961669922, -0.015032052993774414, -0.014298439025878906, -0.013564825057983398, -0.01283121109008789, -0.012097597122192383, -0.011363983154296875, -0.010630369186401367, -0.00989675521850586, -0.009163141250610352, -0.008429527282714844, -0.007695913314819336, -0.006962299346923828, -0.00622868537902832, -0.0054950714111328125, -0.004761457443237305, -0.004027843475341797, -0.003294229507446289, -0.0025606155395507812, -0.0018270015716552734, -0.0010933876037597656, -0.0003597736358642578, 0.00037384033203125, 0.0011074542999267578, 0.0018410682678222656, 0.0025746822357177734, 0.0033082962036132812, 0.004041910171508789, 0.004775524139404297, 0.005509138107299805, 0.0062427520751953125, 0.00697636604309082, 0.007709980010986328, 0.008443593978881836, 0.009177207946777344, 0.009910821914672852, 0.01064443588256836, 0.011378049850463867, 0.012111663818359375, 0.012845277786254883, 0.01357889175415039, 0.014312505722045898, 0.015046119689941406, 0.015779733657836914, 0.016513347625732422, 0.01724696159362793, 0.017980575561523438, 0.018714189529418945, 0.019447803497314453, 0.02018141746520996, 0.02091503143310547, 0.021648645401000977, 0.022382259368896484, 0.023115873336791992, 0.0238494873046875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 7.0, 4.0, 3.0, 5.0, 6.0, 11.0, 3.0, 7.0, 8.0, 7.0, 18.0, 26.0, 88.0, 201.0, 246.0, 183.0, 74.0, 20.0, 11.0, 10.0, 8.0, 9.0, 7.0, 9.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014486312866210938, -0.0014037638902664185, -0.0013588964939117432, -0.0013140290975570679, -0.0012691617012023926, -0.0012242943048477173, -0.001179426908493042, -0.0011345595121383667, -0.0010896921157836914, -0.0010448247194290161, -0.0009999573230743408, -0.0009550899267196655, -0.0009102225303649902, -0.0008653551340103149, -0.0008204877376556396, -0.0007756203413009644, -0.0007307529449462891, -0.0006858855485916138, -0.0006410181522369385, -0.0005961507558822632, -0.0005512833595275879, -0.0005064159631729126, -0.0004615485668182373, -0.000416681170463562, -0.0003718137741088867, -0.0003269463777542114, -0.00028207898139953613, -0.00023721158504486084, -0.00019234418869018555, -0.00014747679233551025, -0.00010260939598083496, -5.774199962615967e-05, -1.2874603271484375e-05, 3.199279308319092e-05, 7.686018943786621e-05, 0.0001217275857925415, 0.0001665949821472168, 0.0002114623785018921, 0.0002563297748565674, 0.0003011971712112427, 0.00034606456756591797, 0.00039093196392059326, 0.00043579936027526855, 0.00048066675662994385, 0.0005255341529846191, 0.0005704015493392944, 0.0006152689456939697, 0.000660136342048645, 0.0007050037384033203, 0.0007498711347579956, 0.0007947385311126709, 0.0008396059274673462, 0.0008844733238220215, 0.0009293407201766968, 0.0009742081165313721, 0.0010190755128860474, 0.0010639429092407227, 0.001108810305595398, 0.0011536777019500732, 0.0011985450983047485, 0.0012434124946594238, 0.0012882798910140991, 0.0013331472873687744, 0.0013780146837234497, 0.001422882080078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 12.0, 20.0, 14.0, 12.0, 13.0, 16.0, 21.0, 22.0, 20.0, 33.0, 30.0, 33.0, 52.0, 87.0, 259.0, 1271.0, 10789.0, 949243.0, 81908.0, 3709.0, 489.0, 106.0, 52.0, 29.0, 26.0, 32.0, 20.0, 32.0, 19.0, 17.0, 21.0, 14.0, 10.0, 18.0, 12.0, 13.0, 7.0, 5.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.07745361328125, -0.07509040832519531, -0.07272720336914062, -0.07036399841308594, -0.06800079345703125, -0.06563758850097656, -0.06327438354492188, -0.06091117858886719, -0.0585479736328125, -0.05618476867675781, -0.053821563720703125, -0.05145835876464844, -0.04909515380859375, -0.04673194885253906, -0.044368743896484375, -0.04200553894042969, -0.039642333984375, -0.03727912902832031, -0.034915924072265625, -0.03255271911621094, -0.03018951416015625, -0.027826309204101562, -0.025463104248046875, -0.023099899291992188, -0.0207366943359375, -0.018373489379882812, -0.016010284423828125, -0.013647079467773438, -0.01128387451171875, -0.008920669555664062, -0.006557464599609375, -0.0041942596435546875, -0.0018310546875, 0.0005321502685546875, 0.002895355224609375, 0.0052585601806640625, 0.00762176513671875, 0.009984970092773438, 0.012348175048828125, 0.014711380004882812, 0.0170745849609375, 0.019437789916992188, 0.021800994873046875, 0.024164199829101562, 0.02652740478515625, 0.028890609741210938, 0.031253814697265625, 0.03361701965332031, 0.035980224609375, 0.03834342956542969, 0.040706634521484375, 0.04306983947753906, 0.04543304443359375, 0.04779624938964844, 0.050159454345703125, 0.05252265930175781, 0.0548858642578125, 0.05724906921386719, 0.059612274169921875, 0.06197547912597656, 0.06433868408203125, 0.06670188903808594, 0.06906509399414062, 0.07142829895019531, 0.07379150390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 2.0, 5.0, 3.0, 5.0, 6.0, 9.0, 12.0, 12.0, 12.0, 13.0, 15.0, 16.0, 18.0, 23.0, 35.0, 27.0, 31.0, 35.0, 32.0, 35.0, 41.0, 38.0, 45.0, 38.0, 41.0, 26.0, 36.0, 39.0, 42.0, 28.0, 39.0, 28.0, 25.0, 27.0, 25.0, 13.0, 20.0, 13.0, 13.0, 13.0, 18.0, 9.0, 7.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.004245758056640625, -0.0041138529777526855, -0.003981947898864746, -0.0038500428199768066, -0.003718137741088867, -0.0035862326622009277, -0.0034543275833129883, -0.003322422504425049, -0.0031905174255371094, -0.00305861234664917, -0.0029267072677612305, -0.002794802188873291, -0.0026628971099853516, -0.002530992031097412, -0.0023990869522094727, -0.002267181873321533, -0.0021352767944335938, -0.0020033717155456543, -0.0018714666366577148, -0.0017395615577697754, -0.001607656478881836, -0.0014757513999938965, -0.001343846321105957, -0.0012119412422180176, -0.0010800361633300781, -0.0009481310844421387, -0.0008162260055541992, -0.0006843209266662598, -0.0005524158477783203, -0.00042051076889038086, -0.0002886056900024414, -0.00015670061111450195, -2.47955322265625e-05, 0.00010710954666137695, 0.0002390146255493164, 0.00037091970443725586, 0.0005028247833251953, 0.0006347298622131348, 0.0007666349411010742, 0.0008985400199890137, 0.0010304450988769531, 0.0011623501777648926, 0.001294255256652832, 0.0014261603355407715, 0.001558065414428711, 0.0016899704933166504, 0.0018218755722045898, 0.0019537806510925293, 0.0020856857299804688, 0.002217590808868408, 0.0023494958877563477, 0.002481400966644287, 0.0026133060455322266, 0.002745211124420166, 0.0028771162033081055, 0.003009021282196045, 0.0031409263610839844, 0.003272831439971924, 0.0034047365188598633, 0.0035366415977478027, 0.003668546676635742, 0.0038004517555236816, 0.003932356834411621, 0.0040642619132995605, 0.0041961669921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 20.0, 23.0, 58.0, 146.0, 899.0, 967740.0, 78803.0, 610.0, 99.0, 58.0, 31.0, 12.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.0650634765625, -0.06364703178405762, -0.062230587005615234, -0.06081414222717285, -0.05939769744873047, -0.057981252670288086, -0.0565648078918457, -0.05514836311340332, -0.05373191833496094, -0.052315473556518555, -0.05089902877807617, -0.04948258399963379, -0.048066139221191406, -0.04664969444274902, -0.04523324966430664, -0.04381680488586426, -0.042400360107421875, -0.04098391532897949, -0.03956747055053711, -0.03815102577209473, -0.036734580993652344, -0.03531813621520996, -0.03390169143676758, -0.032485246658325195, -0.031068801879882812, -0.02965235710144043, -0.028235912322998047, -0.026819467544555664, -0.02540302276611328, -0.0239865779876709, -0.022570133209228516, -0.021153688430786133, -0.01973724365234375, -0.018320798873901367, -0.016904354095458984, -0.015487909317016602, -0.014071464538574219, -0.012655019760131836, -0.011238574981689453, -0.00982213020324707, -0.008405685424804688, -0.006989240646362305, -0.005572795867919922, -0.004156351089477539, -0.0027399063110351562, -0.0013234615325927734, 9.298324584960938e-05, 0.0015094280242919922, 0.002925872802734375, 0.004342317581176758, 0.005758762359619141, 0.0071752071380615234, 0.008591651916503906, 0.010008096694946289, 0.011424541473388672, 0.012840986251831055, 0.014257431030273438, 0.01567387580871582, 0.017090320587158203, 0.018506765365600586, 0.01992321014404297, 0.02133965492248535, 0.022756099700927734, 0.024172544479370117, 0.0255889892578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 11.0, 21.0, 72.0, 415.0, 369.0, 58.0, 18.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002791881561279297, -0.0002709701657295227, -0.0002627521753311157, -0.00025453418493270874, -0.00024631619453430176, -0.00023809820413589478, -0.0002298802137374878, -0.0002216622233390808, -0.00021344423294067383, -0.00020522624254226685, -0.00019700825214385986, -0.00018879026174545288, -0.0001805722713470459, -0.00017235428094863892, -0.00016413629055023193, -0.00015591830015182495, -0.00014770030975341797, -0.00013948231935501099, -0.000131264328956604, -0.00012304633855819702, -0.00011482834815979004, -0.00010661035776138306, -9.839236736297607e-05, -9.017437696456909e-05, -8.195638656616211e-05, -7.373839616775513e-05, -6.552040576934814e-05, -5.730241537094116e-05, -4.908442497253418e-05, -4.08664345741272e-05, -3.2648444175720215e-05, -2.4430453777313232e-05, -1.621246337890625e-05, -7.994472980499268e-06, 2.2351741790771484e-07, 8.441507816314697e-06, 1.665949821472168e-05, 2.4877488613128662e-05, 3.3095479011535645e-05, 4.131346940994263e-05, 4.953145980834961e-05, 5.774945020675659e-05, 6.596744060516357e-05, 7.418543100357056e-05, 8.240342140197754e-05, 9.062141180038452e-05, 9.88394021987915e-05, 0.00010705739259719849, 0.00011527538299560547, 0.00012349337339401245, 0.00013171136379241943, 0.00013992935419082642, 0.0001481473445892334, 0.00015636533498764038, 0.00016458332538604736, 0.00017280131578445435, 0.00018101930618286133, 0.0001892372965812683, 0.0001974552869796753, 0.00020567327737808228, 0.00021389126777648926, 0.00022210925817489624, 0.00023032724857330322, 0.0002385452389717102, 0.0002467632293701172]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 3.0, 13.0, 17.0, 29.0, 61.0, 231.0, 1288.0, 36434.0, 1006640.0, 3276.0, 373.0, 99.0, 37.0, 11.0, 13.0, 10.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048492431640625, -0.04703187942504883, -0.045571327209472656, -0.044110774993896484, -0.04265022277832031, -0.04118967056274414, -0.03972911834716797, -0.0382685661315918, -0.036808013916015625, -0.03534746170043945, -0.03388690948486328, -0.03242635726928711, -0.030965805053710938, -0.029505252838134766, -0.028044700622558594, -0.026584148406982422, -0.02512359619140625, -0.023663043975830078, -0.022202491760253906, -0.020741939544677734, -0.019281387329101562, -0.01782083511352539, -0.01636028289794922, -0.014899730682373047, -0.013439178466796875, -0.011978626251220703, -0.010518074035644531, -0.00905752182006836, -0.0075969696044921875, -0.006136417388916016, -0.004675865173339844, -0.003215312957763672, -0.0017547607421875, -0.0002942085266113281, 0.0011663436889648438, 0.0026268959045410156, 0.0040874481201171875, 0.005548000335693359, 0.007008552551269531, 0.008469104766845703, 0.009929656982421875, 0.011390209197998047, 0.012850761413574219, 0.01431131362915039, 0.015771865844726562, 0.017232418060302734, 0.018692970275878906, 0.020153522491455078, 0.02161407470703125, 0.023074626922607422, 0.024535179138183594, 0.025995731353759766, 0.027456283569335938, 0.02891683578491211, 0.03037738800048828, 0.03183794021606445, 0.033298492431640625, 0.0347590446472168, 0.03621959686279297, 0.03768014907836914, 0.03914070129394531, 0.040601253509521484, 0.042061805725097656, 0.04352235794067383, 0.04498291015625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 8.0, 15.0, 16.0, 42.0, 81.0, 148.0, 452.0, 93.0, 38.0, 25.0, 14.0, 19.0, 10.0, 10.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00852203369140625, -0.00831061601638794, -0.008099198341369629, -0.007887780666351318, -0.007676362991333008, -0.007464945316314697, -0.007253527641296387, -0.007042109966278076, -0.006830692291259766, -0.006619274616241455, -0.0064078569412231445, -0.006196439266204834, -0.0059850215911865234, -0.005773603916168213, -0.005562186241149902, -0.005350768566131592, -0.005139350891113281, -0.004927933216094971, -0.00471651554107666, -0.00450509786605835, -0.004293680191040039, -0.0040822625160217285, -0.003870844841003418, -0.0036594271659851074, -0.003448009490966797, -0.0032365918159484863, -0.0030251741409301758, -0.0028137564659118652, -0.0026023387908935547, -0.002390921115875244, -0.0021795034408569336, -0.001968085765838623, -0.0017566680908203125, -0.001545250415802002, -0.0013338327407836914, -0.0011224150657653809, -0.0009109973907470703, -0.0006995797157287598, -0.0004881620407104492, -0.00027674436569213867, -6.532669067382812e-05, 0.00014609098434448242, 0.00035750865936279297, 0.0005689263343811035, 0.0007803440093994141, 0.0009917616844177246, 0.0012031793594360352, 0.0014145970344543457, 0.0016260147094726562, 0.0018374323844909668, 0.0020488500595092773, 0.002260267734527588, 0.0024716854095458984, 0.002683103084564209, 0.0028945207595825195, 0.00310593843460083, 0.0033173561096191406, 0.003528773784637451, 0.0037401914596557617, 0.003951609134674072, 0.004163026809692383, 0.004374444484710693, 0.004585862159729004, 0.0047972798347473145, 0.005008697509765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 8.0, 10.0, 11.0, 13.0, 30.0, 86.0, 339.0, 326.0, 88.0, 27.0, 15.0, 13.0, 7.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08528926968574524, -0.08200879395008087, -0.07872831076383591, -0.07544783502817154, -0.07216735929250717, -0.06888687610626221, -0.06560640037059784, -0.06232592463493347, -0.059045445173978806, -0.05576496571302414, -0.05248448997735977, -0.049204010516405106, -0.04592353105545044, -0.04264305531978607, -0.039362575858831406, -0.03608209639787674, -0.03280162066221237, -0.029521143063902855, -0.026240665465593338, -0.022960186004638672, -0.019679708406329155, -0.016399230808019638, -0.013118751347064972, -0.009838273748755455, -0.006557796150445938, -0.003277318086475134, 3.1599774956703186e-06, 0.003283638507127762, 0.006564116105437279, 0.009844593703746796, 0.013125073164701462, 0.01640555076301098, 0.0196860209107399, 0.022966498509049416, 0.026246976107358932, 0.0295274555683136, 0.032807931303977966, 0.03608841076493263, 0.0393688902258873, 0.042649365961551666, 0.04592984542250633, 0.049210324883461, 0.052490800619125366, 0.05577128008008003, 0.0590517595410347, 0.062332235276699066, 0.06561271846294403, 0.0688931941986084, 0.07217366993427277, 0.07545414566993713, 0.0787346288561821, 0.08201510459184647, 0.08529558032751083, 0.0885760635137558, 0.09185653924942017, 0.09513701498508453, 0.0984174907207489, 0.10169796645641327, 0.10497844964265823, 0.1082589253783226, 0.11153940111398697, 0.11481988430023193, 0.1181003600358963, 0.12138083577156067, 0.12466131895780563]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 2.0, 5.0, 3.0, 8.0, 16.0, 21.0, 18.0, 36.0, 27.0, 47.0, 67.0, 66.0, 92.0, 89.0, 90.0, 72.0, 61.0, 70.0, 43.0, 36.0, 29.0, 24.0, 24.0, 11.0, 5.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0361018180847168, -0.03461151570081711, -0.03312121331691742, -0.03163091093301773, -0.030140608549118042, -0.028650306165218353, -0.027160003781318665, -0.025669701397418976, -0.024179399013519287, -0.0226890966296196, -0.02119879424571991, -0.01970849186182022, -0.018218189477920532, -0.016727887094020844, -0.015237584710121155, -0.013747282326221466, -0.012256979942321777, -0.010766677558422089, -0.0092763751745224, -0.007786072790622711, -0.0062957704067230225, -0.004805468022823334, -0.003315165638923645, -0.0018248632550239563, -0.0003345608711242676, 0.0011557415127754211, 0.00264604389667511, 0.004136346280574799, 0.005626648664474487, 0.007116951048374176, 0.008607253432273865, 0.010097555816173553, 0.011587858200073242, 0.013078160583972931, 0.01456846296787262, 0.01605876535177231, 0.017549067735671997, 0.019039370119571686, 0.020529672503471375, 0.022019974887371063, 0.023510277271270752, 0.02500057965517044, 0.02649088203907013, 0.027981184422969818, 0.029471486806869507, 0.030961789190769196, 0.032452091574668884, 0.03394239395856857, 0.03543269634246826, 0.03692299872636795, 0.03841330111026764, 0.03990360349416733, 0.04139390587806702, 0.042884208261966705, 0.044374510645866394, 0.04586481302976608, 0.04735511541366577, 0.04884541779756546, 0.05033572018146515, 0.05182602256536484, 0.053316324949264526, 0.054806627333164215, 0.056296929717063904, 0.05778723210096359, 0.05927753448486328]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 6.0, 8.0, 6.0, 6.0, 8.0, 4.0, 14.0, 7.0, 13.0, 12.0, 10.0, 12.0, 10.0, 34.0, 24.0, 112.0, 1803.0, 4191749.0, 220.0, 38.0, 30.0, 14.0, 8.0, 12.0, 14.0, 16.0, 12.0, 0.0, 4.0, 10.0, 6.0, 2.0, 16.0, 6.0, 2.0, 8.0, 4.0, 0.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.9111328125, -1.8597412109375, -1.808349609375, -1.7569580078125, -1.70556640625, -1.6541748046875, -1.602783203125, -1.5513916015625, -1.5, -1.4486083984375, -1.397216796875, -1.3458251953125, -1.29443359375, -1.2430419921875, -1.191650390625, -1.1402587890625, -1.0888671875, -1.0374755859375, -0.986083984375, -0.9346923828125, -0.88330078125, -0.8319091796875, -0.780517578125, -0.7291259765625, -0.677734375, -0.6263427734375, -0.574951171875, -0.5235595703125, -0.47216796875, -0.4207763671875, -0.369384765625, -0.3179931640625, -0.2666015625, -0.2152099609375, -0.163818359375, -0.1124267578125, -0.06103515625, -0.0096435546875, 0.041748046875, 0.0931396484375, 0.14453125, 0.1959228515625, 0.247314453125, 0.2987060546875, 0.35009765625, 0.4014892578125, 0.452880859375, 0.5042724609375, 0.5556640625, 0.6070556640625, 0.658447265625, 0.7098388671875, 0.76123046875, 0.8126220703125, 0.864013671875, 0.9154052734375, 0.966796875, 1.0181884765625, 1.069580078125, 1.1209716796875, 1.17236328125, 1.2237548828125, 1.275146484375, 1.3265380859375, 1.3779296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 3.0, 5.0, 4.0, 11.0, 4.0, 6.0, 9.0, 14.0, 21.0, 49.0, 118.0, 175.0, 230.0, 147.0, 65.0, 32.0, 14.0, 10.0, 7.0, 8.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012407302856445312, -0.0012008696794509888, -0.0011610090732574463, -0.0011211484670639038, -0.0010812878608703613, -0.0010414272546768188, -0.0010015666484832764, -0.0009617060422897339, -0.0009218454360961914, -0.0008819848299026489, -0.0008421242237091064, -0.000802263617515564, -0.0007624030113220215, -0.000722542405128479, -0.0006826817989349365, -0.000642821192741394, -0.0006029605865478516, -0.0005630999803543091, -0.0005232393741607666, -0.0004833787679672241, -0.00044351816177368164, -0.00040365755558013916, -0.0003637969493865967, -0.0003239363431930542, -0.0002840757369995117, -0.00024421513080596924, -0.00020435452461242676, -0.00016449391841888428, -0.0001246333122253418, -8.477270603179932e-05, -4.4912099838256836e-05, -5.0514936447143555e-06, 3.4809112548828125e-05, 7.46697187423706e-05, 0.00011453032493591309, 0.00015439093112945557, 0.00019425153732299805, 0.00023411214351654053, 0.000273972749710083, 0.0003138333559036255, 0.00035369396209716797, 0.00039355456829071045, 0.00043341517448425293, 0.0004732757806777954, 0.0005131363868713379, 0.0005529969930648804, 0.0005928575992584229, 0.0006327182054519653, 0.0006725788116455078, 0.0007124394178390503, 0.0007523000240325928, 0.0007921606302261353, 0.0008320212364196777, 0.0008718818426132202, 0.0009117424488067627, 0.0009516030550003052, 0.0009914636611938477, 0.0010313242673873901, 0.0010711848735809326, 0.001111045479774475, 0.0011509060859680176, 0.00119076669216156, 0.0012306272983551025, 0.001270487904548645, 0.0013103485107421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 10.0, 19.0, 35.0, 88.0, 199.0, 883.0, 4192156.0, 642.0, 143.0, 46.0, 30.0, 16.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.982421875, -1.94384765625, -1.9052734375, -1.86669921875, -1.828125, -1.78955078125, -1.7509765625, -1.71240234375, -1.673828125, -1.63525390625, -1.5966796875, -1.55810546875, -1.51953125, -1.48095703125, -1.4423828125, -1.40380859375, -1.365234375, -1.32666015625, -1.2880859375, -1.24951171875, -1.2109375, -1.17236328125, -1.1337890625, -1.09521484375, -1.056640625, -1.01806640625, -0.9794921875, -0.94091796875, -0.90234375, -0.86376953125, -0.8251953125, -0.78662109375, -0.748046875, -0.70947265625, -0.6708984375, -0.63232421875, -0.59375, -0.55517578125, -0.5166015625, -0.47802734375, -0.439453125, -0.40087890625, -0.3623046875, -0.32373046875, -0.28515625, -0.24658203125, -0.2080078125, -0.16943359375, -0.130859375, -0.09228515625, -0.0537109375, -0.01513671875, 0.0234375, 0.06201171875, 0.1005859375, 0.13916015625, 0.177734375, 0.21630859375, 0.2548828125, 0.29345703125, 0.33203125, 0.37060546875, 0.4091796875, 0.44775390625, 0.486328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 15.0, 18.0, 38.0, 92.0, 126.0, 297.0, 974.0, 1818.0, 371.0, 166.0, 73.0, 34.0, 23.0, 15.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0030727386474609375, -0.0028822720050811768, -0.002691805362701416, -0.0025013387203216553, -0.0023108720779418945, -0.002120405435562134, -0.001929938793182373, -0.0017394721508026123, -0.0015490055084228516, -0.0013585388660430908, -0.00116807222366333, -0.0009776055812835693, -0.0007871389389038086, -0.0005966722965240479, -0.0004062056541442871, -0.00021573901176452637, -2.5272369384765625e-05, 0.00016519427299499512, 0.00035566091537475586, 0.0005461275577545166, 0.0007365942001342773, 0.0009270608425140381, 0.0011175274848937988, 0.0013079941272735596, 0.0014984607696533203, 0.001688927412033081, 0.0018793940544128418, 0.0020698606967926025, 0.0022603273391723633, 0.002450793981552124, 0.0026412606239318848, 0.0028317272663116455, 0.0030221939086914062, 0.003212660551071167, 0.0034031271934509277, 0.0035935938358306885, 0.0037840604782104492, 0.00397452712059021, 0.004164993762969971, 0.0043554604053497314, 0.004545927047729492, 0.004736393690109253, 0.004926860332489014, 0.005117326974868774, 0.005307793617248535, 0.005498260259628296, 0.005688726902008057, 0.005879193544387817, 0.006069660186767578, 0.006260126829147339, 0.0064505934715271, 0.00664106011390686, 0.006831526756286621, 0.007021993398666382, 0.007212460041046143, 0.007402926683425903, 0.007593393325805664, 0.007783859968185425, 0.007974326610565186, 0.008164793252944946, 0.008355259895324707, 0.008545726537704468, 0.008736193180084229, 0.00892665982246399, 0.00911712646484375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 13.0, 1007.0, 1.0, 0.0, 2.0], "bins": [-4.851652145385742, -4.771372318267822, -4.691092491149902, -4.610812664031982, -4.5305328369140625, -4.450253009796143, -4.369973182678223, -4.2896928787231445, -4.209413051605225, -4.129133224487305, -4.048853397369385, -3.968573570251465, -3.888293504714966, -3.808013677597046, -3.727733850479126, -3.647454023361206, -3.5671744346618652, -3.4868946075439453, -3.4066147804260254, -3.3263349533081055, -3.2460548877716064, -3.1657750606536865, -3.0854952335357666, -3.0052154064178467, -2.9249353408813477, -2.8446555137634277, -2.764375686645508, -2.684095859527588, -2.603815793991089, -2.523535966873169, -2.443256139755249, -2.362976312637329, -2.2826967239379883, -2.2024168968200684, -2.1221370697021484, -2.0418572425842285, -1.961577296257019, -1.8812973499298096, -1.8010175228118896, -1.7207376956939697, -1.6404577493667603, -1.5601779222488403, -1.4798979759216309, -1.399618148803711, -1.319338321685791, -1.239058494567871, -1.1587785482406616, -1.0784987211227417, -0.9982188940048218, -0.9179390072822571, -0.8376591801643372, -0.7573792934417725, -0.6770994663238525, -0.5968195796012878, -0.5165396928787231, -0.4362598657608032, -0.35597994923591614, -0.27570009231567383, -0.19542022049427032, -0.11514034867286682, -0.03486049175262451, 0.0454193651676178, 0.1256992518901825, 0.20597907900810242, 0.2862589657306671]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 19.0, 56.0, 104.0, 201.0, 248.0, 186.0, 117.0, 43.0, 18.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04269814491271973, -0.03907020390033722, -0.03544226661324501, -0.0318143293261528, -0.028186388313770294, -0.024558449164032936, -0.020930510014295578, -0.01730257086455822, -0.013674631714820862, -0.010046692565083504, -0.006418753415346146, -0.0027908142656087875, 0.0008371248841285706, 0.004465064033865929, 0.008093003183603287, 0.011720942333340645, 0.015348881483078003, 0.01897682063281536, 0.02260475978255272, 0.026232698932290077, 0.029860638082027435, 0.03348857909440994, 0.03711651638150215, 0.04074445366859436, 0.04437239468097687, 0.048000335693359375, 0.051628272980451584, 0.05525621026754379, 0.0588841512799263, 0.06251209229230881, 0.06614002585411072, 0.06976796686649323, 0.07339590787887573, 0.07702384889125824, 0.08065178990364075, 0.08427972346544266, 0.08790766447782516, 0.09153560549020767, 0.09516353905200958, 0.09879148006439209, 0.1024194210767746, 0.1060473620891571, 0.10967530310153961, 0.11330323666334152, 0.11693117767572403, 0.12055911868810654, 0.12418705224990845, 0.12781499326229095, 0.13144293427467346, 0.13507087528705597, 0.13869881629943848, 0.14232675731182098, 0.1459546983242035, 0.1495826244354248, 0.1532105654478073, 0.15683850646018982, 0.16046644747257233, 0.16409438848495483, 0.16772232949733734, 0.17135027050971985, 0.17497819662094116, 0.17860613763332367, 0.18223407864570618, 0.18586201965808868, 0.1894899606704712]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 6.0, 6.0, 16.0, 8.0, 15.0, 18.0, 12.0, 17.0, 17.0, 18.0, 13.0, 21.0, 31.0, 41.0, 37.0, 36.0, 36.0, 37.0, 72.0, 249.0, 219949.0, 826988.0, 413.0, 92.0, 67.0, 33.0, 34.0, 33.0, 16.0, 27.0, 28.0, 29.0, 23.0, 18.0, 10.0, 21.0, 10.0, 10.0, 9.0, 5.0, 7.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.58935546875, -0.5720596313476562, -0.5547637939453125, -0.5374679565429688, -0.520172119140625, -0.5028762817382812, -0.4855804443359375, -0.46828460693359375, -0.45098876953125, -0.43369293212890625, -0.4163970947265625, -0.39910125732421875, -0.381805419921875, -0.36450958251953125, -0.3472137451171875, -0.32991790771484375, -0.3126220703125, -0.29532623291015625, -0.2780303955078125, -0.26073455810546875, -0.243438720703125, -0.22614288330078125, -0.2088470458984375, -0.19155120849609375, -0.17425537109375, -0.15695953369140625, -0.1396636962890625, -0.12236785888671875, -0.105072021484375, -0.08777618408203125, -0.0704803466796875, -0.05318450927734375, -0.035888671875, -0.01859283447265625, -0.0012969970703125, 0.01599884033203125, 0.033294677734375, 0.05059051513671875, 0.0678863525390625, 0.08518218994140625, 0.10247802734375, 0.11977386474609375, 0.1370697021484375, 0.15436553955078125, 0.171661376953125, 0.18895721435546875, 0.2062530517578125, 0.22354888916015625, 0.2408447265625, 0.25814056396484375, 0.2754364013671875, 0.29273223876953125, 0.310028076171875, 0.32732391357421875, 0.3446197509765625, 0.36191558837890625, 0.37921142578125, 0.39650726318359375, 0.4138031005859375, 0.43109893798828125, 0.448394775390625, 0.46569061279296875, 0.4829864501953125, 0.5002822875976562, 0.517578125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [27.0, 273.0, 590.0, 121.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004947662353515625, -0.0028790831565856934, -0.0008105039596557617, 0.00125807523727417, 0.0033266544342041016, 0.005395233631134033, 0.007463812828063965, 0.009532392024993896, 0.011600971221923828, 0.01366955041885376, 0.01573812961578369, 0.017806708812713623, 0.019875288009643555, 0.021943867206573486, 0.024012446403503418, 0.02608102560043335, 0.02814960479736328, 0.030218183994293213, 0.032286763191223145, 0.034355342388153076, 0.03642392158508301, 0.03849250078201294, 0.04056107997894287, 0.0426296591758728, 0.044698238372802734, 0.046766817569732666, 0.0488353967666626, 0.05090397596359253, 0.05297255516052246, 0.05504113435745239, 0.057109713554382324, 0.059178292751312256, 0.06124687194824219, 0.06331545114517212, 0.06538403034210205, 0.06745260953903198, 0.06952118873596191, 0.07158976793289185, 0.07365834712982178, 0.07572692632675171, 0.07779550552368164, 0.07986408472061157, 0.0819326639175415, 0.08400124311447144, 0.08606982231140137, 0.0881384015083313, 0.09020698070526123, 0.09227555990219116, 0.0943441390991211, 0.09641271829605103, 0.09848129749298096, 0.10054987668991089, 0.10261845588684082, 0.10468703508377075, 0.10675561428070068, 0.10882419347763062, 0.11089277267456055, 0.11296135187149048, 0.11502993106842041, 0.11709851026535034, 0.11916708946228027, 0.1212356686592102, 0.12330424785614014, 0.12537282705307007, 0.12744140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 7.0, 8.0, 16.0, 15.0, 24.0, 31.0, 27.0, 49.0, 64.0, 123.0, 202.0, 503.0, 1448.0, 5697.0, 32482.0, 381129.0, 570476.0, 45758.0, 7334.0, 1860.0, 640.0, 265.0, 122.0, 70.0, 35.0, 32.0, 28.0, 18.0, 14.0, 6.0, 16.0, 12.0, 7.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2357177734375, -0.22837066650390625, -0.2210235595703125, -0.21367645263671875, -0.206329345703125, -0.19898223876953125, -0.1916351318359375, -0.18428802490234375, -0.17694091796875, -0.16959381103515625, -0.1622467041015625, -0.15489959716796875, -0.147552490234375, -0.14020538330078125, -0.1328582763671875, -0.12551116943359375, -0.1181640625, -0.11081695556640625, -0.1034698486328125, -0.09612274169921875, -0.088775634765625, -0.08142852783203125, -0.0740814208984375, -0.06673431396484375, -0.05938720703125, -0.05204010009765625, -0.0446929931640625, -0.03734588623046875, -0.029998779296875, -0.02265167236328125, -0.0153045654296875, -0.00795745849609375, -0.0006103515625, 0.00673675537109375, 0.0140838623046875, 0.02143096923828125, 0.028778076171875, 0.03612518310546875, 0.0434722900390625, 0.05081939697265625, 0.05816650390625, 0.06551361083984375, 0.0728607177734375, 0.08020782470703125, 0.087554931640625, 0.09490203857421875, 0.1022491455078125, 0.10959625244140625, 0.116943359375, 0.12429046630859375, 0.1316375732421875, 0.13898468017578125, 0.146331787109375, 0.15367889404296875, 0.1610260009765625, 0.16837310791015625, 0.17572021484375, 0.18306732177734375, 0.1904144287109375, 0.19776153564453125, 0.205108642578125, 0.21245574951171875, 0.2198028564453125, 0.22714996337890625, 0.2344970703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 7.0, 12.0, 13.0, 15.0, 20.0, 26.0, 27.0, 29.0, 38.0, 45.0, 49.0, 52.0, 50.0, 65.0, 55.0, 73.0, 53.0, 51.0, 54.0, 38.0, 39.0, 33.0, 21.0, 25.0, 24.0, 12.0, 14.0, 11.0, 1.0, 4.0, 13.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.1256103515625, -0.12235069274902344, -0.11909103393554688, -0.11583137512207031, -0.11257171630859375, -0.10931205749511719, -0.10605239868164062, -0.10279273986816406, -0.0995330810546875, -0.09627342224121094, -0.09301376342773438, -0.08975410461425781, -0.08649444580078125, -0.08323478698730469, -0.07997512817382812, -0.07671546936035156, -0.073455810546875, -0.07019615173339844, -0.06693649291992188, -0.06367683410644531, -0.06041717529296875, -0.05715751647949219, -0.053897857666015625, -0.05063819885253906, -0.0473785400390625, -0.04411888122558594, -0.040859222412109375, -0.03759956359863281, -0.03433990478515625, -0.031080245971679688, -0.027820587158203125, -0.024560928344726562, -0.02130126953125, -0.018041610717773438, -0.014781951904296875, -0.011522293090820312, -0.00826263427734375, -0.0050029754638671875, -0.001743316650390625, 0.0015163421630859375, 0.0047760009765625, 0.008035659790039062, 0.011295318603515625, 0.014554977416992188, 0.01781463623046875, 0.021074295043945312, 0.024333953857421875, 0.027593612670898438, 0.030853271484375, 0.03411293029785156, 0.037372589111328125, 0.04063224792480469, 0.04389190673828125, 0.04715156555175781, 0.050411224365234375, 0.05367088317871094, 0.0569305419921875, 0.06019020080566406, 0.06344985961914062, 0.06670951843261719, 0.06996917724609375, 0.07322883605957031, 0.07648849487304688, 0.07974815368652344, 0.0830078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 7.0, 10.0, 15.0, 26.0, 27.0, 46.0, 85.0, 135.0, 295.0, 574.0, 1525.0, 4876.0, 24841.0, 591626.0, 397082.0, 20427.0, 4345.0, 1428.0, 541.0, 273.0, 124.0, 71.0, 47.0, 34.0, 25.0, 24.0, 11.0, 3.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23193359375, -0.22418975830078125, -0.2164459228515625, -0.20870208740234375, -0.200958251953125, -0.19321441650390625, -0.1854705810546875, -0.17772674560546875, -0.16998291015625, -0.16223907470703125, -0.1544952392578125, -0.14675140380859375, -0.139007568359375, -0.13126373291015625, -0.1235198974609375, -0.11577606201171875, -0.1080322265625, -0.10028839111328125, -0.0925445556640625, -0.08480072021484375, -0.077056884765625, -0.06931304931640625, -0.0615692138671875, -0.05382537841796875, -0.04608154296875, -0.03833770751953125, -0.0305938720703125, -0.02285003662109375, -0.015106201171875, -0.00736236572265625, 0.0003814697265625, 0.00812530517578125, 0.015869140625, 0.02361297607421875, 0.0313568115234375, 0.03910064697265625, 0.046844482421875, 0.05458831787109375, 0.0623321533203125, 0.07007598876953125, 0.07781982421875, 0.08556365966796875, 0.0933074951171875, 0.10105133056640625, 0.108795166015625, 0.11653900146484375, 0.1242828369140625, 0.13202667236328125, 0.1397705078125, 0.14751434326171875, 0.1552581787109375, 0.16300201416015625, 0.170745849609375, 0.17848968505859375, 0.1862335205078125, 0.19397735595703125, 0.20172119140625, 0.20946502685546875, 0.2172088623046875, 0.22495269775390625, 0.232696533203125, 0.24044036865234375, 0.2481842041015625, 0.25592803955078125, 0.263671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 18.0, 18.0, 37.0, 45.0, 68.0, 105.0, 156.0, 102.0, 112.0, 88.0, 58.0, 31.0, 23.0, 23.0, 19.0, 6.0, 9.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7702579498291016e-05, -1.7132610082626343e-05, -1.656264066696167e-05, -1.5992671251296997e-05, -1.5422701835632324e-05, -1.4852732419967651e-05, -1.4282763004302979e-05, -1.3712793588638306e-05, -1.3142824172973633e-05, -1.257285475730896e-05, -1.2002885341644287e-05, -1.1432915925979614e-05, -1.0862946510314941e-05, -1.0292977094650269e-05, -9.723007678985596e-06, -9.153038263320923e-06, -8.58306884765625e-06, -8.013099431991577e-06, -7.443130016326904e-06, -6.8731606006622314e-06, -6.303191184997559e-06, -5.733221769332886e-06, -5.163252353668213e-06, -4.59328293800354e-06, -4.023313522338867e-06, -3.4533441066741943e-06, -2.8833746910095215e-06, -2.3134052753448486e-06, -1.7434358596801758e-06, -1.173466444015503e-06, -6.034970283508301e-07, -3.3527612686157227e-08, 5.364418029785156e-07, 1.1064112186431885e-06, 1.6763806343078613e-06, 2.246350049972534e-06, 2.816319465637207e-06, 3.38628888130188e-06, 3.956258296966553e-06, 4.526227712631226e-06, 5.0961971282958984e-06, 5.666166543960571e-06, 6.236135959625244e-06, 6.806105375289917e-06, 7.37607479095459e-06, 7.946044206619263e-06, 8.516013622283936e-06, 9.085983037948608e-06, 9.655952453613281e-06, 1.0225921869277954e-05, 1.0795891284942627e-05, 1.13658607006073e-05, 1.1935830116271973e-05, 1.2505799531936646e-05, 1.3075768947601318e-05, 1.3645738363265991e-05, 1.4215707778930664e-05, 1.4785677194595337e-05, 1.535564661026001e-05, 1.5925616025924683e-05, 1.6495585441589355e-05, 1.706555485725403e-05, 1.76355242729187e-05, 1.8205493688583374e-05, 1.8775463104248047e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 13.0, 16.0, 36.0, 54.0, 86.0, 252.0, 995.0, 13498.0, 997796.0, 33814.0, 1510.0, 279.0, 89.0, 45.0, 23.0, 11.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.68408203125, -0.6676445007324219, -0.6512069702148438, -0.6347694396972656, -0.6183319091796875, -0.6018943786621094, -0.5854568481445312, -0.5690193176269531, -0.552581787109375, -0.5361442565917969, -0.5197067260742188, -0.5032691955566406, -0.4868316650390625, -0.4703941345214844, -0.45395660400390625, -0.4375190734863281, -0.42108154296875, -0.4046440124511719, -0.38820648193359375, -0.3717689514160156, -0.3553314208984375, -0.3388938903808594, -0.32245635986328125, -0.3060188293457031, -0.289581298828125, -0.2731437683105469, -0.25670623779296875, -0.24026870727539062, -0.2238311767578125, -0.20739364624023438, -0.19095611572265625, -0.17451858520507812, -0.1580810546875, -0.14164352416992188, -0.12520599365234375, -0.10876846313476562, -0.0923309326171875, -0.07589340209960938, -0.05945587158203125, -0.043018341064453125, -0.026580810546875, -0.010143280029296875, 0.00629425048828125, 0.022731781005859375, 0.0391693115234375, 0.055606842041015625, 0.07204437255859375, 0.08848190307617188, 0.10491943359375, 0.12135696411132812, 0.13779449462890625, 0.15423202514648438, 0.1706695556640625, 0.18710708618164062, 0.20354461669921875, 0.21998214721679688, 0.236419677734375, 0.2528572082519531, 0.26929473876953125, 0.2857322692871094, 0.3021697998046875, 0.3186073303222656, 0.33504486083984375, 0.3514823913574219, 0.367919921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 5.0, 9.0, 9.0, 10.0, 20.0, 20.0, 28.0, 66.0, 129.0, 285.0, 209.0, 92.0, 45.0, 30.0, 11.0, 9.0, 9.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275390625, -0.268951416015625, -0.26251220703125, -0.256072998046875, -0.2496337890625, -0.243194580078125, -0.23675537109375, -0.230316162109375, -0.223876953125, -0.217437744140625, -0.21099853515625, -0.204559326171875, -0.1981201171875, -0.191680908203125, -0.18524169921875, -0.178802490234375, -0.17236328125, -0.165924072265625, -0.15948486328125, -0.153045654296875, -0.1466064453125, -0.140167236328125, -0.13372802734375, -0.127288818359375, -0.120849609375, -0.114410400390625, -0.10797119140625, -0.101531982421875, -0.0950927734375, -0.088653564453125, -0.08221435546875, -0.075775146484375, -0.0693359375, -0.062896728515625, -0.05645751953125, -0.050018310546875, -0.0435791015625, -0.037139892578125, -0.03070068359375, -0.024261474609375, -0.017822265625, -0.011383056640625, -0.00494384765625, 0.001495361328125, 0.0079345703125, 0.014373779296875, 0.02081298828125, 0.027252197265625, 0.03369140625, 0.040130615234375, 0.04656982421875, 0.053009033203125, 0.0594482421875, 0.065887451171875, 0.07232666015625, 0.078765869140625, 0.085205078125, 0.091644287109375, 0.09808349609375, 0.104522705078125, 0.1109619140625, 0.117401123046875, 0.12384033203125, 0.130279541015625, 0.13671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 12.0, 186.0, 814.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9015557765960693, -2.4335384368896484, -1.9655213356018066, -1.4975041151046753, -1.029486894607544, -0.5614697933197021, -0.09345245361328125, 0.37456488609313965, 0.8425819873809814, 1.3105992078781128, 1.7786164283752441, 2.246633529663086, 2.714650869369507, 3.1826679706573486, 3.6506853103637695, 4.1187028884887695, 4.586719512939453, 5.054736614227295, 5.522753715515137, 5.990771293640137, 6.4587883949279785, 6.92680549621582, 7.39482307434082, 7.862840175628662, 8.330857276916504, 8.798874855041504, 9.266891479492188, 9.734909057617188, 10.202926635742188, 10.670943260192871, 11.138960838317871, 11.606977462768555, 12.074995040893555, 12.543012619018555, 13.011029243469238, 13.479046821594238, 13.947063446044922, 14.415081024169922, 14.883098602294922, 15.351116180419922, 15.819132804870605, 16.28714942932129, 16.75516700744629, 17.22318458557129, 17.69120216369629, 18.159217834472656, 18.627235412597656, 19.095252990722656, 19.563270568847656, 20.031288146972656, 20.499305725097656, 20.967321395874023, 21.435338973999023, 21.903356552124023, 22.371374130249023, 22.839391708374023, 23.30740737915039, 23.77542495727539, 24.24344253540039, 24.711458206176758, 25.179475784301758, 25.647493362426758, 26.115510940551758, 26.583528518676758, 27.051546096801758]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 3.0, 26.0, 30.0, 49.0, 59.0, 71.0, 102.0, 96.0, 105.0, 101.0, 94.0, 90.0, 71.0, 40.0, 27.0, 19.0, 9.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.814208984375, -0.7695979475975037, -0.7249868512153625, -0.6803758144378662, -0.6357647180557251, -0.5911536812782288, -0.5465426445007324, -0.5019315481185913, -0.45732051134109497, -0.41270944476127625, -0.3680983781814575, -0.3234873414039612, -0.27887627482414246, -0.23426520824432373, -0.1896541714668274, -0.14504310488700867, -0.10043203830718994, -0.05582097917795181, -0.011209920048713684, 0.03340113162994385, 0.07801219820976257, 0.1226232647895813, 0.16723430156707764, 0.21184536814689636, 0.2564564347267151, 0.3010675013065338, 0.34567856788635254, 0.3902896046638489, 0.4349006712436676, 0.47951173782348633, 0.5241227746009827, 0.568733811378479, 0.6133449077606201, 0.6579559445381165, 0.7025670409202576, 0.7471780776977539, 0.791789174079895, 0.8364002108573914, 0.8810112476348877, 0.9256223440170288, 0.9702333807945251, 1.0148444175720215, 1.0594555139541626, 1.1040666103363037, 1.1486775875091553, 1.1932886838912964, 1.2378997802734375, 1.282510757446289, 1.3271218538284302, 1.3717329502105713, 1.4163439273834229, 1.460955023765564, 1.505566120147705, 1.5501770973205566, 1.5947881937026978, 1.6393992900848389, 1.6840102672576904, 1.7286213636398315, 1.773232340812683, 1.8178434371948242, 1.8624545335769653, 1.9070656299591064, 1.951676607131958, 1.9962877035140991, 2.0408987998962402]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 12.0, 50.0, 265.0, 16782.0, 4175799.0, 907.0, 230.0, 102.0, 59.0, 44.0, 20.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65625, -0.54974365234375, -0.4432373046875, -0.33673095703125, -0.230224609375, -0.12371826171875, -0.0172119140625, 0.08929443359375, 0.19580078125, 0.30230712890625, 0.4088134765625, 0.51531982421875, 0.621826171875, 0.72833251953125, 0.8348388671875, 0.94134521484375, 1.0478515625, 1.15435791015625, 1.2608642578125, 1.36737060546875, 1.473876953125, 1.58038330078125, 1.6868896484375, 1.79339599609375, 1.89990234375, 2.00640869140625, 2.1129150390625, 2.21942138671875, 2.325927734375, 2.43243408203125, 2.5389404296875, 2.64544677734375, 2.751953125, 2.85845947265625, 2.9649658203125, 3.07147216796875, 3.177978515625, 3.28448486328125, 3.3909912109375, 3.49749755859375, 3.60400390625, 3.71051025390625, 3.8170166015625, 3.92352294921875, 4.030029296875, 4.13653564453125, 4.2430419921875, 4.34954833984375, 4.4560546875, 4.56256103515625, 4.6690673828125, 4.77557373046875, 4.882080078125, 4.98858642578125, 5.0950927734375, 5.20159912109375, 5.30810546875, 5.41461181640625, 5.5211181640625, 5.62762451171875, 5.734130859375, 5.84063720703125, 5.9471435546875, 6.05364990234375, 6.16015625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 10.0, 59.0, 141.0, 284.0, 304.0, 157.0, 37.0, 22.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0188446044921875, -0.016173601150512695, -0.01350259780883789, -0.010831594467163086, -0.008160591125488281, -0.0054895877838134766, -0.002818584442138672, -0.0001475811004638672, 0.0025234222412109375, 0.005194425582885742, 0.007865428924560547, 0.010536432266235352, 0.013207435607910156, 0.01587843894958496, 0.018549442291259766, 0.02122044563293457, 0.023891448974609375, 0.02656245231628418, 0.029233455657958984, 0.03190445899963379, 0.034575462341308594, 0.0372464656829834, 0.0399174690246582, 0.04258847236633301, 0.04525947570800781, 0.04793047904968262, 0.05060148239135742, 0.05327248573303223, 0.05594348907470703, 0.058614492416381836, 0.06128549575805664, 0.06395649909973145, 0.06662750244140625, 0.06929850578308105, 0.07196950912475586, 0.07464051246643066, 0.07731151580810547, 0.07998251914978027, 0.08265352249145508, 0.08532452583312988, 0.08799552917480469, 0.09066653251647949, 0.0933375358581543, 0.0960085391998291, 0.0986795425415039, 0.10135054588317871, 0.10402154922485352, 0.10669255256652832, 0.10936355590820312, 0.11203455924987793, 0.11470556259155273, 0.11737656593322754, 0.12004756927490234, 0.12271857261657715, 0.12538957595825195, 0.12806057929992676, 0.13073158264160156, 0.13340258598327637, 0.13607358932495117, 0.13874459266662598, 0.14141559600830078, 0.14408659934997559, 0.1467576026916504, 0.1494286060333252, 0.152099609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 23.0, 62.0, 92.0, 120.0, 219.0, 497.0, 96348.0, 4095591.0, 537.0, 247.0, 170.0, 132.0, 76.0, 57.0, 39.0, 33.0, 8.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.326385498046875, -3.18206787109375, -3.037750244140625, -2.8934326171875, -2.749114990234375, -2.60479736328125, -2.460479736328125, -2.316162109375, -2.171844482421875, -2.02752685546875, -1.883209228515625, -1.7388916015625, -1.594573974609375, -1.45025634765625, -1.305938720703125, -1.16162109375, -1.017303466796875, -0.87298583984375, -0.728668212890625, -0.5843505859375, -0.440032958984375, -0.29571533203125, -0.151397705078125, -0.007080078125, 0.137237548828125, 0.28155517578125, 0.425872802734375, 0.5701904296875, 0.714508056640625, 0.85882568359375, 1.003143310546875, 1.1474609375, 1.291778564453125, 1.43609619140625, 1.580413818359375, 1.7247314453125, 1.869049072265625, 2.01336669921875, 2.157684326171875, 2.302001953125, 2.446319580078125, 2.59063720703125, 2.734954833984375, 2.8792724609375, 3.023590087890625, 3.16790771484375, 3.312225341796875, 3.45654296875, 3.600860595703125, 3.74517822265625, 3.889495849609375, 4.0338134765625, 4.178131103515625, 4.32244873046875, 4.466766357421875, 4.611083984375, 4.755401611328125, 4.89971923828125, 5.044036865234375, 5.1883544921875, 5.332672119140625, 5.47698974609375, 5.621307373046875, 5.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 24.0, 131.0, 3686.0, 226.0, 10.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12420654296875, -0.10988330841064453, -0.09556007385253906, -0.0812368392944336, -0.06691360473632812, -0.052590370178222656, -0.03826713562011719, -0.02394390106201172, -0.00962066650390625, 0.004702568054199219, 0.019025802612304688, 0.033349037170410156, 0.047672271728515625, 0.061995506286621094, 0.07631874084472656, 0.09064197540283203, 0.1049652099609375, 0.11928844451904297, 0.13361167907714844, 0.1479349136352539, 0.16225814819335938, 0.17658138275146484, 0.1909046173095703, 0.20522785186767578, 0.21955108642578125, 0.23387432098388672, 0.2481975555419922, 0.26252079010009766, 0.2768440246582031, 0.2911672592163086, 0.30549049377441406, 0.31981372833251953, 0.334136962890625, 0.34846019744873047, 0.36278343200683594, 0.3771066665649414, 0.3914299011230469, 0.40575313568115234, 0.4200763702392578, 0.4343996047973633, 0.44872283935546875, 0.4630460739135742, 0.4773693084716797, 0.49169254302978516, 0.5060157775878906, 0.5203390121459961, 0.5346622467041016, 0.548985481262207, 0.5633087158203125, 0.577631950378418, 0.5919551849365234, 0.6062784194946289, 0.6206016540527344, 0.6349248886108398, 0.6492481231689453, 0.6635713577270508, 0.6778945922851562, 0.6922178268432617, 0.7065410614013672, 0.7208642959594727, 0.7351875305175781, 0.7495107650756836, 0.7638339996337891, 0.7781572341918945, 0.79248046875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 12.0, 55.0, 476.0, 428.0, 32.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884055137634277, -0.9903718829154968, -0.7923382520675659, -0.594304621219635, -0.3962709903717041, -0.1982373595237732, -0.00020372867584228516, 0.1978299617767334, 0.39586353302001953, 0.5938971638679504, 0.7919307947158813, 0.9899644255638123, 1.1879980564117432, 1.3860316276550293, 1.584065318107605, 1.7820990085601807, 1.9801325798034668, 2.178166151046753, 2.376199722290039, 2.5742335319519043, 2.7722671031951904, 2.9703006744384766, 3.168334484100342, 3.366368055343628, 3.564401626586914, 3.7624351978302, 3.9604687690734863, 4.158502578735352, 4.356535911560059, 4.554569721221924, 4.752603530883789, 4.950636863708496, 5.148670196533203, 5.346704006195068, 5.544737339019775, 5.742771148681641, 5.940804481506348, 6.138838291168213, 6.336872100830078, 6.534905433654785, 6.73293924331665, 6.930973052978516, 7.129006385803223, 7.327040195465088, 7.525074005126953, 7.72310733795166, 7.921141147613525, 8.11917495727539, 8.317208290100098, 8.515241622924805, 8.713275909423828, 8.911309242248535, 9.109342575073242, 9.307376861572266, 9.505410194396973, 9.70344352722168, 9.901477813720703, 10.09951114654541, 10.297545433044434, 10.49557876586914, 10.693612098693848, 10.891646385192871, 11.089679718017578, 11.287713050842285, 11.485746383666992]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 14.0, 17.0, 65.0, 80.0, 96.0, 150.0, 169.0, 143.0, 105.0, 74.0, 39.0, 25.0, 13.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661320686340332, -2.579507827758789, -2.497695207595825, -2.4158823490142822, -2.3340697288513184, -2.2522568702697754, -2.1704442501068115, -2.0886313915252686, -2.0068187713623047, -1.9250060319900513, -1.8431932926177979, -1.7613805532455444, -1.679567813873291, -1.597754955291748, -1.5159422159194946, -1.4341294765472412, -1.3523166179656982, -1.2705038785934448, -1.1886911392211914, -1.106878399848938, -1.0250656604766846, -0.9432528614997864, -0.8614400625228882, -0.7796273231506348, -0.6978145837783813, -0.6160018444061279, -0.5341891050338745, -0.4523763060569763, -0.3705635666847229, -0.2887508273124695, -0.20693805813789368, -0.12512528896331787, -0.04331254959106445, 0.03850020468235016, 0.12031295895576477, 0.20212571322917938, 0.283938467502594, 0.3657512068748474, 0.4475639760494232, 0.529376745223999, 0.6111894845962524, 0.6930022239685059, 0.7748149633407593, 0.8566277623176575, 0.9384405016899109, 1.0202531814575195, 1.1020660400390625, 1.183878779411316, 1.2656915187835693, 1.3475042581558228, 1.4293169975280762, 1.5111297369003296, 1.592942476272583, 1.674755334854126, 1.7565680742263794, 1.8383808135986328, 1.9201935529708862, 2.0020062923431396, 2.0838191509246826, 2.1656317710876465, 2.2474446296691895, 2.3292572498321533, 2.4110701084136963, 2.49288272857666, 2.574695587158203]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 8.0, 16.0, 26.0, 18.0, 22.0, 41.0, 69.0, 97.0, 235.0, 468.0, 1264.0, 4637.0, 54883.0, 909519.0, 69523.0, 5327.0, 1327.0, 508.0, 231.0, 102.0, 76.0, 38.0, 28.0, 20.0, 19.0, 12.0, 15.0, 7.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1123046875, -1.07464599609375, -1.0369873046875, -0.99932861328125, -0.961669921875, -0.92401123046875, -0.8863525390625, -0.84869384765625, -0.81103515625, -0.77337646484375, -0.7357177734375, -0.69805908203125, -0.660400390625, -0.62274169921875, -0.5850830078125, -0.54742431640625, -0.509765625, -0.47210693359375, -0.4344482421875, -0.39678955078125, -0.359130859375, -0.32147216796875, -0.2838134765625, -0.24615478515625, -0.20849609375, -0.17083740234375, -0.1331787109375, -0.09552001953125, -0.057861328125, -0.02020263671875, 0.0174560546875, 0.05511474609375, 0.0927734375, 0.13043212890625, 0.1680908203125, 0.20574951171875, 0.243408203125, 0.28106689453125, 0.3187255859375, 0.35638427734375, 0.39404296875, 0.43170166015625, 0.4693603515625, 0.50701904296875, 0.544677734375, 0.58233642578125, 0.6199951171875, 0.65765380859375, 0.6953125, 0.73297119140625, 0.7706298828125, 0.80828857421875, 0.845947265625, 0.88360595703125, 0.9212646484375, 0.95892333984375, 0.99658203125, 1.03424072265625, 1.0718994140625, 1.10955810546875, 1.147216796875, 1.18487548828125, 1.2225341796875, 1.26019287109375, 1.2978515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 14.0, 33.0, 49.0, 86.0, 128.0, 190.0, 162.0, 136.0, 94.0, 56.0, 34.0, 14.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.101806640625, -0.09648704528808594, -0.09116744995117188, -0.08584785461425781, -0.08052825927734375, -0.07520866394042969, -0.06988906860351562, -0.06456947326660156, -0.0592498779296875, -0.05393028259277344, -0.048610687255859375, -0.04329109191894531, -0.03797149658203125, -0.03265190124511719, -0.027332305908203125, -0.022012710571289062, -0.016693115234375, -0.011373519897460938, -0.006053924560546875, -0.0007343292236328125, 0.00458526611328125, 0.009904861450195312, 0.015224456787109375, 0.020544052124023438, 0.0258636474609375, 0.031183242797851562, 0.036502838134765625, 0.04182243347167969, 0.04714202880859375, 0.05246162414550781, 0.057781219482421875, 0.06310081481933594, 0.06842041015625, 0.07374000549316406, 0.07905960083007812, 0.08437919616699219, 0.08969879150390625, 0.09501838684082031, 0.10033798217773438, 0.10565757751464844, 0.1109771728515625, 0.11629676818847656, 0.12161636352539062, 0.1269359588623047, 0.13225555419921875, 0.1375751495361328, 0.14289474487304688, 0.14821434020996094, 0.153533935546875, 0.15885353088378906, 0.16417312622070312, 0.1694927215576172, 0.17481231689453125, 0.1801319122314453, 0.18545150756835938, 0.19077110290527344, 0.1960906982421875, 0.20141029357910156, 0.20672988891601562, 0.2120494842529297, 0.21736907958984375, 0.2226886749267578, 0.22800827026367188, 0.23332786560058594, 0.2386474609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 13.0, 24.0, 20.0, 42.0, 60.0, 80.0, 163.0, 395.0, 1140.0, 4874.0, 36280.0, 717816.0, 265930.0, 17211.0, 2912.0, 836.0, 320.0, 139.0, 83.0, 59.0, 26.0, 22.0, 20.0, 22.0, 7.0, 2.0, 11.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5893630981445312, -0.5673980712890625, -0.5454330444335938, -0.523468017578125, -0.5015029907226562, -0.4795379638671875, -0.45757293701171875, -0.43560791015625, -0.41364288330078125, -0.3916778564453125, -0.36971282958984375, -0.347747802734375, -0.32578277587890625, -0.3038177490234375, -0.28185272216796875, -0.2598876953125, -0.23792266845703125, -0.2159576416015625, -0.19399261474609375, -0.172027587890625, -0.15006256103515625, -0.1280975341796875, -0.10613250732421875, -0.08416748046875, -0.06220245361328125, -0.0402374267578125, -0.01827239990234375, 0.003692626953125, 0.02565765380859375, 0.0476226806640625, 0.06958770751953125, 0.091552734375, 0.11351776123046875, 0.1354827880859375, 0.15744781494140625, 0.179412841796875, 0.20137786865234375, 0.2233428955078125, 0.24530792236328125, 0.26727294921875, 0.28923797607421875, 0.3112030029296875, 0.33316802978515625, 0.355133056640625, 0.37709808349609375, 0.3990631103515625, 0.42102813720703125, 0.4429931640625, 0.46495819091796875, 0.4869232177734375, 0.5088882446289062, 0.530853271484375, 0.5528182983398438, 0.5747833251953125, 0.5967483520507812, 0.61871337890625, 0.6406784057617188, 0.6626434326171875, 0.6846084594726562, 0.706573486328125, 0.7285385131835938, 0.7505035400390625, 0.7724685668945312, 0.79443359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 16.0, 17.0, 14.0, 26.0, 28.0, 26.0, 30.0, 52.0, 47.0, 64.0, 69.0, 52.0, 60.0, 66.0, 66.0, 61.0, 51.0, 47.0, 44.0, 26.0, 27.0, 20.0, 16.0, 10.0, 7.0, 8.0, 6.0, 10.0, 1.0, 5.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.27091217041015625, -0.2613067626953125, -0.25170135498046875, -0.242095947265625, -0.23249053955078125, -0.2228851318359375, -0.21327972412109375, -0.20367431640625, -0.19406890869140625, -0.1844635009765625, -0.17485809326171875, -0.165252685546875, -0.15564727783203125, -0.1460418701171875, -0.13643646240234375, -0.1268310546875, -0.11722564697265625, -0.1076202392578125, -0.09801483154296875, -0.088409423828125, -0.07880401611328125, -0.0691986083984375, -0.05959320068359375, -0.04998779296875, -0.04038238525390625, -0.0307769775390625, -0.02117156982421875, -0.011566162109375, -0.00196075439453125, 0.0076446533203125, 0.01725006103515625, 0.02685546875, 0.03646087646484375, 0.0460662841796875, 0.05567169189453125, 0.065277099609375, 0.07488250732421875, 0.0844879150390625, 0.09409332275390625, 0.10369873046875, 0.11330413818359375, 0.1229095458984375, 0.13251495361328125, 0.142120361328125, 0.15172576904296875, 0.1613311767578125, 0.17093658447265625, 0.1805419921875, 0.19014739990234375, 0.1997528076171875, 0.20935821533203125, 0.218963623046875, 0.22856903076171875, 0.2381744384765625, 0.24777984619140625, 0.25738525390625, 0.26699066162109375, 0.2765960693359375, 0.28620147705078125, 0.295806884765625, 0.30541229248046875, 0.3150177001953125, 0.32462310791015625, 0.334228515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 26.0, 55.0, 121.0, 357.0, 1336.0, 11917.0, 968466.0, 62416.0, 2901.0, 593.0, 201.0, 75.0, 35.0, 21.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.451416015625, -0.4331474304199219, -0.41487884521484375, -0.3966102600097656, -0.3783416748046875, -0.3600730895996094, -0.34180450439453125, -0.3235359191894531, -0.305267333984375, -0.2869987487792969, -0.26873016357421875, -0.2504615783691406, -0.2321929931640625, -0.21392440795898438, -0.19565582275390625, -0.17738723754882812, -0.15911865234375, -0.14085006713867188, -0.12258148193359375, -0.10431289672851562, -0.0860443115234375, -0.06777572631835938, -0.04950714111328125, -0.031238555908203125, -0.012969970703125, 0.005298614501953125, 0.02356719970703125, 0.041835784912109375, 0.0601043701171875, 0.07837295532226562, 0.09664154052734375, 0.11491012573242188, 0.1331787109375, 0.15144729614257812, 0.16971588134765625, 0.18798446655273438, 0.2062530517578125, 0.22452163696289062, 0.24279022216796875, 0.2610588073730469, 0.279327392578125, 0.2975959777832031, 0.31586456298828125, 0.3341331481933594, 0.3524017333984375, 0.3706703186035156, 0.38893890380859375, 0.4072074890136719, 0.42547607421875, 0.4437446594238281, 0.46201324462890625, 0.4802818298339844, 0.4985504150390625, 0.5168190002441406, 0.5350875854492188, 0.5533561706542969, 0.571624755859375, 0.5898933410644531, 0.6081619262695312, 0.6264305114746094, 0.6446990966796875, 0.6629676818847656, 0.6812362670898438, 0.6995048522949219, 0.7177734375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 10.0, 18.0, 12.0, 24.0, 21.0, 34.0, 53.0, 58.0, 82.0, 88.0, 97.0, 103.0, 87.0, 78.0, 59.0, 47.0, 38.0, 17.0, 19.0, 16.0, 9.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.823902130126953e-05, -1.7666257917881012e-05, -1.7093494534492493e-05, -1.6520731151103973e-05, -1.5947967767715454e-05, -1.5375204384326935e-05, -1.4802441000938416e-05, -1.4229677617549896e-05, -1.3656914234161377e-05, -1.3084150850772858e-05, -1.2511387467384338e-05, -1.1938624083995819e-05, -1.13658607006073e-05, -1.079309731721878e-05, -1.0220333933830261e-05, -9.647570550441742e-06, -9.074807167053223e-06, -8.502043783664703e-06, -7.929280400276184e-06, -7.356517016887665e-06, -6.7837536334991455e-06, -6.210990250110626e-06, -5.638226866722107e-06, -5.065463483333588e-06, -4.492700099945068e-06, -3.919936716556549e-06, -3.3471733331680298e-06, -2.7744099497795105e-06, -2.201646566390991e-06, -1.628883183002472e-06, -1.0561197996139526e-06, -4.833564162254333e-07, 8.940696716308594e-08, 6.621703505516052e-07, 1.2349337339401245e-06, 1.8076971173286438e-06, 2.380460500717163e-06, 2.9532238841056824e-06, 3.5259872674942017e-06, 4.098750650882721e-06, 4.67151403427124e-06, 5.2442774176597595e-06, 5.817040801048279e-06, 6.389804184436798e-06, 6.962567567825317e-06, 7.535330951213837e-06, 8.108094334602356e-06, 8.680857717990875e-06, 9.253621101379395e-06, 9.826384484767914e-06, 1.0399147868156433e-05, 1.0971911251544952e-05, 1.1544674634933472e-05, 1.2117438018321991e-05, 1.269020140171051e-05, 1.326296478509903e-05, 1.3835728168487549e-05, 1.4408491551876068e-05, 1.4981254935264587e-05, 1.5554018318653107e-05, 1.6126781702041626e-05, 1.6699545085430145e-05, 1.7272308468818665e-05, 1.7845071852207184e-05, 1.8417835235595703e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 11.0, 20.0, 13.0, 29.0, 56.0, 104.0, 183.0, 574.0, 2249.0, 35003.0, 977870.0, 29338.0, 2050.0, 544.0, 235.0, 105.0, 59.0, 36.0, 23.0, 12.0, 15.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34326171875, -0.3297882080078125, -0.316314697265625, -0.3028411865234375, -0.28936767578125, -0.2758941650390625, -0.262420654296875, -0.2489471435546875, -0.2354736328125, -0.2220001220703125, -0.208526611328125, -0.1950531005859375, -0.18157958984375, -0.1681060791015625, -0.154632568359375, -0.1411590576171875, -0.127685546875, -0.1142120361328125, -0.100738525390625, -0.0872650146484375, -0.07379150390625, -0.0603179931640625, -0.046844482421875, -0.0333709716796875, -0.0198974609375, -0.0064239501953125, 0.007049560546875, 0.0205230712890625, 0.03399658203125, 0.0474700927734375, 0.060943603515625, 0.0744171142578125, 0.087890625, 0.1013641357421875, 0.114837646484375, 0.1283111572265625, 0.14178466796875, 0.1552581787109375, 0.168731689453125, 0.1822052001953125, 0.1956787109375, 0.2091522216796875, 0.222625732421875, 0.2360992431640625, 0.24957275390625, 0.2630462646484375, 0.276519775390625, 0.2899932861328125, 0.303466796875, 0.3169403076171875, 0.330413818359375, 0.3438873291015625, 0.35736083984375, 0.3708343505859375, 0.384307861328125, 0.3977813720703125, 0.4112548828125, 0.4247283935546875, 0.438201904296875, 0.4516754150390625, 0.46514892578125, 0.4786224365234375, 0.492095947265625, 0.5055694580078125, 0.51904296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 12.0, 20.0, 16.0, 32.0, 60.0, 96.0, 155.0, 183.0, 140.0, 90.0, 57.0, 35.0, 31.0, 12.0, 12.0, 16.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10589599609375, -0.10045719146728516, -0.09501838684082031, -0.08957958221435547, -0.08414077758789062, -0.07870197296142578, -0.07326316833496094, -0.0678243637084961, -0.06238555908203125, -0.056946754455566406, -0.05150794982910156, -0.04606914520263672, -0.040630340576171875, -0.03519153594970703, -0.029752731323242188, -0.024313926696777344, -0.0188751220703125, -0.013436317443847656, -0.007997512817382812, -0.0025587081909179688, 0.002880096435546875, 0.008318901062011719, 0.013757705688476562, 0.019196510314941406, 0.02463531494140625, 0.030074119567871094, 0.03551292419433594, 0.04095172882080078, 0.046390533447265625, 0.05182933807373047, 0.05726814270019531, 0.06270694732666016, 0.068145751953125, 0.07358455657958984, 0.07902336120605469, 0.08446216583251953, 0.08990097045898438, 0.09533977508544922, 0.10077857971191406, 0.1062173843383789, 0.11165618896484375, 0.1170949935913086, 0.12253379821777344, 0.12797260284423828, 0.13341140747070312, 0.13885021209716797, 0.1442890167236328, 0.14972782135009766, 0.1551666259765625, 0.16060543060302734, 0.1660442352294922, 0.17148303985595703, 0.17692184448242188, 0.18236064910888672, 0.18779945373535156, 0.1932382583618164, 0.19867706298828125, 0.2041158676147461, 0.20955467224121094, 0.21499347686767578, 0.22043228149414062, 0.22587108612060547, 0.2313098907470703, 0.23674869537353516, 0.2421875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 54.0, 904.0, 54.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.636589050292969, -8.08128833770752, -7.525986671447754, -6.970685958862305, -6.415384292602539, -5.86008358001709, -5.304782390594482, -4.749481201171875, -4.194180011749268, -3.63887882232666, -3.0835776329040527, -2.5282766819000244, -1.972975492477417, -1.4176743030548096, -0.8623733520507812, -0.30707216262817383, 0.2482290267944336, 0.8035301566123962, 1.3588312864303589, 1.9141323566436768, 2.469433546066284, 3.0247347354888916, 3.58003568649292, 4.135336875915527, 4.690638065338135, 5.245939254760742, 5.80124044418335, 6.356541633605957, 6.911842346191406, 7.467144012451172, 8.022444725036621, 8.57774543762207, 9.133047103881836, 9.688347816467285, 10.24364948272705, 10.7989501953125, 11.354251861572266, 11.909552574157715, 12.464853286743164, 13.02015495300293, 13.575456619262695, 14.130757331848145, 14.68605899810791, 15.24135971069336, 15.796661376953125, 16.35196304321289, 16.907262802124023, 17.46256446838379, 18.017864227294922, 18.573165893554688, 19.12846565246582, 19.683767318725586, 20.23906898498535, 20.794370651245117, 21.34967041015625, 21.904972076416016, 22.46027374267578, 23.015575408935547, 23.57087516784668, 24.126176834106445, 24.68147850036621, 25.236780166625977, 25.79207992553711, 26.347381591796875, 26.90268325805664]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 9.0, 11.0, 8.0, 17.0, 23.0, 28.0, 42.0, 41.0, 41.0, 61.0, 64.0, 62.0, 69.0, 61.0, 62.0, 57.0, 59.0, 49.0, 57.0, 47.0, 35.0, 21.0, 19.0, 19.0, 6.0, 8.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1347343921661377, -2.068380117416382, -2.002025604248047, -1.9356712102890015, -1.869316816329956, -1.8029624223709106, -1.7366080284118652, -1.6702537536621094, -1.6038992404937744, -1.537544846534729, -1.4711904525756836, -1.4048360586166382, -1.3384816646575928, -1.2721272706985474, -1.205772876739502, -1.139418601989746, -1.0730642080307007, -1.0067098140716553, -0.9403554201126099, -0.8740010261535645, -0.807646632194519, -0.7412922382354736, -0.674937903881073, -0.6085835099220276, -0.5422291159629822, -0.47587472200393677, -0.40952032804489136, -0.34316596388816833, -0.2768115699291229, -0.21045717597007751, -0.1441028118133545, -0.07774841785430908, -0.011394023895263672, 0.05496036261320114, 0.12131474912166595, 0.18766912817955017, 0.2540235221385956, 0.320377916097641, 0.386732280254364, 0.4530866742134094, 0.5194410681724548, 0.5857954621315002, 0.6521498560905457, 0.7185041904449463, 0.7848585844039917, 0.8512129783630371, 0.9175673723220825, 0.9839217662811279, 1.0502761602401733, 1.1166305541992188, 1.1829849481582642, 1.2493393421173096, 1.315693736076355, 1.3820481300354004, 1.4484024047851562, 1.5147569179534912, 1.581111192703247, 1.6474655866622925, 1.713819980621338, 1.7801743745803833, 1.8465287685394287, 1.9128831624984741, 1.9792375564575195, 2.0455918312072754, 2.1119463443756104]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 3.0, 4.0, 11.0, 14.0, 35.0, 107.0, 196.0, 504.0, 1500.0, 5215.0, 22996.0, 585576.0, 3537854.0, 30744.0, 6015.0, 1758.0, 721.0, 362.0, 205.0, 127.0, 67.0, 58.0, 40.0, 36.0, 21.0, 15.0, 13.0, 13.0, 9.0, 8.0, 8.0, 13.0, 9.0, 9.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.41082000732421875, -0.3768157958984375, -0.34281158447265625, -0.308807373046875, -0.27480316162109375, -0.2407989501953125, -0.20679473876953125, -0.17279052734375, -0.13878631591796875, -0.1047821044921875, -0.07077789306640625, -0.036773681640625, -0.00276947021484375, 0.0312347412109375, 0.06523895263671875, 0.0992431640625, 0.13324737548828125, 0.1672515869140625, 0.20125579833984375, 0.235260009765625, 0.26926422119140625, 0.3032684326171875, 0.33727264404296875, 0.37127685546875, 0.40528106689453125, 0.4392852783203125, 0.47328948974609375, 0.507293701171875, 0.5412979125976562, 0.5753021240234375, 0.6093063354492188, 0.643310546875, 0.6773147583007812, 0.7113189697265625, 0.7453231811523438, 0.779327392578125, 0.8133316040039062, 0.8473358154296875, 0.8813400268554688, 0.91534423828125, 0.9493484497070312, 0.9833526611328125, 1.0173568725585938, 1.051361083984375, 1.0853652954101562, 1.1193695068359375, 1.1533737182617188, 1.1873779296875, 1.2213821411132812, 1.2553863525390625, 1.2893905639648438, 1.323394775390625, 1.3573989868164062, 1.3914031982421875, 1.4254074096679688, 1.45941162109375, 1.4934158325195312, 1.5274200439453125, 1.5614242553710938, 1.595428466796875, 1.6294326782226562, 1.6634368896484375, 1.6974411010742188, 1.7314453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 14.0, 21.0, 29.0, 49.0, 61.0, 116.0, 129.0, 154.0, 123.0, 104.0, 77.0, 60.0, 31.0, 14.0, 11.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06976318359375, -0.0649557113647461, -0.06014823913574219, -0.05534076690673828, -0.050533294677734375, -0.04572582244873047, -0.04091835021972656, -0.036110877990722656, -0.03130340576171875, -0.026495933532714844, -0.021688461303710938, -0.01688098907470703, -0.012073516845703125, -0.007266044616699219, -0.0024585723876953125, 0.0023488998413085938, 0.0071563720703125, 0.011963844299316406, 0.016771316528320312, 0.02157878875732422, 0.026386260986328125, 0.03119373321533203, 0.03600120544433594, 0.040808677673339844, 0.04561614990234375, 0.050423622131347656, 0.05523109436035156, 0.06003856658935547, 0.06484603881835938, 0.06965351104736328, 0.07446098327636719, 0.0792684555053711, 0.084075927734375, 0.0888833999633789, 0.09369087219238281, 0.09849834442138672, 0.10330581665039062, 0.10811328887939453, 0.11292076110839844, 0.11772823333740234, 0.12253570556640625, 0.12734317779541016, 0.13215065002441406, 0.13695812225341797, 0.14176559448242188, 0.14657306671142578, 0.1513805389404297, 0.1561880111694336, 0.1609954833984375, 0.1658029556274414, 0.1706104278564453, 0.17541790008544922, 0.18022537231445312, 0.18503284454345703, 0.18984031677246094, 0.19464778900146484, 0.19945526123046875, 0.20426273345947266, 0.20907020568847656, 0.21387767791748047, 0.21868515014648438, 0.22349262237548828, 0.2283000946044922, 0.2331075668334961, 0.2379150390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 12.0, 19.0, 46.0, 113.0, 586.0, 4132447.0, 59990.0, 702.0, 224.0, 73.0, 41.0, 24.0, 12.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.837158203125, -3.59619140625, -3.355224609375, -3.1142578125, -2.873291015625, -2.63232421875, -2.391357421875, -2.150390625, -1.909423828125, -1.66845703125, -1.427490234375, -1.1865234375, -0.945556640625, -0.70458984375, -0.463623046875, -0.22265625, 0.018310546875, 0.25927734375, 0.500244140625, 0.7412109375, 0.982177734375, 1.22314453125, 1.464111328125, 1.705078125, 1.946044921875, 2.18701171875, 2.427978515625, 2.6689453125, 2.909912109375, 3.15087890625, 3.391845703125, 3.6328125, 3.873779296875, 4.11474609375, 4.355712890625, 4.5966796875, 4.837646484375, 5.07861328125, 5.319580078125, 5.560546875, 5.801513671875, 6.04248046875, 6.283447265625, 6.5244140625, 6.765380859375, 7.00634765625, 7.247314453125, 7.48828125, 7.729248046875, 7.97021484375, 8.211181640625, 8.4521484375, 8.693115234375, 8.93408203125, 9.175048828125, 9.416015625, 9.656982421875, 9.89794921875, 10.138916015625, 10.3798828125, 10.620849609375, 10.86181640625, 11.102783203125, 11.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 10.0, 28.0, 117.0, 3439.0, 402.0, 54.0, 17.0, 11.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1568603515625, -0.13651084899902344, -0.11616134643554688, -0.09581184387207031, -0.07546234130859375, -0.05511283874511719, -0.034763336181640625, -0.014413833618164062, 0.0059356689453125, 0.026285171508789062, 0.046634674072265625, 0.06698417663574219, 0.08733367919921875, 0.10768318176269531, 0.12803268432617188, 0.14838218688964844, 0.168731689453125, 0.18908119201660156, 0.20943069458007812, 0.2297801971435547, 0.25012969970703125, 0.2704792022705078, 0.2908287048339844, 0.31117820739746094, 0.3315277099609375, 0.35187721252441406, 0.3722267150878906, 0.3925762176513672, 0.41292572021484375, 0.4332752227783203, 0.4536247253417969, 0.47397422790527344, 0.49432373046875, 0.5146732330322266, 0.5350227355957031, 0.5553722381591797, 0.5757217407226562, 0.5960712432861328, 0.6164207458496094, 0.6367702484130859, 0.6571197509765625, 0.6774692535400391, 0.6978187561035156, 0.7181682586669922, 0.7385177612304688, 0.7588672637939453, 0.7792167663574219, 0.7995662689208984, 0.819915771484375, 0.8402652740478516, 0.8606147766113281, 0.8809642791748047, 0.9013137817382812, 0.9216632843017578, 0.9420127868652344, 0.9623622894287109, 0.9827117919921875, 1.003061294555664, 1.0234107971191406, 1.0437602996826172, 1.0641098022460938, 1.0844593048095703, 1.1048088073730469, 1.1251583099365234, 1.1455078125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 19.0, 206.0, 676.0, 69.0, 15.0, 6.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.629086971282959, -5.429607391357422, -5.230128288269043, -5.030648708343506, -4.831169128417969, -4.63169002532959, -4.432210445404053, -4.232730865478516, -4.033251762390137, -3.8337724208831787, -3.6342928409576416, -3.4348134994506836, -3.2353339195251465, -3.0358545780181885, -2.8363752365112305, -2.6368956565856934, -2.4374160766601562, -2.2379367351531982, -2.038457155227661, -1.8389778137207031, -1.6394983530044556, -1.440018892288208, -1.24053955078125, -1.0410600900650024, -0.8415806293487549, -0.6421011686325073, -0.44262176752090454, -0.24314236640930176, -0.0436629056930542, 0.15581655502319336, 0.35529589653015137, 0.5547753572463989, 0.7542543411254883, 0.9537338018417358, 1.1532132625579834, 1.3526926040649414, 1.552172064781189, 1.7516515254974365, 1.9511308670043945, 2.1506104469299316, 2.3500897884368896, 2.5495691299438477, 2.7490487098693848, 2.9485280513763428, 3.148007392883301, 3.347486972808838, 3.546966314315796, 3.746445655822754, 3.945925235748291, 4.145404815673828, 4.344883918762207, 4.544363498687744, 4.743843078613281, 4.94332218170166, 5.142801761627197, 5.342281341552734, 5.541760444641113, 5.74124002456665, 5.940719127655029, 6.140198707580566, 6.3396782875061035, 6.539157867431641, 6.7386369705200195, 6.938116550445557, 7.137596130371094]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 14.0, 26.0, 33.0, 57.0, 72.0, 79.0, 84.0, 97.0, 101.0, 122.0, 78.0, 62.0, 49.0, 48.0, 37.0, 10.0, 13.0, 6.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9486967325210571, -1.88349449634552, -1.818292260169983, -1.7530900239944458, -1.6878877878189087, -1.6226855516433716, -1.557483434677124, -1.492281198501587, -1.4270789623260498, -1.3618767261505127, -1.2966744899749756, -1.2314722537994385, -1.1662700176239014, -1.1010677814483643, -1.0358655452728271, -0.9706633687019348, -0.9054610729217529, -0.8402588367462158, -0.7750566005706787, -0.7098543643951416, -0.6446521282196045, -0.5794498920440674, -0.514247715473175, -0.44904547929763794, -0.38384324312210083, -0.3186410069465637, -0.2534387707710266, -0.1882365643978119, -0.12303432822227478, -0.05783209204673767, 0.007370114326477051, 0.07257235050201416, 0.13777470588684082, 0.20297694206237793, 0.26817917823791504, 0.33338138461112976, 0.39858362078666687, 0.463785856962204, 0.5289880633354187, 0.5941902995109558, 0.6593925356864929, 0.72459477186203, 0.7897970080375671, 0.8549991846084595, 0.9202014207839966, 0.9854036569595337, 1.0506058931350708, 1.115808129310608, 1.181010365486145, 1.2462126016616821, 1.3114148378372192, 1.3766170740127563, 1.4418193101882935, 1.5070215463638306, 1.5722236633300781, 1.6374258995056152, 1.7026281356811523, 1.7678303718566895, 1.8330326080322266, 1.8982348442077637, 1.9634370803833008, 2.028639316558838, 2.093841552734375, 2.159043788909912, 2.224246025085449]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 5.0, 10.0, 19.0, 21.0, 22.0, 27.0, 42.0, 50.0, 73.0, 102.0, 134.0, 194.0, 347.0, 654.0, 1207.0, 2839.0, 8151.0, 32208.0, 192188.0, 667237.0, 110906.0, 21350.0, 5985.0, 2221.0, 995.0, 519.0, 307.0, 222.0, 144.0, 103.0, 68.0, 59.0, 31.0, 27.0, 11.0, 13.0, 9.0, 5.0, 9.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.697265625, -0.6743011474609375, -0.651336669921875, -0.6283721923828125, -0.60540771484375, -0.5824432373046875, -0.559478759765625, -0.5365142822265625, -0.5135498046875, -0.4905853271484375, -0.467620849609375, -0.4446563720703125, -0.42169189453125, -0.3987274169921875, -0.375762939453125, -0.3527984619140625, -0.329833984375, -0.3068695068359375, -0.283905029296875, -0.2609405517578125, -0.23797607421875, -0.2150115966796875, -0.192047119140625, -0.1690826416015625, -0.1461181640625, -0.1231536865234375, -0.100189208984375, -0.0772247314453125, -0.05426025390625, -0.0312957763671875, -0.008331298828125, 0.0146331787109375, 0.03759765625, 0.0605621337890625, 0.083526611328125, 0.1064910888671875, 0.12945556640625, 0.1524200439453125, 0.175384521484375, 0.1983489990234375, 0.2213134765625, 0.2442779541015625, 0.267242431640625, 0.2902069091796875, 0.31317138671875, 0.3361358642578125, 0.359100341796875, 0.3820648193359375, 0.405029296875, 0.4279937744140625, 0.450958251953125, 0.4739227294921875, 0.49688720703125, 0.5198516845703125, 0.542816162109375, 0.5657806396484375, 0.5887451171875, 0.6117095947265625, 0.634674072265625, 0.6576385498046875, 0.68060302734375, 0.7035675048828125, 0.726531982421875, 0.7494964599609375, 0.7724609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 6.0, 12.0, 18.0, 31.0, 31.0, 66.0, 64.0, 87.0, 91.0, 101.0, 106.0, 94.0, 72.0, 68.0, 44.0, 44.0, 34.0, 13.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12078857421875, -0.11504077911376953, -0.10929298400878906, -0.1035451889038086, -0.09779739379882812, -0.09204959869384766, -0.08630180358886719, -0.08055400848388672, -0.07480621337890625, -0.06905841827392578, -0.06331062316894531, -0.057562828063964844, -0.051815032958984375, -0.046067237854003906, -0.04031944274902344, -0.03457164764404297, -0.0288238525390625, -0.02307605743408203, -0.017328262329101562, -0.011580467224121094, -0.005832672119140625, -8.487701416015625e-05, 0.0056629180908203125, 0.011410713195800781, 0.01715850830078125, 0.02290630340576172, 0.028654098510742188, 0.034401893615722656, 0.040149688720703125, 0.045897483825683594, 0.05164527893066406, 0.05739307403564453, 0.063140869140625, 0.06888866424560547, 0.07463645935058594, 0.0803842544555664, 0.08613204956054688, 0.09187984466552734, 0.09762763977050781, 0.10337543487548828, 0.10912322998046875, 0.11487102508544922, 0.12061882019042969, 0.12636661529541016, 0.13211441040039062, 0.1378622055053711, 0.14361000061035156, 0.14935779571533203, 0.1551055908203125, 0.16085338592529297, 0.16660118103027344, 0.1723489761352539, 0.17809677124023438, 0.18384456634521484, 0.1895923614501953, 0.19534015655517578, 0.20108795166015625, 0.20683574676513672, 0.2125835418701172, 0.21833133697509766, 0.22407913208007812, 0.2298269271850586, 0.23557472229003906, 0.24132251739501953, 0.2470703125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 6.0, 7.0, 15.0, 15.0, 23.0, 35.0, 47.0, 77.0, 119.0, 246.0, 491.0, 1025.0, 2864.0, 9099.0, 40351.0, 322658.0, 584789.0, 66704.0, 13451.0, 3846.0, 1360.0, 594.0, 286.0, 143.0, 95.0, 66.0, 36.0, 29.0, 12.0, 16.0, 8.0, 6.0, 8.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.66015625, -0.639617919921875, -0.61907958984375, -0.598541259765625, -0.5780029296875, -0.557464599609375, -0.53692626953125, -0.516387939453125, -0.495849609375, -0.475311279296875, -0.45477294921875, -0.434234619140625, -0.4136962890625, -0.393157958984375, -0.37261962890625, -0.352081298828125, -0.33154296875, -0.311004638671875, -0.29046630859375, -0.269927978515625, -0.2493896484375, -0.228851318359375, -0.20831298828125, -0.187774658203125, -0.167236328125, -0.146697998046875, -0.12615966796875, -0.105621337890625, -0.0850830078125, -0.064544677734375, -0.04400634765625, -0.023468017578125, -0.0029296875, 0.017608642578125, 0.03814697265625, 0.058685302734375, 0.0792236328125, 0.099761962890625, 0.12030029296875, 0.140838623046875, 0.161376953125, 0.181915283203125, 0.20245361328125, 0.222991943359375, 0.2435302734375, 0.264068603515625, 0.28460693359375, 0.305145263671875, 0.32568359375, 0.346221923828125, 0.36676025390625, 0.387298583984375, 0.4078369140625, 0.428375244140625, 0.44891357421875, 0.469451904296875, 0.489990234375, 0.510528564453125, 0.53106689453125, 0.551605224609375, 0.5721435546875, 0.592681884765625, 0.61322021484375, 0.633758544921875, 0.654296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 10.0, 21.0, 11.0, 21.0, 24.0, 35.0, 43.0, 41.0, 53.0, 52.0, 62.0, 64.0, 62.0, 46.0, 71.0, 45.0, 54.0, 41.0, 53.0, 33.0, 26.0, 30.0, 16.0, 12.0, 10.0, 10.0, 10.0, 4.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.49951171875, -0.48384857177734375, -0.4681854248046875, -0.45252227783203125, -0.436859130859375, -0.42119598388671875, -0.4055328369140625, -0.38986968994140625, -0.37420654296875, -0.35854339599609375, -0.3428802490234375, -0.32721710205078125, -0.311553955078125, -0.29589080810546875, -0.2802276611328125, -0.26456451416015625, -0.2489013671875, -0.23323822021484375, -0.2175750732421875, -0.20191192626953125, -0.186248779296875, -0.17058563232421875, -0.1549224853515625, -0.13925933837890625, -0.12359619140625, -0.10793304443359375, -0.0922698974609375, -0.07660675048828125, -0.060943603515625, -0.04528045654296875, -0.0296173095703125, -0.01395416259765625, 0.001708984375, 0.01737213134765625, 0.0330352783203125, 0.04869842529296875, 0.064361572265625, 0.08002471923828125, 0.0956878662109375, 0.11135101318359375, 0.12701416015625, 0.14267730712890625, 0.1583404541015625, 0.17400360107421875, 0.189666748046875, 0.20532989501953125, 0.2209930419921875, 0.23665618896484375, 0.2523193359375, 0.26798248291015625, 0.2836456298828125, 0.29930877685546875, 0.314971923828125, 0.33063507080078125, 0.3462982177734375, 0.36196136474609375, 0.37762451171875, 0.39328765869140625, 0.4089508056640625, 0.42461395263671875, 0.440277099609375, 0.45594024658203125, 0.4716033935546875, 0.48726654052734375, 0.5029296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 2.0, 11.0, 12.0, 16.0, 28.0, 38.0, 47.0, 90.0, 169.0, 420.0, 1284.0, 5783.0, 92392.0, 909461.0, 33629.0, 3640.0, 890.0, 298.0, 117.0, 81.0, 40.0, 30.0, 25.0, 19.0, 8.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337646484375, -0.3265266418457031, -0.31540679931640625, -0.3042869567871094, -0.2931671142578125, -0.2820472717285156, -0.27092742919921875, -0.2598075866699219, -0.248687744140625, -0.23756790161132812, -0.22644805908203125, -0.21532821655273438, -0.2042083740234375, -0.19308853149414062, -0.18196868896484375, -0.17084884643554688, -0.15972900390625, -0.14860916137695312, -0.13748931884765625, -0.12636947631835938, -0.1152496337890625, -0.10412979125976562, -0.09300994873046875, -0.08189010620117188, -0.070770263671875, -0.059650421142578125, -0.04853057861328125, -0.037410736083984375, -0.0262908935546875, -0.015171051025390625, -0.00405120849609375, 0.007068634033203125, 0.0181884765625, 0.029308319091796875, 0.04042816162109375, 0.051548004150390625, 0.0626678466796875, 0.07378768920898438, 0.08490753173828125, 0.09602737426757812, 0.107147216796875, 0.11826705932617188, 0.12938690185546875, 0.14050674438476562, 0.1516265869140625, 0.16274642944335938, 0.17386627197265625, 0.18498611450195312, 0.19610595703125, 0.20722579956054688, 0.21834564208984375, 0.22946548461914062, 0.2405853271484375, 0.2517051696777344, 0.26282501220703125, 0.2739448547363281, 0.285064697265625, 0.2961845397949219, 0.30730438232421875, 0.3184242248535156, 0.3295440673828125, 0.3406639099121094, 0.35178375244140625, 0.3629035949707031, 0.3740234375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 11.0, 11.0, 9.0, 16.0, 17.0, 23.0, 29.0, 32.0, 42.0, 43.0, 63.0, 68.0, 65.0, 66.0, 77.0, 76.0, 61.0, 51.0, 35.0, 37.0, 39.0, 23.0, 18.0, 27.0, 8.0, 8.0, 7.0, 5.0, 3.0, 5.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4781951904296875e-05, -1.433398574590683e-05, -1.3886019587516785e-05, -1.343805342912674e-05, -1.2990087270736694e-05, -1.254212111234665e-05, -1.2094154953956604e-05, -1.1646188795566559e-05, -1.1198222637176514e-05, -1.0750256478786469e-05, -1.0302290320396423e-05, -9.854324162006378e-06, -9.406358003616333e-06, -8.958391845226288e-06, -8.510425686836243e-06, -8.062459528446198e-06, -7.614493370056152e-06, -7.166527211666107e-06, -6.718561053276062e-06, -6.270594894886017e-06, -5.822628736495972e-06, -5.3746625781059265e-06, -4.926696419715881e-06, -4.478730261325836e-06, -4.030764102935791e-06, -3.582797944545746e-06, -3.1348317861557007e-06, -2.6868656277656555e-06, -2.2388994693756104e-06, -1.7909333109855652e-06, -1.34296715259552e-06, -8.950009942054749e-07, -4.470348358154297e-07, 9.313225746154785e-10, 4.4889748096466064e-07, 8.968636393547058e-07, 1.344829797744751e-06, 1.7927959561347961e-06, 2.2407621145248413e-06, 2.6887282729148865e-06, 3.1366944313049316e-06, 3.584660589694977e-06, 4.032626748085022e-06, 4.480592906475067e-06, 4.928559064865112e-06, 5.3765252232551575e-06, 5.824491381645203e-06, 6.272457540035248e-06, 6.720423698425293e-06, 7.168389856815338e-06, 7.616356015205383e-06, 8.064322173595428e-06, 8.512288331985474e-06, 8.960254490375519e-06, 9.408220648765564e-06, 9.856186807155609e-06, 1.0304152965545654e-05, 1.07521191239357e-05, 1.1200085282325745e-05, 1.164805144071579e-05, 1.2096017599105835e-05, 1.254398375749588e-05, 1.2991949915885925e-05, 1.343991607427597e-05, 1.3887882232666016e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 8.0, 11.0, 8.0, 21.0, 28.0, 29.0, 80.0, 104.0, 192.0, 474.0, 1109.0, 3620.0, 17935.0, 297673.0, 682779.0, 36124.0, 5563.0, 1597.0, 590.0, 252.0, 134.0, 77.0, 43.0, 33.0, 20.0, 6.0, 4.0, 7.0, 5.0, 2.0, 7.0, 5.0, 2.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.228759765625, -0.2214183807373047, -0.21407699584960938, -0.20673561096191406, -0.19939422607421875, -0.19205284118652344, -0.18471145629882812, -0.1773700714111328, -0.1700286865234375, -0.1626873016357422, -0.15534591674804688, -0.14800453186035156, -0.14066314697265625, -0.13332176208496094, -0.12598037719726562, -0.11863899230957031, -0.111297607421875, -0.10395622253417969, -0.09661483764648438, -0.08927345275878906, -0.08193206787109375, -0.07459068298339844, -0.06724929809570312, -0.05990791320800781, -0.0525665283203125, -0.04522514343261719, -0.037883758544921875, -0.030542373657226562, -0.02320098876953125, -0.015859603881835938, -0.008518218994140625, -0.0011768341064453125, 0.00616455078125, 0.013505935668945312, 0.020847320556640625, 0.028188705444335938, 0.03553009033203125, 0.04287147521972656, 0.050212860107421875, 0.05755424499511719, 0.0648956298828125, 0.07223701477050781, 0.07957839965820312, 0.08691978454589844, 0.09426116943359375, 0.10160255432128906, 0.10894393920898438, 0.11628532409667969, 0.123626708984375, 0.1309680938720703, 0.13830947875976562, 0.14565086364746094, 0.15299224853515625, 0.16033363342285156, 0.16767501831054688, 0.1750164031982422, 0.1823577880859375, 0.1896991729736328, 0.19704055786132812, 0.20438194274902344, 0.21172332763671875, 0.21906471252441406, 0.22640609741210938, 0.2337474822998047, 0.2410888671875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 13.0, 10.0, 23.0, 18.0, 34.0, 56.0, 79.0, 96.0, 121.0, 148.0, 121.0, 80.0, 55.0, 38.0, 27.0, 25.0, 13.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.162841796875, -0.1579151153564453, -0.15298843383789062, -0.14806175231933594, -0.14313507080078125, -0.13820838928222656, -0.13328170776367188, -0.1283550262451172, -0.1234283447265625, -0.11850166320800781, -0.11357498168945312, -0.10864830017089844, -0.10372161865234375, -0.09879493713378906, -0.09386825561523438, -0.08894157409667969, -0.084014892578125, -0.07908821105957031, -0.07416152954101562, -0.06923484802246094, -0.06430816650390625, -0.05938148498535156, -0.054454803466796875, -0.04952812194824219, -0.0446014404296875, -0.03967475891113281, -0.034748077392578125, -0.029821395874023438, -0.02489471435546875, -0.019968032836914062, -0.015041351318359375, -0.010114669799804688, -0.00518798828125, -0.0002613067626953125, 0.004665374755859375, 0.009592056274414062, 0.01451873779296875, 0.019445419311523438, 0.024372100830078125, 0.029298782348632812, 0.0342254638671875, 0.03915214538574219, 0.044078826904296875, 0.04900550842285156, 0.05393218994140625, 0.05885887145996094, 0.06378555297851562, 0.06871223449707031, 0.073638916015625, 0.07856559753417969, 0.08349227905273438, 0.08841896057128906, 0.09334564208984375, 0.09827232360839844, 0.10319900512695312, 0.10812568664550781, 0.1130523681640625, 0.11797904968261719, 0.12290573120117188, 0.12783241271972656, 0.13275909423828125, 0.13768577575683594, 0.14261245727539062, 0.1475391387939453, 0.1524658203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 25.0, 58.0, 101.0, 244.0, 301.0, 134.0, 55.0, 30.0, 12.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.129291534423828, -1.997900366783142, -1.8665093183517456, -1.7351181507110596, -1.603727102279663, -1.472335934638977, -1.340944766998291, -1.2095537185668945, -1.0781625509262085, -0.9467714428901672, -0.815380334854126, -0.6839891672134399, -0.5525980591773987, -0.4212069511413574, -0.2898157835006714, -0.15842467546463013, -0.027033567428588867, 0.10435755550861359, 0.23574867844581604, 0.3671398162841797, 0.49853092432022095, 0.6299220323562622, 0.7613131999969482, 0.8927043080329895, 1.0240954160690308, 1.1554865837097168, 1.2868776321411133, 1.4182687997817993, 1.5496599674224854, 1.6810510158538818, 1.8124421834945679, 1.943833351135254, 2.0752243995666504, 2.206615447998047, 2.3380067348480225, 2.469397783279419, 2.6007888317108154, 2.732180118560791, 2.8635711669921875, 2.994962215423584, 3.1263532638549805, 3.257744312286377, 3.3891355991363525, 3.520526647567749, 3.6519176959991455, 3.783308982849121, 3.9147000312805176, 4.046091079711914, 4.177482604980469, 4.308873653411865, 4.440264701843262, 4.571656227111816, 4.703047275543213, 4.834438323974609, 4.965829372406006, 5.097220420837402, 5.228611469268799, 5.360002517700195, 5.491393566131592, 5.622784614562988, 5.754176139831543, 5.8855671882629395, 6.016958236694336, 6.148349285125732, 6.279740333557129]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 5.0, 7.0, 16.0, 22.0, 19.0, 26.0, 31.0, 24.0, 30.0, 45.0, 39.0, 49.0, 37.0, 65.0, 61.0, 48.0, 69.0, 59.0, 35.0, 40.0, 40.0, 33.0, 30.0, 29.0, 25.0, 18.0, 10.0, 11.0, 8.0, 11.0, 10.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2502613067626953, -2.168671131134033, -2.087080955505371, -2.005490779876709, -1.9239004850387573, -1.8423101902008057, -1.7607200145721436, -1.6791298389434814, -1.5975396633148193, -1.5159494876861572, -1.4343591928482056, -1.3527690172195435, -1.2711788415908813, -1.1895885467529297, -1.1079983711242676, -1.0264081954956055, -0.9448179006576538, -0.8632276654243469, -0.7816374897956848, -0.7000472545623779, -0.6184570789337158, -0.5368668437004089, -0.45527660846710205, -0.37368643283843994, -0.29209619760513306, -0.21050599217414856, -0.12891577184200287, -0.04732555150985718, 0.03426465392112732, 0.11585485935211182, 0.1974450945854187, 0.2790352702140808, 0.3606255054473877, 0.4422157108783722, 0.5238059163093567, 0.6053961515426636, 0.6869863271713257, 0.7685765624046326, 0.8501667976379395, 0.9317569732666016, 1.0133471488952637, 1.0949373245239258, 1.1765276193618774, 1.2581177949905396, 1.3397079706192017, 1.4212982654571533, 1.5028884410858154, 1.5844786167144775, 1.6660689115524292, 1.7476590871810913, 1.829249382019043, 1.910839557647705, 1.9924297332763672, 2.0740199089050293, 2.1556100845336914, 2.2372002601623535, 2.3187906742095947, 2.400380849838257, 2.481971025466919, 2.56356143951416, 2.6451516151428223, 2.7267417907714844, 2.8083319664001465, 2.8899221420288086, 2.9715123176574707]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 6.0, 9.0, 8.0, 5.0, 23.0, 9.0, 34.0, 66.0, 130.0, 204.0, 436.0, 827.0, 1890.0, 5315.0, 21035.0, 215583.0, 3864410.0, 66281.0, 11279.0, 3431.0, 1450.0, 684.0, 390.0, 215.0, 157.0, 115.0, 60.0, 59.0, 42.0, 31.0, 27.0, 14.0, 7.0, 8.0, 8.0, 9.0, 1.0, 9.0, 4.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5846328735351562, -0.5584259033203125, -0.5322189331054688, -0.506011962890625, -0.47980499267578125, -0.4535980224609375, -0.42739105224609375, -0.40118408203125, -0.37497711181640625, -0.3487701416015625, -0.32256317138671875, -0.296356201171875, -0.27014923095703125, -0.2439422607421875, -0.21773529052734375, -0.1915283203125, -0.16532135009765625, -0.1391143798828125, -0.11290740966796875, -0.086700439453125, -0.06049346923828125, -0.0342864990234375, -0.00807952880859375, 0.01812744140625, 0.04433441162109375, 0.0705413818359375, 0.09674835205078125, 0.122955322265625, 0.14916229248046875, 0.1753692626953125, 0.20157623291015625, 0.227783203125, 0.25399017333984375, 0.2801971435546875, 0.30640411376953125, 0.332611083984375, 0.35881805419921875, 0.3850250244140625, 0.41123199462890625, 0.43743896484375, 0.46364593505859375, 0.4898529052734375, 0.5160598754882812, 0.542266845703125, 0.5684738159179688, 0.5946807861328125, 0.6208877563476562, 0.6470947265625, 0.6733016967773438, 0.6995086669921875, 0.7257156372070312, 0.751922607421875, 0.7781295776367188, 0.8043365478515625, 0.8305435180664062, 0.85675048828125, 0.8829574584960938, 0.9091644287109375, 0.9353713989257812, 0.961578369140625, 0.9877853393554688, 1.0139923095703125, 1.0401992797851562, 1.06640625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 13.0, 12.0, 34.0, 29.0, 49.0, 63.0, 59.0, 91.0, 96.0, 86.0, 99.0, 87.0, 69.0, 65.0, 44.0, 37.0, 26.0, 12.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.12211418151855469, -0.11617660522460938, -0.11023902893066406, -0.10430145263671875, -0.09836387634277344, -0.09242630004882812, -0.08648872375488281, -0.0805511474609375, -0.07461357116699219, -0.06867599487304688, -0.06273841857910156, -0.05680084228515625, -0.05086326599121094, -0.044925689697265625, -0.03898811340332031, -0.033050537109375, -0.027112960815429688, -0.021175384521484375, -0.015237808227539062, -0.00930023193359375, -0.0033626556396484375, 0.002574920654296875, 0.008512496948242188, 0.0144500732421875, 0.020387649536132812, 0.026325225830078125, 0.03226280212402344, 0.03820037841796875, 0.04413795471191406, 0.050075531005859375, 0.05601310729980469, 0.06195068359375, 0.06788825988769531, 0.07382583618164062, 0.07976341247558594, 0.08570098876953125, 0.09163856506347656, 0.09757614135742188, 0.10351371765136719, 0.1094512939453125, 0.11538887023925781, 0.12132644653320312, 0.12726402282714844, 0.13320159912109375, 0.13913917541503906, 0.14507675170898438, 0.1510143280029297, 0.156951904296875, 0.1628894805908203, 0.16882705688476562, 0.17476463317871094, 0.18070220947265625, 0.18663978576660156, 0.19257736206054688, 0.1985149383544922, 0.2044525146484375, 0.2103900909423828, 0.21632766723632812, 0.22226524353027344, 0.22820281982421875, 0.23414039611816406, 0.24007797241210938, 0.2460155487060547, 0.251953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 6.0, 5.0, 9.0, 15.0, 18.0, 20.0, 21.0, 20.0, 47.0, 56.0, 76.0, 96.0, 183.0, 355.0, 1676.0, 3465489.0, 723890.0, 1417.0, 319.0, 174.0, 107.0, 76.0, 52.0, 44.0, 22.0, 21.0, 8.0, 9.0, 12.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.244140625, -3.156402587890625, -3.06866455078125, -2.980926513671875, -2.8931884765625, -2.805450439453125, -2.71771240234375, -2.629974365234375, -2.542236328125, -2.454498291015625, -2.36676025390625, -2.279022216796875, -2.1912841796875, -2.103546142578125, -2.01580810546875, -1.928070068359375, -1.84033203125, -1.752593994140625, -1.66485595703125, -1.577117919921875, -1.4893798828125, -1.401641845703125, -1.31390380859375, -1.226165771484375, -1.138427734375, -1.050689697265625, -0.96295166015625, -0.875213623046875, -0.7874755859375, -0.699737548828125, -0.61199951171875, -0.524261474609375, -0.4365234375, -0.348785400390625, -0.26104736328125, -0.173309326171875, -0.0855712890625, 0.002166748046875, 0.08990478515625, 0.177642822265625, 0.265380859375, 0.353118896484375, 0.44085693359375, 0.528594970703125, 0.6163330078125, 0.704071044921875, 0.79180908203125, 0.879547119140625, 0.96728515625, 1.055023193359375, 1.14276123046875, 1.230499267578125, 1.3182373046875, 1.405975341796875, 1.49371337890625, 1.581451416015625, 1.669189453125, 1.756927490234375, 1.84466552734375, 1.932403564453125, 2.0201416015625, 2.107879638671875, 2.19561767578125, 2.283355712890625, 2.37109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 16.0, 44.0, 151.0, 3057.0, 671.0, 92.0, 31.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64306640625, -0.6273002624511719, -0.6115341186523438, -0.5957679748535156, -0.5800018310546875, -0.5642356872558594, -0.5484695434570312, -0.5327033996582031, -0.516937255859375, -0.5011711120605469, -0.48540496826171875, -0.4696388244628906, -0.4538726806640625, -0.4381065368652344, -0.42234039306640625, -0.4065742492675781, -0.39080810546875, -0.3750419616699219, -0.35927581787109375, -0.3435096740722656, -0.3277435302734375, -0.3119773864746094, -0.29621124267578125, -0.2804450988769531, -0.264678955078125, -0.24891281127929688, -0.23314666748046875, -0.21738052368164062, -0.2016143798828125, -0.18584823608398438, -0.17008209228515625, -0.15431594848632812, -0.1385498046875, -0.12278366088867188, -0.10701751708984375, -0.09125137329101562, -0.0754852294921875, -0.059719085693359375, -0.04395294189453125, -0.028186798095703125, -0.012420654296875, 0.003345489501953125, 0.01911163330078125, 0.034877777099609375, 0.0506439208984375, 0.06641006469726562, 0.08217620849609375, 0.09794235229492188, 0.11370849609375, 0.12947463989257812, 0.14524078369140625, 0.16100692749023438, 0.1767730712890625, 0.19253921508789062, 0.20830535888671875, 0.22407150268554688, 0.239837646484375, 0.2556037902832031, 0.27136993408203125, 0.2871360778808594, 0.3029022216796875, 0.3186683654785156, 0.33443450927734375, 0.3502006530761719, 0.365966796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 51.0, 877.0, 69.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.579231262207031, -9.342940330505371, -9.106649398803711, -8.870357513427734, -8.634066581726074, -8.397775650024414, -8.161483764648438, -7.925192832946777, -7.688901901245117, -7.452610969543457, -7.216319561004639, -6.98002815246582, -6.74373722076416, -6.5074462890625, -6.271154880523682, -6.034863471984863, -5.798572540283203, -5.562281608581543, -5.325990200042725, -5.089698791503906, -4.853407859802246, -4.617116928100586, -4.380825519561768, -4.144534111022949, -3.908243179321289, -3.67195200920105, -3.4356608390808105, -3.1993696689605713, -2.963078498840332, -2.7267873287200928, -2.4904961585998535, -2.2542049884796143, -2.017913818359375, -1.7816226482391357, -1.5453314781188965, -1.3090403079986572, -1.072749137878418, -0.8364579677581787, -0.6001667976379395, -0.3638756275177002, -0.12758445739746094, 0.10870671272277832, 0.3449978828430176, 0.5812890529632568, 0.8175802230834961, 1.0538713932037354, 1.2901625633239746, 1.5264537334442139, 1.7627449035644531, 1.9990360736846924, 2.2353272438049316, 2.471618413925171, 2.70790958404541, 2.9442007541656494, 3.1804919242858887, 3.416783094406128, 3.653074264526367, 3.8893654346466064, 4.125656604766846, 4.361948013305664, 4.598238945007324, 4.834529876708984, 5.070821285247803, 5.307112693786621, 5.543403625488281]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 11.0, 16.0, 22.0, 31.0, 42.0, 67.0, 77.0, 72.0, 80.0, 80.0, 87.0, 79.0, 77.0, 69.0, 54.0, 36.0, 38.0, 27.0, 16.0, 9.0, 9.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7951920628547668, -0.7656492590904236, -0.7361063957214355, -0.7065635919570923, -0.677020788192749, -0.6474779844284058, -0.6179351806640625, -0.5883923172950745, -0.5588495135307312, -0.5293067097663879, -0.4997638761997223, -0.47022104263305664, -0.4406782388687134, -0.4111354351043701, -0.38159260153770447, -0.3520497679710388, -0.32250696420669556, -0.2929641604423523, -0.26342132687568665, -0.2338785082101822, -0.20433568954467773, -0.17479287087917328, -0.14525005221366882, -0.11570723354816437, -0.08616441488265991, -0.05662159621715546, -0.027078777551651, 0.0024640411138534546, 0.03200685977935791, 0.061549678444862366, 0.09109249711036682, 0.12063531577587128, 0.1501781940460205, 0.17972101271152496, 0.20926383137702942, 0.23880665004253387, 0.26834946870803833, 0.2978922724723816, 0.32743510603904724, 0.3569779396057129, 0.38652074337005615, 0.4160635471343994, 0.44560638070106506, 0.4751492142677307, 0.504692018032074, 0.5342348217964172, 0.5637776851654053, 0.5933204889297485, 0.6228632926940918, 0.6524060964584351, 0.6819489002227783, 0.7114917635917664, 0.7410345673561096, 0.7705773711204529, 0.8001202344894409, 0.8296630382537842, 0.8592058420181274, 0.8887486457824707, 0.918291449546814, 0.947834312915802, 0.9773771166801453, 1.0069199800491333, 1.0364627838134766, 1.0660055875778198, 1.095548391342163]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 16.0, 15.0, 18.0, 37.0, 36.0, 42.0, 65.0, 89.0, 149.0, 238.0, 390.0, 655.0, 1145.0, 2503.0, 7058.0, 23284.0, 100318.0, 575891.0, 268951.0, 46848.0, 12754.0, 4262.0, 1685.0, 801.0, 487.0, 279.0, 173.0, 102.0, 92.0, 39.0, 35.0, 28.0, 20.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.472900390625, -0.4545402526855469, -0.43618011474609375, -0.4178199768066406, -0.3994598388671875, -0.3810997009277344, -0.36273956298828125, -0.3443794250488281, -0.326019287109375, -0.3076591491699219, -0.28929901123046875, -0.2709388732910156, -0.2525787353515625, -0.23421859741210938, -0.21585845947265625, -0.19749832153320312, -0.17913818359375, -0.16077804565429688, -0.14241790771484375, -0.12405776977539062, -0.1056976318359375, -0.08733749389648438, -0.06897735595703125, -0.050617218017578125, -0.032257080078125, -0.013896942138671875, 0.00446319580078125, 0.022823333740234375, 0.0411834716796875, 0.059543609619140625, 0.07790374755859375, 0.09626388549804688, 0.1146240234375, 0.13298416137695312, 0.15134429931640625, 0.16970443725585938, 0.1880645751953125, 0.20642471313476562, 0.22478485107421875, 0.24314498901367188, 0.261505126953125, 0.2798652648925781, 0.29822540283203125, 0.3165855407714844, 0.3349456787109375, 0.3533058166503906, 0.37166595458984375, 0.3900260925292969, 0.40838623046875, 0.4267463684082031, 0.44510650634765625, 0.4634666442871094, 0.4818267822265625, 0.5001869201660156, 0.5185470581054688, 0.5369071960449219, 0.555267333984375, 0.5736274719238281, 0.5919876098632812, 0.6103477478027344, 0.6287078857421875, 0.6470680236816406, 0.6654281616210938, 0.6837882995605469, 0.7021484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 8.0, 6.0, 13.0, 27.0, 22.0, 25.0, 50.0, 57.0, 54.0, 60.0, 82.0, 85.0, 92.0, 80.0, 65.0, 55.0, 55.0, 45.0, 28.0, 32.0, 25.0, 5.0, 16.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10821533203125, -0.10307979583740234, -0.09794425964355469, -0.09280872344970703, -0.08767318725585938, -0.08253765106201172, -0.07740211486816406, -0.0722665786743164, -0.06713104248046875, -0.061995506286621094, -0.05685997009277344, -0.05172443389892578, -0.046588897705078125, -0.04145336151123047, -0.03631782531738281, -0.031182289123535156, -0.0260467529296875, -0.020911216735839844, -0.015775680541992188, -0.010640144348144531, -0.005504608154296875, -0.00036907196044921875, 0.0047664642333984375, 0.009902000427246094, 0.01503753662109375, 0.020173072814941406, 0.025308609008789062, 0.03044414520263672, 0.035579681396484375, 0.04071521759033203, 0.04585075378417969, 0.050986289978027344, 0.056121826171875, 0.061257362365722656, 0.06639289855957031, 0.07152843475341797, 0.07666397094726562, 0.08179950714111328, 0.08693504333496094, 0.0920705795288086, 0.09720611572265625, 0.1023416519165039, 0.10747718811035156, 0.11261272430419922, 0.11774826049804688, 0.12288379669189453, 0.1280193328857422, 0.13315486907958984, 0.1382904052734375, 0.14342594146728516, 0.1485614776611328, 0.15369701385498047, 0.15883255004882812, 0.16396808624267578, 0.16910362243652344, 0.1742391586303711, 0.17937469482421875, 0.1845102310180664, 0.18964576721191406, 0.19478130340576172, 0.19991683959960938, 0.20505237579345703, 0.2101879119873047, 0.21532344818115234, 0.220458984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 6.0, 14.0, 17.0, 22.0, 29.0, 56.0, 80.0, 107.0, 237.0, 431.0, 982.0, 2425.0, 7258.0, 28649.0, 207456.0, 686674.0, 89642.0, 16478.0, 4666.0, 1689.0, 760.0, 352.0, 188.0, 109.0, 64.0, 35.0, 29.0, 25.0, 14.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67333984375, -0.6495590209960938, -0.6257781982421875, -0.6019973754882812, -0.578216552734375, -0.5544357299804688, -0.5306549072265625, -0.5068740844726562, -0.48309326171875, -0.45931243896484375, -0.4355316162109375, -0.41175079345703125, -0.387969970703125, -0.36418914794921875, -0.3404083251953125, -0.31662750244140625, -0.2928466796875, -0.26906585693359375, -0.2452850341796875, -0.22150421142578125, -0.197723388671875, -0.17394256591796875, -0.1501617431640625, -0.12638092041015625, -0.10260009765625, -0.07881927490234375, -0.0550384521484375, -0.03125762939453125, -0.007476806640625, 0.01630401611328125, 0.0400848388671875, 0.06386566162109375, 0.087646484375, 0.11142730712890625, 0.1352081298828125, 0.15898895263671875, 0.182769775390625, 0.20655059814453125, 0.2303314208984375, 0.25411224365234375, 0.27789306640625, 0.30167388916015625, 0.3254547119140625, 0.34923553466796875, 0.373016357421875, 0.39679718017578125, 0.4205780029296875, 0.44435882568359375, 0.4681396484375, 0.49192047119140625, 0.5157012939453125, 0.5394821166992188, 0.563262939453125, 0.5870437622070312, 0.6108245849609375, 0.6346054077148438, 0.65838623046875, 0.6821670532226562, 0.7059478759765625, 0.7297286987304688, 0.753509521484375, 0.7772903442382812, 0.8010711669921875, 0.8248519897460938, 0.8486328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 9.0, 8.0, 15.0, 14.0, 19.0, 31.0, 30.0, 43.0, 49.0, 49.0, 55.0, 59.0, 78.0, 76.0, 60.0, 75.0, 51.0, 55.0, 43.0, 31.0, 22.0, 27.0, 16.0, 17.0, 9.0, 9.0, 4.0, 10.0, 6.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.57421875, -0.5531234741210938, -0.5320281982421875, -0.5109329223632812, -0.489837646484375, -0.46874237060546875, -0.4476470947265625, -0.42655181884765625, -0.40545654296875, -0.38436126708984375, -0.3632659912109375, -0.34217071533203125, -0.321075439453125, -0.29998016357421875, -0.2788848876953125, -0.25778961181640625, -0.2366943359375, -0.21559906005859375, -0.1945037841796875, -0.17340850830078125, -0.152313232421875, -0.13121795654296875, -0.1101226806640625, -0.08902740478515625, -0.06793212890625, -0.04683685302734375, -0.0257415771484375, -0.00464630126953125, 0.016448974609375, 0.03754425048828125, 0.0586395263671875, 0.07973480224609375, 0.100830078125, 0.12192535400390625, 0.1430206298828125, 0.16411590576171875, 0.185211181640625, 0.20630645751953125, 0.2274017333984375, 0.24849700927734375, 0.26959228515625, 0.29068756103515625, 0.3117828369140625, 0.33287811279296875, 0.353973388671875, 0.37506866455078125, 0.3961639404296875, 0.41725921630859375, 0.4383544921875, 0.45944976806640625, 0.4805450439453125, 0.5016403198242188, 0.522735595703125, 0.5438308715820312, 0.5649261474609375, 0.5860214233398438, 0.60711669921875, 0.6282119750976562, 0.6493072509765625, 0.6704025268554688, 0.691497802734375, 0.7125930786132812, 0.7336883544921875, 0.7547836303710938, 0.77587890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 11.0, 9.0, 23.0, 33.0, 60.0, 104.0, 154.0, 311.0, 792.0, 2363.0, 12536.0, 424421.0, 588699.0, 14799.0, 2571.0, 818.0, 383.0, 168.0, 109.0, 60.0, 39.0, 21.0, 17.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.398193359375, -0.3853645324707031, -0.37253570556640625, -0.3597068786621094, -0.3468780517578125, -0.3340492248535156, -0.32122039794921875, -0.3083915710449219, -0.295562744140625, -0.2827339172363281, -0.26990509033203125, -0.2570762634277344, -0.2442474365234375, -0.23141860961914062, -0.21858978271484375, -0.20576095581054688, -0.19293212890625, -0.18010330200195312, -0.16727447509765625, -0.15444564819335938, -0.1416168212890625, -0.12878799438476562, -0.11595916748046875, -0.10313034057617188, -0.090301513671875, -0.07747268676757812, -0.06464385986328125, -0.051815032958984375, -0.0389862060546875, -0.026157379150390625, -0.01332855224609375, -0.000499725341796875, 0.0123291015625, 0.025157928466796875, 0.03798675537109375, 0.050815582275390625, 0.0636444091796875, 0.07647323608398438, 0.08930206298828125, 0.10213088989257812, 0.114959716796875, 0.12778854370117188, 0.14061737060546875, 0.15344619750976562, 0.1662750244140625, 0.17910385131835938, 0.19193267822265625, 0.20476150512695312, 0.21759033203125, 0.23041915893554688, 0.24324798583984375, 0.2560768127441406, 0.2689056396484375, 0.2817344665527344, 0.29456329345703125, 0.3073921203613281, 0.320220947265625, 0.3330497741699219, 0.34587860107421875, 0.3587074279785156, 0.3715362548828125, 0.3843650817871094, 0.39719390869140625, 0.4100227355957031, 0.4228515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 12.0, 14.0, 15.0, 30.0, 44.0, 73.0, 121.0, 157.0, 150.0, 111.0, 92.0, 72.0, 43.0, 24.0, 14.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.89354133605957e-05, -4.780478775501251e-05, -4.667416214942932e-05, -4.554353654384613e-05, -4.441291093826294e-05, -4.328228533267975e-05, -4.215165972709656e-05, -4.102103412151337e-05, -3.9890408515930176e-05, -3.8759782910346985e-05, -3.7629157304763794e-05, -3.64985316991806e-05, -3.536790609359741e-05, -3.423728048801422e-05, -3.310665488243103e-05, -3.197602927684784e-05, -3.084540367126465e-05, -2.9714778065681458e-05, -2.8584152460098267e-05, -2.7453526854515076e-05, -2.6322901248931885e-05, -2.5192275643348694e-05, -2.4061650037765503e-05, -2.2931024432182312e-05, -2.180039882659912e-05, -2.066977322101593e-05, -1.953914761543274e-05, -1.840852200984955e-05, -1.7277896404266357e-05, -1.6147270798683167e-05, -1.5016645193099976e-05, -1.3886019587516785e-05, -1.2755393981933594e-05, -1.1624768376350403e-05, -1.0494142770767212e-05, -9.363517165184021e-06, -8.23289155960083e-06, -7.102265954017639e-06, -5.971640348434448e-06, -4.841014742851257e-06, -3.7103891372680664e-06, -2.5797635316848755e-06, -1.4491379261016846e-06, -3.1851232051849365e-07, 8.121132850646973e-07, 1.942738890647888e-06, 3.073364496231079e-06, 4.20399010181427e-06, 5.334615707397461e-06, 6.465241312980652e-06, 7.595866918563843e-06, 8.726492524147034e-06, 9.857118129730225e-06, 1.0987743735313416e-05, 1.2118369340896606e-05, 1.3248994946479797e-05, 1.4379620552062988e-05, 1.551024615764618e-05, 1.664087176322937e-05, 1.777149736881256e-05, 1.8902122974395752e-05, 2.0032748579978943e-05, 2.1163374185562134e-05, 2.2293999791145325e-05, 2.3424625396728516e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 15.0, 20.0, 18.0, 42.0, 73.0, 129.0, 311.0, 815.0, 3148.0, 28623.0, 914507.0, 93365.0, 5518.0, 1178.0, 412.0, 179.0, 77.0, 42.0, 24.0, 16.0, 15.0, 5.0, 7.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.484130859375, -0.471923828125, -0.459716796875, -0.447509765625, -0.435302734375, -0.423095703125, -0.410888671875, -0.398681640625, -0.386474609375, -0.374267578125, -0.362060546875, -0.349853515625, -0.337646484375, -0.325439453125, -0.313232421875, -0.301025390625, -0.288818359375, -0.276611328125, -0.264404296875, -0.252197265625, -0.239990234375, -0.227783203125, -0.215576171875, -0.203369140625, -0.191162109375, -0.178955078125, -0.166748046875, -0.154541015625, -0.142333984375, -0.130126953125, -0.117919921875, -0.105712890625, -0.093505859375, -0.081298828125, -0.069091796875, -0.056884765625, -0.044677734375, -0.032470703125, -0.020263671875, -0.008056640625, 0.004150390625, 0.016357421875, 0.028564453125, 0.040771484375, 0.052978515625, 0.065185546875, 0.077392578125, 0.089599609375, 0.101806640625, 0.114013671875, 0.126220703125, 0.138427734375, 0.150634765625, 0.162841796875, 0.175048828125, 0.187255859375, 0.199462890625, 0.211669921875, 0.223876953125, 0.236083984375, 0.248291015625, 0.260498046875, 0.272705078125, 0.284912109375, 0.297119140625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 12.0, 13.0, 27.0, 34.0, 55.0, 116.0, 193.0, 206.0, 145.0, 89.0, 46.0, 23.0, 9.0, 8.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.413818359375, -0.4048786163330078, -0.3959388732910156, -0.38699913024902344, -0.37805938720703125, -0.36911964416503906, -0.3601799011230469, -0.3512401580810547, -0.3423004150390625, -0.3333606719970703, -0.3244209289550781, -0.31548118591308594, -0.30654144287109375, -0.29760169982910156, -0.2886619567871094, -0.2797222137451172, -0.270782470703125, -0.2618427276611328, -0.2529029846191406, -0.24396324157714844, -0.23502349853515625, -0.22608375549316406, -0.21714401245117188, -0.2082042694091797, -0.1992645263671875, -0.1903247833251953, -0.18138504028320312, -0.17244529724121094, -0.16350555419921875, -0.15456581115722656, -0.14562606811523438, -0.1366863250732422, -0.12774658203125, -0.11880683898925781, -0.10986709594726562, -0.10092735290527344, -0.09198760986328125, -0.08304786682128906, -0.07410812377929688, -0.06516838073730469, -0.0562286376953125, -0.04728889465332031, -0.038349151611328125, -0.029409408569335938, -0.02046966552734375, -0.011529922485351562, -0.002590179443359375, 0.0063495635986328125, 0.015289306640625, 0.024229049682617188, 0.033168792724609375, 0.04210853576660156, 0.05104827880859375, 0.05998802185058594, 0.06892776489257812, 0.07786750793457031, 0.0868072509765625, 0.09574699401855469, 0.10468673706054688, 0.11362648010253906, 0.12256622314453125, 0.13150596618652344, 0.14044570922851562, 0.1493854522705078, 0.1583251953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 17.0, 47.0, 176.0, 471.0, 203.0, 56.0, 17.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7482404708862305, -3.4502804279327393, -3.152320384979248, -2.854360342025757, -2.5564002990722656, -2.2584402561187744, -1.9604802131652832, -1.662520170211792, -1.3645601272583008, -1.0666000843048096, -0.7686400413513184, -0.47067999839782715, -0.17271995544433594, 0.12524008750915527, 0.4232001304626465, 0.7211601734161377, 1.019120216369629, 1.3170802593231201, 1.6150403022766113, 1.9130003452301025, 2.2109603881835938, 2.508920431137085, 2.806880474090576, 3.1048405170440674, 3.4028005599975586, 3.70076060295105, 3.998720645904541, 4.296680450439453, 4.594640731811523, 4.892601013183594, 5.190560817718506, 5.488520622253418, 5.786481857299805, 6.084442138671875, 6.382401943206787, 6.680361747741699, 6.9783220291137695, 7.27628231048584, 7.574242115020752, 7.872201919555664, 8.170162200927734, 8.468122482299805, 8.766082763671875, 9.064042091369629, 9.3620023727417, 9.65996265411377, 9.957921981811523, 10.255882263183594, 10.553842544555664, 10.851802825927734, 11.149763107299805, 11.447722434997559, 11.745682716369629, 12.0436429977417, 12.341602325439453, 12.639562606811523, 12.937522888183594, 13.235483169555664, 13.533443450927734, 13.831402778625488, 14.129363059997559, 14.427323341369629, 14.725282669067383, 15.023242950439453, 15.321203231811523]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 7.0, 10.0, 13.0, 6.0, 11.0, 10.0, 24.0, 22.0, 26.0, 23.0, 31.0, 27.0, 37.0, 45.0, 54.0, 44.0, 47.0, 53.0, 47.0, 52.0, 53.0, 54.0, 41.0, 29.0, 41.0, 26.0, 31.0, 24.0, 12.0, 14.0, 19.0, 13.0, 5.0, 8.0, 6.0, 8.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0459728240966797, -2.943551778793335, -2.8411309719085693, -2.7387099266052246, -2.636289119720459, -2.5338680744171143, -2.4314470291137695, -2.329026222229004, -2.226605176925659, -2.1241841316223145, -2.021763324737549, -1.919342279434204, -1.816921353340149, -1.7145004272460938, -1.6120795011520386, -1.5096585750579834, -1.4072376489639282, -1.304816722869873, -1.2023957967758179, -1.0999748706817627, -0.997553825378418, -0.8951328992843628, -0.7927119731903076, -0.6902909874916077, -0.5878700613975525, -0.4854491055011749, -0.38302814960479736, -0.2806072235107422, -0.17818626761436462, -0.07576531171798706, 0.026655614376068115, 0.12907660007476807, 0.23149752616882324, 0.3339184820652008, 0.43633943796157837, 0.5387603640556335, 0.6411813497543335, 0.7436022758483887, 0.8460232019424438, 0.9484441876411438, 1.0508651733398438, 1.153286099433899, 1.255707025527954, 1.3581280708312988, 1.460548996925354, 1.5629699230194092, 1.6653908491134644, 1.7678117752075195, 1.8702327013015747, 1.9726536273956299, 2.0750746726989746, 2.1774954795837402, 2.279916524887085, 2.3823375701904297, 2.4847583770751953, 2.58717942237854, 2.6896002292633057, 2.7920212745666504, 2.894442081451416, 2.9968631267547607, 3.0992839336395264, 3.201704978942871, 3.3041257858276367, 3.4065468311309814, 3.508967876434326]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 14.0, 11.0, 28.0, 38.0, 60.0, 89.0, 152.0, 271.0, 512.0, 956.0, 2053.0, 4815.0, 14754.0, 74741.0, 3726191.0, 325265.0, 29724.0, 8209.0, 3077.0, 1470.0, 754.0, 416.0, 208.0, 139.0, 101.0, 60.0, 44.0, 29.0, 26.0, 18.0, 10.0, 5.0, 6.0, 7.0, 1.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6582183837890625, -0.627960205078125, -0.5977020263671875, -0.56744384765625, -0.5371856689453125, -0.506927490234375, -0.4766693115234375, -0.4464111328125, -0.4161529541015625, -0.385894775390625, -0.3556365966796875, -0.32537841796875, -0.2951202392578125, -0.264862060546875, -0.2346038818359375, -0.204345703125, -0.1740875244140625, -0.143829345703125, -0.1135711669921875, -0.08331298828125, -0.0530548095703125, -0.022796630859375, 0.0074615478515625, 0.0377197265625, 0.0679779052734375, 0.098236083984375, 0.1284942626953125, 0.15875244140625, 0.1890106201171875, 0.219268798828125, 0.2495269775390625, 0.27978515625, 0.3100433349609375, 0.340301513671875, 0.3705596923828125, 0.40081787109375, 0.4310760498046875, 0.461334228515625, 0.4915924072265625, 0.5218505859375, 0.5521087646484375, 0.582366943359375, 0.6126251220703125, 0.64288330078125, 0.6731414794921875, 0.703399658203125, 0.7336578369140625, 0.763916015625, 0.7941741943359375, 0.824432373046875, 0.8546905517578125, 0.88494873046875, 0.9152069091796875, 0.945465087890625, 0.9757232666015625, 1.0059814453125, 1.0362396240234375, 1.066497802734375, 1.0967559814453125, 1.12701416015625, 1.1572723388671875, 1.187530517578125, 1.2177886962890625, 1.248046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 13.0, 11.0, 23.0, 21.0, 24.0, 45.0, 53.0, 61.0, 53.0, 80.0, 88.0, 75.0, 84.0, 62.0, 56.0, 50.0, 44.0, 44.0, 30.0, 28.0, 19.0, 8.0, 7.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11968994140625, -0.11406803131103516, -0.10844612121582031, -0.10282421112060547, -0.09720230102539062, -0.09158039093017578, -0.08595848083496094, -0.0803365707397461, -0.07471466064453125, -0.0690927505493164, -0.06347084045410156, -0.05784893035888672, -0.052227020263671875, -0.04660511016845703, -0.04098320007324219, -0.035361289978027344, -0.0297393798828125, -0.024117469787597656, -0.018495559692382812, -0.012873649597167969, -0.007251739501953125, -0.0016298294067382812, 0.0039920806884765625, 0.009613990783691406, 0.01523590087890625, 0.020857810974121094, 0.026479721069335938, 0.03210163116455078, 0.037723541259765625, 0.04334545135498047, 0.04896736145019531, 0.054589271545410156, 0.060211181640625, 0.06583309173583984, 0.07145500183105469, 0.07707691192626953, 0.08269882202148438, 0.08832073211669922, 0.09394264221191406, 0.0995645523071289, 0.10518646240234375, 0.1108083724975586, 0.11643028259277344, 0.12205219268798828, 0.12767410278320312, 0.13329601287841797, 0.1389179229736328, 0.14453983306884766, 0.1501617431640625, 0.15578365325927734, 0.1614055633544922, 0.16702747344970703, 0.17264938354492188, 0.17827129364013672, 0.18389320373535156, 0.1895151138305664, 0.19513702392578125, 0.2007589340209961, 0.20638084411621094, 0.21200275421142578, 0.21762466430664062, 0.22324657440185547, 0.2288684844970703, 0.23449039459228516, 0.2401123046875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 6.0, 15.0, 28.0, 19.0, 45.0, 91.0, 232.0, 569.0, 2152.0, 15763.0, 4073019.0, 94952.0, 5309.0, 1204.0, 423.0, 175.0, 85.0, 62.0, 47.0, 31.0, 17.0, 10.0, 8.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.30859375, -1.242279052734375, -1.17596435546875, -1.109649658203125, -1.0433349609375, -0.977020263671875, -0.91070556640625, -0.844390869140625, -0.778076171875, -0.711761474609375, -0.64544677734375, -0.579132080078125, -0.5128173828125, -0.446502685546875, -0.38018798828125, -0.313873291015625, -0.24755859375, -0.181243896484375, -0.11492919921875, -0.048614501953125, 0.0177001953125, 0.084014892578125, 0.15032958984375, 0.216644287109375, 0.282958984375, 0.349273681640625, 0.41558837890625, 0.481903076171875, 0.5482177734375, 0.614532470703125, 0.68084716796875, 0.747161865234375, 0.8134765625, 0.879791259765625, 0.94610595703125, 1.012420654296875, 1.0787353515625, 1.145050048828125, 1.21136474609375, 1.277679443359375, 1.343994140625, 1.410308837890625, 1.47662353515625, 1.542938232421875, 1.6092529296875, 1.675567626953125, 1.74188232421875, 1.808197021484375, 1.87451171875, 1.940826416015625, 2.00714111328125, 2.073455810546875, 2.1397705078125, 2.206085205078125, 2.27239990234375, 2.338714599609375, 2.405029296875, 2.471343994140625, 2.53765869140625, 2.603973388671875, 2.6702880859375, 2.736602783203125, 2.80291748046875, 2.869232177734375, 2.935546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 17.0, 27.0, 79.0, 230.0, 2730.0, 723.0, 126.0, 58.0, 21.0, 15.0, 12.0, 10.0, 7.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.27716064453125, -0.2554931640625, -0.23382568359375, -0.212158203125, -0.19049072265625, -0.1688232421875, -0.14715576171875, -0.12548828125, -0.10382080078125, -0.0821533203125, -0.06048583984375, -0.038818359375, -0.01715087890625, 0.0045166015625, 0.02618408203125, 0.0478515625, 0.06951904296875, 0.0911865234375, 0.11285400390625, 0.134521484375, 0.15618896484375, 0.1778564453125, 0.19952392578125, 0.22119140625, 0.24285888671875, 0.2645263671875, 0.28619384765625, 0.307861328125, 0.32952880859375, 0.3511962890625, 0.37286376953125, 0.39453125, 0.41619873046875, 0.4378662109375, 0.45953369140625, 0.481201171875, 0.50286865234375, 0.5245361328125, 0.54620361328125, 0.56787109375, 0.58953857421875, 0.6112060546875, 0.63287353515625, 0.654541015625, 0.67620849609375, 0.6978759765625, 0.71954345703125, 0.7412109375, 0.76287841796875, 0.7845458984375, 0.80621337890625, 0.827880859375, 0.84954833984375, 0.8712158203125, 0.89288330078125, 0.91455078125, 0.93621826171875, 0.9578857421875, 0.97955322265625, 1.001220703125, 1.02288818359375, 1.0445556640625, 1.06622314453125, 1.087890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 37.0, 74.0, 187.0, 335.0, 206.0, 79.0, 38.0, 16.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.143627882003784, -2.0527660846710205, -1.9619044065475464, -1.8710427284240723, -1.7801809310913086, -1.689319133758545, -1.5984574556350708, -1.5075957775115967, -1.416733980178833, -1.3258721828460693, -1.2350105047225952, -1.144148826599121, -1.0532870292663574, -0.9624252915382385, -0.8715635538101196, -0.7807018160820007, -0.6898400783538818, -0.5989783406257629, -0.508116602897644, -0.41725486516952515, -0.32639312744140625, -0.23553138971328735, -0.14466965198516846, -0.05380791425704956, 0.037053823471069336, 0.12791556119918823, 0.21877729892730713, 0.309639036655426, 0.4005007743835449, 0.4913625121116638, 0.5822242498397827, 0.6730859875679016, 0.7639479637145996, 0.8548097014427185, 0.9456714391708374, 1.0365331172943115, 1.1273949146270752, 1.2182567119598389, 1.309118390083313, 1.399980068206787, 1.4908418655395508, 1.5817036628723145, 1.6725653409957886, 1.7634270191192627, 1.8542888164520264, 1.94515061378479, 2.0360121726989746, 2.1268739700317383, 2.217735767364502, 2.3085975646972656, 2.3994593620300293, 2.490320920944214, 2.5811827182769775, 2.672044515609741, 2.762906074523926, 2.8537678718566895, 2.944629669189453, 3.035491466522217, 3.1263532638549805, 3.217214822769165, 3.3080766201019287, 3.3989384174346924, 3.489799976348877, 3.5806617736816406, 3.6715235710144043]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 20.0, 35.0, 39.0, 64.0, 90.0, 96.0, 104.0, 104.0, 111.0, 107.0, 72.0, 49.0, 48.0, 20.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.661919593811035, -2.5783746242523193, -2.4948296546936035, -2.4112846851348877, -2.327739715576172, -2.244194746017456, -2.1606497764587402, -2.0771048069000244, -1.9935598373413086, -1.9100148677825928, -1.826469898223877, -1.7429249286651611, -1.6593799591064453, -1.5758349895477295, -1.4922900199890137, -1.4087450504302979, -1.3252002000808716, -1.2416552305221558, -1.15811026096344, -1.0745652914047241, -0.9910203218460083, -0.9074753522872925, -0.8239304423332214, -0.7403854727745056, -0.6568405032157898, -0.573295533657074, -0.48975056409835815, -0.4062056243419647, -0.3226606547832489, -0.23911568522453308, -0.15557074546813965, -0.07202577590942383, 0.011519193649291992, 0.09506415575742722, 0.17860911786556244, 0.26215407252311707, 0.3456990420818329, 0.4292440116405487, 0.5127889513969421, 0.596333920955658, 0.6798788905143738, 0.7634238600730896, 0.8469688296318054, 0.9305137395858765, 1.0140587091445923, 1.097603678703308, 1.181148648262024, 1.2646936178207397, 1.3482385873794556, 1.4317835569381714, 1.5153285264968872, 1.598873496055603, 1.6824184656143188, 1.7659634351730347, 1.849508285522461, 1.9330532550811768, 2.0165982246398926, 2.1001431941986084, 2.183688163757324, 2.26723313331604, 2.350778102874756, 2.4343230724334717, 2.5178680419921875, 2.6014130115509033, 2.684957981109619]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 5.0, 9.0, 17.0, 17.0, 13.0, 25.0, 41.0, 41.0, 70.0, 111.0, 166.0, 288.0, 526.0, 959.0, 2240.0, 6322.0, 23412.0, 119175.0, 641237.0, 204378.0, 35157.0, 8615.0, 2933.0, 1269.0, 615.0, 335.0, 183.0, 122.0, 68.0, 42.0, 38.0, 25.0, 33.0, 20.0, 15.0, 4.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7980499267578125, -0.774322509765625, -0.7505950927734375, -0.72686767578125, -0.7031402587890625, -0.679412841796875, -0.6556854248046875, -0.6319580078125, -0.6082305908203125, -0.584503173828125, -0.5607757568359375, -0.53704833984375, -0.5133209228515625, -0.489593505859375, -0.4658660888671875, -0.442138671875, -0.4184112548828125, -0.394683837890625, -0.3709564208984375, -0.34722900390625, -0.3235015869140625, -0.299774169921875, -0.2760467529296875, -0.2523193359375, -0.2285919189453125, -0.204864501953125, -0.1811370849609375, -0.15740966796875, -0.1336822509765625, -0.109954833984375, -0.0862274169921875, -0.0625, -0.0387725830078125, -0.015045166015625, 0.0086822509765625, 0.03240966796875, 0.0561370849609375, 0.079864501953125, 0.1035919189453125, 0.1273193359375, 0.1510467529296875, 0.174774169921875, 0.1985015869140625, 0.22222900390625, 0.2459564208984375, 0.269683837890625, 0.2934112548828125, 0.317138671875, 0.3408660888671875, 0.364593505859375, 0.3883209228515625, 0.41204833984375, 0.4357757568359375, 0.459503173828125, 0.4832305908203125, 0.5069580078125, 0.5306854248046875, 0.554412841796875, 0.5781402587890625, 0.60186767578125, 0.6255950927734375, 0.649322509765625, 0.6730499267578125, 0.69677734375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 8.0, 24.0, 20.0, 43.0, 54.0, 68.0, 93.0, 98.0, 119.0, 95.0, 88.0, 78.0, 55.0, 58.0, 42.0, 21.0, 10.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15087890625, -0.14321517944335938, -0.13555145263671875, -0.12788772583007812, -0.1202239990234375, -0.11256027221679688, -0.10489654541015625, -0.09723281860351562, -0.089569091796875, -0.08190536499023438, -0.07424163818359375, -0.06657791137695312, -0.0589141845703125, -0.051250457763671875, -0.04358673095703125, -0.035923004150390625, -0.02825927734375, -0.020595550537109375, -0.01293182373046875, -0.005268096923828125, 0.0023956298828125, 0.010059356689453125, 0.01772308349609375, 0.025386810302734375, 0.033050537109375, 0.040714263916015625, 0.04837799072265625, 0.056041717529296875, 0.0637054443359375, 0.07136917114257812, 0.07903289794921875, 0.08669662475585938, 0.0943603515625, 0.10202407836914062, 0.10968780517578125, 0.11735153198242188, 0.1250152587890625, 0.13267898559570312, 0.14034271240234375, 0.14800643920898438, 0.155670166015625, 0.16333389282226562, 0.17099761962890625, 0.17866134643554688, 0.1863250732421875, 0.19398880004882812, 0.20165252685546875, 0.20931625366210938, 0.21697998046875, 0.22464370727539062, 0.23230743408203125, 0.23997116088867188, 0.2476348876953125, 0.2552986145019531, 0.26296234130859375, 0.2706260681152344, 0.278289794921875, 0.2859535217285156, 0.29361724853515625, 0.3012809753417969, 0.3089447021484375, 0.3166084289550781, 0.32427215576171875, 0.3319358825683594, 0.339599609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 17.0, 10.0, 38.0, 43.0, 51.0, 71.0, 127.0, 176.0, 294.0, 515.0, 945.0, 1918.0, 3986.0, 9265.0, 22677.0, 63959.0, 230935.0, 471991.0, 160876.0, 48394.0, 18034.0, 7456.0, 3210.0, 1578.0, 822.0, 422.0, 258.0, 154.0, 123.0, 60.0, 44.0, 31.0, 15.0, 9.0, 9.0, 8.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38623046875, -0.3726158142089844, -0.35900115966796875, -0.3453865051269531, -0.3317718505859375, -0.3181571960449219, -0.30454254150390625, -0.2909278869628906, -0.277313232421875, -0.2636985778808594, -0.25008392333984375, -0.23646926879882812, -0.2228546142578125, -0.20923995971679688, -0.19562530517578125, -0.18201065063476562, -0.16839599609375, -0.15478134155273438, -0.14116668701171875, -0.12755203247070312, -0.1139373779296875, -0.10032272338867188, -0.08670806884765625, -0.07309341430664062, -0.059478759765625, -0.045864105224609375, -0.03224945068359375, -0.018634796142578125, -0.0050201416015625, 0.008594512939453125, 0.02220916748046875, 0.035823822021484375, 0.0494384765625, 0.06305313110351562, 0.07666778564453125, 0.09028244018554688, 0.1038970947265625, 0.11751174926757812, 0.13112640380859375, 0.14474105834960938, 0.158355712890625, 0.17197036743164062, 0.18558502197265625, 0.19919967651367188, 0.2128143310546875, 0.22642898559570312, 0.24004364013671875, 0.2536582946777344, 0.26727294921875, 0.2808876037597656, 0.29450225830078125, 0.3081169128417969, 0.3217315673828125, 0.3353462219238281, 0.34896087646484375, 0.3625755310058594, 0.376190185546875, 0.3898048400878906, 0.40341949462890625, 0.4170341491699219, 0.4306488037109375, 0.4442634582519531, 0.45787811279296875, 0.4714927673339844, 0.485107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 9.0, 11.0, 14.0, 12.0, 15.0, 19.0, 19.0, 26.0, 35.0, 42.0, 33.0, 50.0, 46.0, 54.0, 36.0, 49.0, 52.0, 40.0, 58.0, 46.0, 61.0, 35.0, 30.0, 25.0, 16.0, 28.0, 23.0, 27.0, 14.0, 14.0, 10.0, 5.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4575767517089844, -0.44029998779296875, -0.4230232238769531, -0.4057464599609375, -0.3884696960449219, -0.37119293212890625, -0.3539161682128906, -0.336639404296875, -0.3193626403808594, -0.30208587646484375, -0.2848091125488281, -0.2675323486328125, -0.2502555847167969, -0.23297882080078125, -0.21570205688476562, -0.19842529296875, -0.18114852905273438, -0.16387176513671875, -0.14659500122070312, -0.1293182373046875, -0.11204147338867188, -0.09476470947265625, -0.07748794555664062, -0.060211181640625, -0.042934417724609375, -0.02565765380859375, -0.008380889892578125, 0.0088958740234375, 0.026172637939453125, 0.04344940185546875, 0.060726165771484375, 0.0780029296875, 0.09527969360351562, 0.11255645751953125, 0.12983322143554688, 0.1471099853515625, 0.16438674926757812, 0.18166351318359375, 0.19894027709960938, 0.216217041015625, 0.23349380493164062, 0.25077056884765625, 0.2680473327636719, 0.2853240966796875, 0.3026008605957031, 0.31987762451171875, 0.3371543884277344, 0.35443115234375, 0.3717079162597656, 0.38898468017578125, 0.4062614440917969, 0.4235382080078125, 0.4408149719238281, 0.45809173583984375, 0.4753684997558594, 0.492645263671875, 0.5099220275878906, 0.5271987915039062, 0.5444755554199219, 0.5617523193359375, 0.5790290832519531, 0.5963058471679688, 0.6135826110839844, 0.630859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 12.0, 15.0, 19.0, 25.0, 41.0, 36.0, 63.0, 107.0, 143.0, 283.0, 431.0, 858.0, 1700.0, 3952.0, 12598.0, 72772.0, 540012.0, 359060.0, 41346.0, 8915.0, 3100.0, 1346.0, 727.0, 371.0, 197.0, 147.0, 76.0, 50.0, 32.0, 13.0, 20.0, 18.0, 11.0, 13.0, 7.0, 5.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.158203125, -0.1520862579345703, -0.14596939086914062, -0.13985252380371094, -0.13373565673828125, -0.12761878967285156, -0.12150192260742188, -0.11538505554199219, -0.1092681884765625, -0.10315132141113281, -0.09703445434570312, -0.09091758728027344, -0.08480072021484375, -0.07868385314941406, -0.07256698608398438, -0.06645011901855469, -0.060333251953125, -0.05421638488769531, -0.048099517822265625, -0.04198265075683594, -0.03586578369140625, -0.029748916625976562, -0.023632049560546875, -0.017515182495117188, -0.0113983154296875, -0.0052814483642578125, 0.000835418701171875, 0.0069522857666015625, 0.01306915283203125, 0.019186019897460938, 0.025302886962890625, 0.03141975402832031, 0.03753662109375, 0.04365348815917969, 0.049770355224609375, 0.05588722229003906, 0.06200408935546875, 0.06812095642089844, 0.07423782348632812, 0.08035469055175781, 0.0864715576171875, 0.09258842468261719, 0.09870529174804688, 0.10482215881347656, 0.11093902587890625, 0.11705589294433594, 0.12317276000976562, 0.1292896270751953, 0.135406494140625, 0.1415233612060547, 0.14764022827148438, 0.15375709533691406, 0.15987396240234375, 0.16599082946777344, 0.17210769653320312, 0.1782245635986328, 0.1843414306640625, 0.1904582977294922, 0.19657516479492188, 0.20269203186035156, 0.20880889892578125, 0.21492576599121094, 0.22104263305664062, 0.2271595001220703, 0.2332763671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 6.0, 8.0, 11.0, 17.0, 18.0, 29.0, 39.0, 49.0, 47.0, 53.0, 58.0, 83.0, 77.0, 66.0, 79.0, 59.0, 60.0, 48.0, 47.0, 25.0, 30.0, 19.0, 15.0, 12.0, 9.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.531839370727539e-05, -1.4705583453178406e-05, -1.4092773199081421e-05, -1.3479962944984436e-05, -1.2867152690887451e-05, -1.2254342436790466e-05, -1.1641532182693481e-05, -1.1028721928596497e-05, -1.0415911674499512e-05, -9.803101420402527e-06, -9.190291166305542e-06, -8.577480912208557e-06, -7.964670658111572e-06, -7.351860404014587e-06, -6.7390501499176025e-06, -6.126239895820618e-06, -5.513429641723633e-06, -4.900619387626648e-06, -4.287809133529663e-06, -3.6749988794326782e-06, -3.0621886253356934e-06, -2.4493783712387085e-06, -1.8365681171417236e-06, -1.2237578630447388e-06, -6.109476089477539e-07, 1.862645149230957e-09, 6.146728992462158e-07, 1.2274831533432007e-06, 1.8402934074401855e-06, 2.4531036615371704e-06, 3.0659139156341553e-06, 3.67872416973114e-06, 4.291534423828125e-06, 4.90434467792511e-06, 5.517154932022095e-06, 6.12996518611908e-06, 6.7427754402160645e-06, 7.355585694313049e-06, 7.968395948410034e-06, 8.581206202507019e-06, 9.194016456604004e-06, 9.806826710700989e-06, 1.0419636964797974e-05, 1.1032447218894958e-05, 1.1645257472991943e-05, 1.2258067727088928e-05, 1.2870877981185913e-05, 1.3483688235282898e-05, 1.4096498489379883e-05, 1.4709308743476868e-05, 1.5322118997573853e-05, 1.5934929251670837e-05, 1.6547739505767822e-05, 1.7160549759864807e-05, 1.7773360013961792e-05, 1.8386170268058777e-05, 1.8998980522155762e-05, 1.9611790776252747e-05, 2.022460103034973e-05, 2.0837411284446716e-05, 2.14502215385437e-05, 2.2063031792640686e-05, 2.267584204673767e-05, 2.3288652300834656e-05, 2.390146255493164e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 14.0, 13.0, 19.0, 36.0, 45.0, 68.0, 127.0, 234.0, 473.0, 1032.0, 2690.0, 8247.0, 34322.0, 235640.0, 598235.0, 135681.0, 22117.0, 5816.0, 1946.0, 852.0, 408.0, 214.0, 108.0, 68.0, 41.0, 35.0, 15.0, 8.0, 16.0, 5.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17394638061523438, -0.16857147216796875, -0.16319656372070312, -0.1578216552734375, -0.15244674682617188, -0.14707183837890625, -0.14169692993164062, -0.136322021484375, -0.13094711303710938, -0.12557220458984375, -0.12019729614257812, -0.1148223876953125, -0.10944747924804688, -0.10407257080078125, -0.09869766235351562, -0.09332275390625, -0.08794784545898438, -0.08257293701171875, -0.07719802856445312, -0.0718231201171875, -0.06644821166992188, -0.06107330322265625, -0.055698394775390625, -0.050323486328125, -0.044948577880859375, -0.03957366943359375, -0.034198760986328125, -0.0288238525390625, -0.023448944091796875, -0.01807403564453125, -0.012699127197265625, -0.00732421875, -0.001949310302734375, 0.00342559814453125, 0.008800506591796875, 0.0141754150390625, 0.019550323486328125, 0.02492523193359375, 0.030300140380859375, 0.035675048828125, 0.041049957275390625, 0.04642486572265625, 0.051799774169921875, 0.0571746826171875, 0.06254959106445312, 0.06792449951171875, 0.07329940795898438, 0.07867431640625, 0.08404922485351562, 0.08942413330078125, 0.09479904174804688, 0.1001739501953125, 0.10554885864257812, 0.11092376708984375, 0.11629867553710938, 0.121673583984375, 0.12704849243164062, 0.13242340087890625, 0.13779830932617188, 0.1431732177734375, 0.14854812622070312, 0.15392303466796875, 0.15929794311523438, 0.1646728515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 7.0, 8.0, 5.0, 13.0, 16.0, 28.0, 34.0, 41.0, 67.0, 92.0, 91.0, 113.0, 110.0, 88.0, 87.0, 45.0, 46.0, 29.0, 20.0, 12.0, 16.0, 8.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211181640625, -0.2049388885498047, -0.19869613647460938, -0.19245338439941406, -0.18621063232421875, -0.17996788024902344, -0.17372512817382812, -0.1674823760986328, -0.1612396240234375, -0.1549968719482422, -0.14875411987304688, -0.14251136779785156, -0.13626861572265625, -0.13002586364746094, -0.12378311157226562, -0.11754035949707031, -0.111297607421875, -0.10505485534667969, -0.09881210327148438, -0.09256935119628906, -0.08632659912109375, -0.08008384704589844, -0.07384109497070312, -0.06759834289550781, -0.0613555908203125, -0.05511283874511719, -0.048870086669921875, -0.04262733459472656, -0.03638458251953125, -0.030141830444335938, -0.023899078369140625, -0.017656326293945312, -0.01141357421875, -0.0051708221435546875, 0.001071929931640625, 0.0073146820068359375, 0.01355743408203125, 0.019800186157226562, 0.026042938232421875, 0.03228569030761719, 0.0385284423828125, 0.04477119445800781, 0.051013946533203125, 0.05725669860839844, 0.06349945068359375, 0.06974220275878906, 0.07598495483398438, 0.08222770690917969, 0.088470458984375, 0.09471321105957031, 0.10095596313476562, 0.10719871520996094, 0.11344146728515625, 0.11968421936035156, 0.12592697143554688, 0.1321697235107422, 0.1384124755859375, 0.1446552276611328, 0.15089797973632812, 0.15714073181152344, 0.16338348388671875, 0.16962623596191406, 0.17586898803710938, 0.1821117401123047, 0.1883544921875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 8.0, 17.0, 37.0, 78.0, 187.0, 347.0, 207.0, 78.0, 16.0, 18.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.164790153503418, -6.9453654289245605, -6.725940704345703, -6.506516456604004, -6.2870917320251465, -6.067667007446289, -5.848242282867432, -5.628817558288574, -5.409393310546875, -5.189968585968018, -4.97054386138916, -4.751119613647461, -4.5316948890686035, -4.312270164489746, -4.092845439910889, -3.8734207153320312, -3.653995990753174, -3.4345712661743164, -3.215146780014038, -2.9957220554351807, -2.7762975692749023, -2.556872844696045, -2.3374481201171875, -2.11802339553833, -1.8985989093780518, -1.6791743040084839, -1.459749698638916, -1.2403249740600586, -1.0209003686904907, -0.8014757633209229, -0.5820510387420654, -0.36262643337249756, -0.1432023048400879, 0.07622233033180237, 0.2956469655036926, 0.5150716304779053, 0.7344962358474731, 0.953920841217041, 1.1733455657958984, 1.3927701711654663, 1.6121947765350342, 1.831619381904602, 2.05104398727417, 2.2704687118530273, 2.4898934364318848, 2.709317922592163, 2.9287426471710205, 3.148167133331299, 3.3675918579101562, 3.5870165824890137, 3.806441068649292, 4.02586555480957, 4.245290279388428, 4.464715003967285, 4.684139728546143, 4.903564453125, 5.122988700866699, 5.342413425445557, 5.561838150024414, 5.781262397766113, 6.000687122344971, 6.220111846923828, 6.4395365715026855, 6.658961296081543, 6.8783860206604]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 7.0, 11.0, 13.0, 20.0, 30.0, 26.0, 30.0, 46.0, 54.0, 58.0, 55.0, 53.0, 59.0, 67.0, 52.0, 56.0, 53.0, 51.0, 36.0, 50.0, 36.0, 26.0, 24.0, 15.0, 17.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.710875988006592, -3.5751142501831055, -3.43935227394104, -3.3035905361175537, -3.1678285598754883, -3.032066822052002, -2.8963050842285156, -2.7605433464050293, -2.624781370162964, -2.4890196323394775, -2.353257656097412, -2.217495918273926, -2.0817341804504395, -1.945972204208374, -1.8102104663848877, -1.6744486093521118, -1.538686752319336, -1.40292489528656, -1.2671630382537842, -1.1314013004302979, -0.995639443397522, -0.8598775863647461, -0.724115788936615, -0.5883539915084839, -0.452592134475708, -0.3168303072452545, -0.18106848001480103, -0.045306652784347534, 0.09045517444610596, 0.22621703147888184, 0.36197882890701294, 0.49774062633514404, 0.6335020065307617, 0.7692638635635376, 0.9050256609916687, 1.0407874584197998, 1.1765493154525757, 1.3123111724853516, 1.448072910308838, 1.5838347673416138, 1.7195966243743896, 1.8553584814071655, 1.9911203384399414, 2.1268820762634277, 2.262643814086914, 2.3984057903289795, 2.534167528152466, 2.6699295043945312, 2.8056912422180176, 2.941452980041504, 3.0772149562835693, 3.2129766941070557, 3.348738670349121, 3.4845004081726074, 3.6202621459960938, 3.75602388381958, 3.8917858600616455, 4.027547836303711, 4.163309574127197, 4.299071311950684, 4.43483304977417, 4.570594787597656, 4.706357002258301, 4.842118740081787, 4.977880477905273]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 10.0, 11.0, 16.0, 10.0, 21.0, 29.0, 71.0, 116.0, 221.0, 474.0, 950.0, 2753.0, 10563.0, 88091.0, 3967664.0, 106046.0, 12001.0, 2939.0, 1120.0, 490.0, 260.0, 151.0, 82.0, 53.0, 41.0, 33.0, 21.0, 14.0, 7.0, 3.0, 11.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5185546875, -0.494476318359375, -0.47039794921875, -0.446319580078125, -0.4222412109375, -0.398162841796875, -0.37408447265625, -0.350006103515625, -0.325927734375, -0.301849365234375, -0.27777099609375, -0.253692626953125, -0.2296142578125, -0.205535888671875, -0.18145751953125, -0.157379150390625, -0.13330078125, -0.109222412109375, -0.08514404296875, -0.061065673828125, -0.0369873046875, -0.012908935546875, 0.01116943359375, 0.035247802734375, 0.059326171875, 0.083404541015625, 0.10748291015625, 0.131561279296875, 0.1556396484375, 0.179718017578125, 0.20379638671875, 0.227874755859375, 0.251953125, 0.276031494140625, 0.30010986328125, 0.324188232421875, 0.3482666015625, 0.372344970703125, 0.39642333984375, 0.420501708984375, 0.444580078125, 0.468658447265625, 0.49273681640625, 0.516815185546875, 0.5408935546875, 0.564971923828125, 0.58905029296875, 0.613128662109375, 0.63720703125, 0.661285400390625, 0.68536376953125, 0.709442138671875, 0.7335205078125, 0.757598876953125, 0.78167724609375, 0.805755615234375, 0.829833984375, 0.853912353515625, 0.87799072265625, 0.902069091796875, 0.9261474609375, 0.950225830078125, 0.97430419921875, 0.998382568359375, 1.0224609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 3.0, 16.0, 25.0, 33.0, 37.0, 78.0, 64.0, 84.0, 101.0, 93.0, 96.0, 79.0, 72.0, 65.0, 48.0, 39.0, 25.0, 13.0, 9.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.146484375, -0.13861465454101562, -0.13074493408203125, -0.12287521362304688, -0.1150054931640625, -0.10713577270507812, -0.09926605224609375, -0.09139633178710938, -0.083526611328125, -0.07565689086914062, -0.06778717041015625, -0.059917449951171875, -0.0520477294921875, -0.044178009033203125, -0.03630828857421875, -0.028438568115234375, -0.02056884765625, -0.012699127197265625, -0.00482940673828125, 0.003040313720703125, 0.0109100341796875, 0.018779754638671875, 0.02664947509765625, 0.034519195556640625, 0.042388916015625, 0.050258636474609375, 0.05812835693359375, 0.06599807739257812, 0.0738677978515625, 0.08173751831054688, 0.08960723876953125, 0.09747695922851562, 0.1053466796875, 0.11321640014648438, 0.12108612060546875, 0.12895584106445312, 0.1368255615234375, 0.14469528198242188, 0.15256500244140625, 0.16043472290039062, 0.168304443359375, 0.17617416381835938, 0.18404388427734375, 0.19191360473632812, 0.1997833251953125, 0.20765304565429688, 0.21552276611328125, 0.22339248657226562, 0.23126220703125, 0.23913192749023438, 0.24700164794921875, 0.2548713684082031, 0.2627410888671875, 0.2706108093261719, 0.27848052978515625, 0.2863502502441406, 0.294219970703125, 0.3020896911621094, 0.30995941162109375, 0.3178291320800781, 0.3256988525390625, 0.3335685729980469, 0.34143829345703125, 0.3493080139160156, 0.357177734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 5.0, 4.0, 7.0, 19.0, 46.0, 85.0, 132.0, 213.0, 378.0, 736.0, 1646.0, 5044.0, 32228.0, 3855073.0, 280317.0, 13150.0, 2823.0, 1136.0, 520.0, 287.0, 159.0, 92.0, 55.0, 46.0, 25.0, 23.0, 12.0, 10.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.0390625, -1.0115737915039062, -0.9840850830078125, -0.9565963745117188, -0.929107666015625, -0.9016189575195312, -0.8741302490234375, -0.8466415405273438, -0.81915283203125, -0.7916641235351562, -0.7641754150390625, -0.7366867065429688, -0.709197998046875, -0.6817092895507812, -0.6542205810546875, -0.6267318725585938, -0.5992431640625, -0.5717544555664062, -0.5442657470703125, -0.5167770385742188, -0.489288330078125, -0.46179962158203125, -0.4343109130859375, -0.40682220458984375, -0.37933349609375, -0.35184478759765625, -0.3243560791015625, -0.29686737060546875, -0.269378662109375, -0.24188995361328125, -0.2144012451171875, -0.18691253662109375, -0.159423828125, -0.13193511962890625, -0.1044464111328125, -0.07695770263671875, -0.049468994140625, -0.02198028564453125, 0.0055084228515625, 0.03299713134765625, 0.06048583984375, 0.08797454833984375, 0.1154632568359375, 0.14295196533203125, 0.170440673828125, 0.19792938232421875, 0.2254180908203125, 0.25290679931640625, 0.2803955078125, 0.30788421630859375, 0.3353729248046875, 0.36286163330078125, 0.390350341796875, 0.41783905029296875, 0.4453277587890625, 0.47281646728515625, 0.50030517578125, 0.5277938842773438, 0.5552825927734375, 0.5827713012695312, 0.610260009765625, 0.6377487182617188, 0.6652374267578125, 0.6927261352539062, 0.72021484375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 6.0, 4.0, 4.0, 5.0, 10.0, 13.0, 28.0, 45.0, 100.0, 346.0, 2676.0, 595.0, 117.0, 58.0, 21.0, 23.0, 10.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.294921875, -0.2842674255371094, -0.27361297607421875, -0.2629585266113281, -0.2523040771484375, -0.24164962768554688, -0.23099517822265625, -0.22034072875976562, -0.209686279296875, -0.19903182983398438, -0.18837738037109375, -0.17772293090820312, -0.1670684814453125, -0.15641403198242188, -0.14575958251953125, -0.13510513305664062, -0.12445068359375, -0.11379623413085938, -0.10314178466796875, -0.09248733520507812, -0.0818328857421875, -0.07117843627929688, -0.06052398681640625, -0.049869537353515625, -0.039215087890625, -0.028560638427734375, -0.01790618896484375, -0.007251739501953125, 0.0034027099609375, 0.014057159423828125, 0.02471160888671875, 0.035366058349609375, 0.0460205078125, 0.056674957275390625, 0.06732940673828125, 0.07798385620117188, 0.0886383056640625, 0.09929275512695312, 0.10994720458984375, 0.12060165405273438, 0.131256103515625, 0.14191055297851562, 0.15256500244140625, 0.16321945190429688, 0.1738739013671875, 0.18452835083007812, 0.19518280029296875, 0.20583724975585938, 0.21649169921875, 0.22714614868164062, 0.23780059814453125, 0.24845504760742188, 0.2591094970703125, 0.2697639465332031, 0.28041839599609375, 0.2910728454589844, 0.301727294921875, 0.3123817443847656, 0.32303619384765625, 0.3336906433105469, 0.3443450927734375, 0.3549995422363281, 0.36565399169921875, 0.3763084411621094, 0.386962890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 23.0, 48.0, 141.0, 278.0, 293.0, 140.0, 37.0, 15.0, 9.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8432812690734863, -2.777459144592285, -2.711637020111084, -2.645815134048462, -2.5799930095672607, -2.5141708850860596, -2.4483487606048584, -2.3825266361236572, -2.316704750061035, -2.250882625579834, -2.185060501098633, -2.1192386150360107, -2.0534164905548096, -1.9875943660736084, -1.9217722415924072, -1.855950117111206, -1.7901279926300049, -1.7243058681488037, -1.658483862876892, -1.592661738395691, -1.5268397331237793, -1.4610176086425781, -1.395195484161377, -1.3293733596801758, -1.2635513544082642, -1.197729229927063, -1.1319072246551514, -1.0660851001739502, -1.000262975692749, -0.9344409704208374, -0.8686188459396362, -0.8027967810630798, -0.7369744777679443, -0.6711524128913879, -0.6053303480148315, -0.5395082235336304, -0.473686158657074, -0.4078640937805176, -0.3420419991016388, -0.27621990442276, -0.2103978395462036, -0.14457575976848602, -0.07875367999076843, -0.012931600213050842, 0.05289047956466675, 0.11871254444122314, 0.18453463912010193, 0.2503567337989807, 0.3161787986755371, 0.3820008635520935, 0.4478229582309723, 0.5136450529098511, 0.5794671177864075, 0.6452891826629639, 0.711111307144165, 0.7769333720207214, 0.8427554368972778, 0.9085775017738342, 0.9743995666503906, 1.0402216911315918, 1.106043815612793, 1.1718658208847046, 1.2376879453659058, 1.3035099506378174, 1.3693320751190186]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 11.0, 17.0, 20.0, 26.0, 26.0, 34.0, 59.0, 71.0, 70.0, 109.0, 75.0, 83.0, 85.0, 82.0, 60.0, 59.0, 36.0, 23.0, 21.0, 11.0, 13.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1679142713546753, -1.1222763061523438, -1.0766383409500122, -1.0310003757476807, -0.9853624105453491, -0.9397244453430176, -0.8940865397453308, -0.8484485745429993, -0.8028106093406677, -0.7571726441383362, -0.7115346789360046, -0.6658967733383179, -0.6202588081359863, -0.5746208429336548, -0.5289828777313232, -0.4833449125289917, -0.43770694732666016, -0.3920689821243286, -0.34643101692199707, -0.3007930815219879, -0.25515511631965637, -0.20951715111732483, -0.16387921571731567, -0.11824125051498413, -0.07260328531265259, -0.026965327560901642, 0.018672630190849304, 0.06431058049201965, 0.1099485456943512, 0.15558651089668274, 0.2012244462966919, 0.24686241149902344, 0.29250025749206543, 0.338138222694397, 0.3837761878967285, 0.42941412329673767, 0.4750520884990692, 0.5206900835037231, 0.5663279891014099, 0.6119659543037415, 0.657603919506073, 0.7032418847084045, 0.7488798499107361, 0.7945177555084229, 0.8401557207107544, 0.8857936859130859, 0.9314316511154175, 0.977069616317749, 1.0227075815200806, 1.068345546722412, 1.1139835119247437, 1.1596214771270752, 1.2052594423294067, 1.2508974075317383, 1.2965352535247803, 1.3421733379364014, 1.3878111839294434, 1.433449149131775, 1.4790871143341064, 1.524725079536438, 1.5703630447387695, 1.616001009941101, 1.6616389751434326, 1.7072768211364746, 1.7529149055480957]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 15.0, 20.0, 24.0, 35.0, 42.0, 72.0, 111.0, 183.0, 312.0, 636.0, 1369.0, 3224.0, 8501.0, 26132.0, 97755.0, 446157.0, 354888.0, 75699.0, 20943.0, 7089.0, 2803.0, 1172.0, 522.0, 308.0, 170.0, 104.0, 66.0, 48.0, 31.0, 23.0, 9.0, 18.0, 4.0, 5.0, 5.0, 6.0, 3.0, 5.0, 4.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.626953125, -0.6079025268554688, -0.5888519287109375, -0.5698013305664062, -0.550750732421875, -0.5317001342773438, -0.5126495361328125, -0.49359893798828125, -0.47454833984375, -0.45549774169921875, -0.4364471435546875, -0.41739654541015625, -0.398345947265625, -0.37929534912109375, -0.3602447509765625, -0.34119415283203125, -0.3221435546875, -0.30309295654296875, -0.2840423583984375, -0.26499176025390625, -0.245941162109375, -0.22689056396484375, -0.2078399658203125, -0.18878936767578125, -0.16973876953125, -0.15068817138671875, -0.1316375732421875, -0.11258697509765625, -0.093536376953125, -0.07448577880859375, -0.0554351806640625, -0.03638458251953125, -0.017333984375, 0.00171661376953125, 0.0207672119140625, 0.03981781005859375, 0.058868408203125, 0.07791900634765625, 0.0969696044921875, 0.11602020263671875, 0.13507080078125, 0.15412139892578125, 0.1731719970703125, 0.19222259521484375, 0.211273193359375, 0.23032379150390625, 0.2493743896484375, 0.26842498779296875, 0.2874755859375, 0.30652618408203125, 0.3255767822265625, 0.34462738037109375, 0.363677978515625, 0.38272857666015625, 0.4017791748046875, 0.42082977294921875, 0.43988037109375, 0.45893096923828125, 0.4779815673828125, 0.49703216552734375, 0.516082763671875, 0.5351333618164062, 0.5541839599609375, 0.5732345581054688, 0.59228515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 10.0, 10.0, 10.0, 39.0, 44.0, 64.0, 63.0, 56.0, 80.0, 109.0, 82.0, 99.0, 71.0, 65.0, 51.0, 39.0, 37.0, 26.0, 13.0, 12.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14599609375, -0.13876724243164062, -0.13153839111328125, -0.12430953979492188, -0.1170806884765625, -0.10985183715820312, -0.10262298583984375, -0.09539413452148438, -0.088165283203125, -0.08093643188476562, -0.07370758056640625, -0.06647872924804688, -0.0592498779296875, -0.052021026611328125, -0.04479217529296875, -0.037563323974609375, -0.03033447265625, -0.023105621337890625, -0.01587677001953125, -0.008647918701171875, -0.0014190673828125, 0.005809783935546875, 0.01303863525390625, 0.020267486572265625, 0.027496337890625, 0.034725189208984375, 0.04195404052734375, 0.049182891845703125, 0.0564117431640625, 0.06364059448242188, 0.07086944580078125, 0.07809829711914062, 0.0853271484375, 0.09255599975585938, 0.09978485107421875, 0.10701370239257812, 0.1142425537109375, 0.12147140502929688, 0.12870025634765625, 0.13592910766601562, 0.143157958984375, 0.15038681030273438, 0.15761566162109375, 0.16484451293945312, 0.1720733642578125, 0.17930221557617188, 0.18653106689453125, 0.19375991821289062, 0.20098876953125, 0.20821762084960938, 0.21544647216796875, 0.22267532348632812, 0.2299041748046875, 0.23713302612304688, 0.24436187744140625, 0.2515907287597656, 0.258819580078125, 0.2660484313964844, 0.27327728271484375, 0.2805061340332031, 0.2877349853515625, 0.2949638366699219, 0.30219268798828125, 0.3094215393066406, 0.316650390625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 8.0, 5.0, 13.0, 24.0, 26.0, 41.0, 67.0, 106.0, 124.0, 237.0, 290.0, 578.0, 901.0, 1601.0, 2987.0, 5597.0, 11595.0, 25743.0, 63298.0, 180797.0, 404174.0, 218566.0, 74688.0, 29811.0, 13179.0, 6362.0, 3307.0, 1827.0, 952.0, 584.0, 355.0, 248.0, 120.0, 100.0, 70.0, 57.0, 40.0, 15.0, 9.0, 9.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.345703125, -0.3344001770019531, -0.32309722900390625, -0.3117942810058594, -0.3004913330078125, -0.2891883850097656, -0.27788543701171875, -0.2665824890136719, -0.255279541015625, -0.24397659301757812, -0.23267364501953125, -0.22137069702148438, -0.2100677490234375, -0.19876480102539062, -0.18746185302734375, -0.17615890502929688, -0.16485595703125, -0.15355300903320312, -0.14225006103515625, -0.13094711303710938, -0.1196441650390625, -0.10834121704101562, -0.09703826904296875, -0.08573532104492188, -0.074432373046875, -0.06312942504882812, -0.05182647705078125, -0.040523529052734375, -0.0292205810546875, -0.017917633056640625, -0.00661468505859375, 0.004688262939453125, 0.0159912109375, 0.027294158935546875, 0.03859710693359375, 0.049900054931640625, 0.0612030029296875, 0.07250595092773438, 0.08380889892578125, 0.09511184692382812, 0.106414794921875, 0.11771774291992188, 0.12902069091796875, 0.14032363891601562, 0.1516265869140625, 0.16292953491210938, 0.17423248291015625, 0.18553543090820312, 0.19683837890625, 0.20814132690429688, 0.21944427490234375, 0.23074722290039062, 0.2420501708984375, 0.2533531188964844, 0.26465606689453125, 0.2759590148925781, 0.287261962890625, 0.2985649108886719, 0.30986785888671875, 0.3211708068847656, 0.3324737548828125, 0.3437767028808594, 0.35507965087890625, 0.3663825988769531, 0.377685546875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 12.0, 5.0, 16.0, 17.0, 17.0, 19.0, 28.0, 28.0, 36.0, 39.0, 32.0, 35.0, 46.0, 46.0, 52.0, 48.0, 42.0, 47.0, 57.0, 43.0, 45.0, 39.0, 26.0, 36.0, 28.0, 32.0, 25.0, 17.0, 20.0, 17.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.542205810546875, -0.52386474609375, -0.505523681640625, -0.4871826171875, -0.468841552734375, -0.45050048828125, -0.432159423828125, -0.413818359375, -0.395477294921875, -0.37713623046875, -0.358795166015625, -0.3404541015625, -0.322113037109375, -0.30377197265625, -0.285430908203125, -0.26708984375, -0.248748779296875, -0.23040771484375, -0.212066650390625, -0.1937255859375, -0.175384521484375, -0.15704345703125, -0.138702392578125, -0.120361328125, -0.102020263671875, -0.08367919921875, -0.065338134765625, -0.0469970703125, -0.028656005859375, -0.01031494140625, 0.008026123046875, 0.0263671875, 0.044708251953125, 0.06304931640625, 0.081390380859375, 0.0997314453125, 0.118072509765625, 0.13641357421875, 0.154754638671875, 0.173095703125, 0.191436767578125, 0.20977783203125, 0.228118896484375, 0.2464599609375, 0.264801025390625, 0.28314208984375, 0.301483154296875, 0.31982421875, 0.338165283203125, 0.35650634765625, 0.374847412109375, 0.3931884765625, 0.411529541015625, 0.42987060546875, 0.448211669921875, 0.466552734375, 0.484893798828125, 0.50323486328125, 0.521575927734375, 0.5399169921875, 0.558258056640625, 0.57659912109375, 0.594940185546875, 0.61328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 12.0, 7.0, 15.0, 24.0, 51.0, 67.0, 139.0, 276.0, 575.0, 1470.0, 4763.0, 27533.0, 357622.0, 594042.0, 51391.0, 7161.0, 1968.0, 750.0, 306.0, 184.0, 74.0, 49.0, 27.0, 19.0, 9.0, 9.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2093505859375, -0.20163536071777344, -0.19392013549804688, -0.1862049102783203, -0.17848968505859375, -0.1707744598388672, -0.16305923461914062, -0.15534400939941406, -0.1476287841796875, -0.13991355895996094, -0.13219833374023438, -0.12448310852050781, -0.11676788330078125, -0.10905265808105469, -0.10133743286132812, -0.09362220764160156, -0.085906982421875, -0.07819175720214844, -0.07047653198242188, -0.06276130676269531, -0.05504608154296875, -0.04733085632324219, -0.039615631103515625, -0.03190040588378906, -0.0241851806640625, -0.016469955444335938, -0.008754730224609375, -0.0010395050048828125, 0.00667572021484375, 0.014390945434570312, 0.022106170654296875, 0.029821395874023438, 0.03753662109375, 0.04525184631347656, 0.052967071533203125, 0.06068229675292969, 0.06839752197265625, 0.07611274719238281, 0.08382797241210938, 0.09154319763183594, 0.0992584228515625, 0.10697364807128906, 0.11468887329101562, 0.12240409851074219, 0.13011932373046875, 0.1378345489501953, 0.14554977416992188, 0.15326499938964844, 0.160980224609375, 0.16869544982910156, 0.17641067504882812, 0.1841259002685547, 0.19184112548828125, 0.1995563507080078, 0.20727157592773438, 0.21498680114746094, 0.2227020263671875, 0.23041725158691406, 0.23813247680664062, 0.2458477020263672, 0.25356292724609375, 0.2612781524658203, 0.2689933776855469, 0.27670860290527344, 0.284423828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 5.0, 21.0, 38.0, 53.0, 135.0, 178.0, 202.0, 160.0, 114.0, 54.0, 26.0, 14.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.675037831068039e-05, -2.500973641872406e-05, -2.326909452676773e-05, -2.15284526348114e-05, -1.9787810742855072e-05, -1.8047168850898743e-05, -1.6306526958942413e-05, -1.4565885066986084e-05, -1.2825243175029755e-05, -1.1084601283073425e-05, -9.343959391117096e-06, -7.603317499160767e-06, -5.862675607204437e-06, -4.122033715248108e-06, -2.3813918232917786e-06, -6.407499313354492e-07, 1.0998919606208801e-06, 2.8405338525772095e-06, 4.581175744533539e-06, 6.321817636489868e-06, 8.062459528446198e-06, 9.803101420402527e-06, 1.1543743312358856e-05, 1.3284385204315186e-05, 1.5025027096271515e-05, 1.6765668988227844e-05, 1.8506310880184174e-05, 2.0246952772140503e-05, 2.1987594664096832e-05, 2.372823655605316e-05, 2.546887844800949e-05, 2.720952033996582e-05, 2.895016223192215e-05, 3.069080412387848e-05, 3.243144601583481e-05, 3.417208790779114e-05, 3.591272979974747e-05, 3.7653371691703796e-05, 3.9394013583660126e-05, 4.1134655475616455e-05, 4.2875297367572784e-05, 4.4615939259529114e-05, 4.635658115148544e-05, 4.809722304344177e-05, 4.98378649353981e-05, 5.157850682735443e-05, 5.331914871931076e-05, 5.505979061126709e-05, 5.680043250322342e-05, 5.854107439517975e-05, 6.028171628713608e-05, 6.202235817909241e-05, 6.376300007104874e-05, 6.550364196300507e-05, 6.72442838549614e-05, 6.898492574691772e-05, 7.072556763887405e-05, 7.246620953083038e-05, 7.420685142278671e-05, 7.594749331474304e-05, 7.768813520669937e-05, 7.94287770986557e-05, 8.116941899061203e-05, 8.291006088256836e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 18.0, 15.0, 48.0, 59.0, 91.0, 214.0, 527.0, 1468.0, 5365.0, 30572.0, 386623.0, 565807.0, 47647.0, 7081.0, 1790.0, 606.0, 249.0, 143.0, 68.0, 41.0, 32.0, 18.0, 17.0, 13.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.284423828125, -0.2769584655761719, -0.26949310302734375, -0.2620277404785156, -0.2545623779296875, -0.24709701538085938, -0.23963165283203125, -0.23216629028320312, -0.224700927734375, -0.21723556518554688, -0.20977020263671875, -0.20230484008789062, -0.1948394775390625, -0.18737411499023438, -0.17990875244140625, -0.17244338989257812, -0.16497802734375, -0.15751266479492188, -0.15004730224609375, -0.14258193969726562, -0.1351165771484375, -0.12765121459960938, -0.12018585205078125, -0.11272048950195312, -0.105255126953125, -0.09778976440429688, -0.09032440185546875, -0.08285903930664062, -0.0753936767578125, -0.06792831420898438, -0.06046295166015625, -0.052997589111328125, -0.0455322265625, -0.038066864013671875, -0.03060150146484375, -0.023136138916015625, -0.0156707763671875, -0.008205413818359375, -0.00074005126953125, 0.006725311279296875, 0.014190673828125, 0.021656036376953125, 0.02912139892578125, 0.036586761474609375, 0.0440521240234375, 0.051517486572265625, 0.05898284912109375, 0.06644821166992188, 0.07391357421875, 0.08137893676757812, 0.08884429931640625, 0.09630966186523438, 0.1037750244140625, 0.11124038696289062, 0.11870574951171875, 0.12617111206054688, 0.133636474609375, 0.14110183715820312, 0.14856719970703125, 0.15603256225585938, 0.1634979248046875, 0.17096328735351562, 0.17842864990234375, 0.18589401245117188, 0.193359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 10.0, 10.0, 17.0, 22.0, 36.0, 45.0, 74.0, 85.0, 88.0, 110.0, 118.0, 86.0, 69.0, 75.0, 28.0, 30.0, 21.0, 25.0, 15.0, 9.0, 5.0, 5.0, 3.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1976318359375, -0.19101715087890625, -0.1844024658203125, -0.17778778076171875, -0.171173095703125, -0.16455841064453125, -0.1579437255859375, -0.15132904052734375, -0.14471435546875, -0.13809967041015625, -0.1314849853515625, -0.12487030029296875, -0.118255615234375, -0.11164093017578125, -0.1050262451171875, -0.09841156005859375, -0.091796875, -0.08518218994140625, -0.0785675048828125, -0.07195281982421875, -0.065338134765625, -0.05872344970703125, -0.0521087646484375, -0.04549407958984375, -0.03887939453125, -0.03226470947265625, -0.0256500244140625, -0.01903533935546875, -0.012420654296875, -0.00580596923828125, 0.0008087158203125, 0.00742340087890625, 0.0140380859375, 0.02065277099609375, 0.0272674560546875, 0.03388214111328125, 0.040496826171875, 0.04711151123046875, 0.0537261962890625, 0.06034088134765625, 0.06695556640625, 0.07357025146484375, 0.0801849365234375, 0.08679962158203125, 0.093414306640625, 0.10002899169921875, 0.1066436767578125, 0.11325836181640625, 0.119873046875, 0.12648773193359375, 0.1331024169921875, 0.13971710205078125, 0.146331787109375, 0.15294647216796875, 0.1595611572265625, 0.16617584228515625, 0.17279052734375, 0.17940521240234375, 0.1860198974609375, 0.19263458251953125, 0.199249267578125, 0.20586395263671875, 0.2124786376953125, 0.21909332275390625, 0.2257080078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 21.0, 80.0, 295.0, 459.0, 107.0, 32.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836428642272949, -6.480191707611084, -6.123955249786377, -5.767718315124512, -5.411481857299805, -5.0552449226379395, -4.699007987976074, -4.342771530151367, -3.986534833908081, -3.630298137664795, -3.274061441421509, -2.9178247451782227, -2.5615878105163574, -2.2053513526916504, -1.8491144180297852, -1.492877721786499, -1.136641025543213, -0.7804043292999268, -0.42416757345199585, -0.06793081760406494, 0.2883058786392212, 0.6445425748825073, 1.000779390335083, 1.3570160865783691, 1.7132527828216553, 2.0694894790649414, 2.4257261753082275, 2.7819628715515137, 3.138199806213379, 3.494436264038086, 3.850673198699951, 4.206910133361816, 4.563146591186523, 4.919383525848389, 5.275619983673096, 5.631856918334961, 5.988093376159668, 6.344330310821533, 6.700567245483398, 7.0568037033081055, 7.4130401611328125, 7.769277095794678, 8.125514030456543, 8.48175048828125, 8.837986946105957, 9.194223403930664, 9.550460815429688, 9.906697273254395, 10.262933731079102, 10.619170188903809, 10.975407600402832, 11.331644058227539, 11.687880516052246, 12.044116973876953, 12.400354385375977, 12.756590843200684, 13.112828254699707, 13.469064712524414, 13.825302124023438, 14.181538581848145, 14.537775039672852, 14.894011497497559, 15.250248908996582, 15.606485366821289, 15.962721824645996]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 9.0, 12.0, 17.0, 16.0, 24.0, 14.0, 30.0, 28.0, 29.0, 42.0, 32.0, 44.0, 47.0, 51.0, 66.0, 37.0, 42.0, 59.0, 48.0, 54.0, 36.0, 42.0, 33.0, 28.0, 24.0, 20.0, 22.0, 18.0, 18.0, 9.0, 9.0, 8.0, 6.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7749481201171875, -3.656970500946045, -3.5389928817749023, -3.421015501022339, -3.3030378818511963, -3.1850602626800537, -3.067082643508911, -2.9491052627563477, -2.831127643585205, -2.7131500244140625, -2.59517240524292, -2.4771950244903564, -2.359217405319214, -2.2412397861480713, -2.1232621669769287, -2.0052847862243652, -1.887307047843933, -1.7693294286727905, -1.6513519287109375, -1.533374309539795, -1.415396809577942, -1.2974191904067993, -1.1794416904449463, -1.0614640712738037, -0.9434865117073059, -0.8255089521408081, -0.7075313925743103, -0.5895538330078125, -0.4715762436389923, -0.3535986542701721, -0.23562109470367432, -0.11764353513717651, 0.00033402442932128906, 0.11831159144639969, 0.2362891584634781, 0.3542667329311371, 0.4722442924976349, 0.5902218818664551, 0.7081994414329529, 0.8261770009994507, 0.9441545605659485, 1.0621321201324463, 1.1801097393035889, 1.298087239265442, 1.4160648584365845, 1.5340423583984375, 1.65201997756958, 1.7699975967407227, 1.8879750967025757, 2.0059525966644287, 2.1239302158355713, 2.241907835006714, 2.3598854541778564, 2.47786283493042, 2.5958404541015625, 2.713818073272705, 2.8317956924438477, 2.9497733116149902, 3.067750930786133, 3.1857283115386963, 3.303705930709839, 3.4216835498809814, 3.539661169052124, 3.6576385498046875, 3.77561616897583]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 17.0, 18.0, 43.0, 59.0, 100.0, 165.0, 368.0, 945.0, 2746.0, 15327.0, 3808720.0, 351967.0, 9937.0, 2220.0, 823.0, 362.0, 176.0, 100.0, 65.0, 31.0, 25.0, 14.0, 15.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8370437622070312, -0.7927398681640625, -0.7484359741210938, -0.704132080078125, -0.6598281860351562, -0.6155242919921875, -0.5712203979492188, -0.52691650390625, -0.48261260986328125, -0.4383087158203125, -0.39400482177734375, -0.349700927734375, -0.30539703369140625, -0.2610931396484375, -0.21678924560546875, -0.1724853515625, -0.12818145751953125, -0.0838775634765625, -0.03957366943359375, 0.004730224609375, 0.04903411865234375, 0.0933380126953125, 0.13764190673828125, 0.18194580078125, 0.22624969482421875, 0.2705535888671875, 0.31485748291015625, 0.359161376953125, 0.40346527099609375, 0.4477691650390625, 0.49207305908203125, 0.536376953125, 0.5806808471679688, 0.6249847412109375, 0.6692886352539062, 0.713592529296875, 0.7578964233398438, 0.8022003173828125, 0.8465042114257812, 0.89080810546875, 0.9351119995117188, 0.9794158935546875, 1.0237197875976562, 1.068023681640625, 1.1123275756835938, 1.1566314697265625, 1.2009353637695312, 1.2452392578125, 1.2895431518554688, 1.3338470458984375, 1.3781509399414062, 1.422454833984375, 1.4667587280273438, 1.5110626220703125, 1.5553665161132812, 1.59967041015625, 1.6439743041992188, 1.6882781982421875, 1.7325820922851562, 1.776885986328125, 1.8211898803710938, 1.8654937744140625, 1.9097976684570312, 1.9541015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 10.0, 9.0, 16.0, 29.0, 28.0, 37.0, 44.0, 50.0, 62.0, 67.0, 73.0, 85.0, 63.0, 61.0, 63.0, 67.0, 59.0, 32.0, 32.0, 24.0, 24.0, 23.0, 14.0, 10.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1485595703125, -0.14116477966308594, -0.13376998901367188, -0.1263751983642578, -0.11898040771484375, -0.11158561706542969, -0.10419082641601562, -0.09679603576660156, -0.0894012451171875, -0.08200645446777344, -0.07461166381835938, -0.06721687316894531, -0.05982208251953125, -0.05242729187011719, -0.045032501220703125, -0.03763771057128906, -0.030242919921875, -0.022848129272460938, -0.015453338623046875, -0.008058547973632812, -0.00066375732421875, 0.0067310333251953125, 0.014125823974609375, 0.021520614624023438, 0.0289154052734375, 0.03631019592285156, 0.043704986572265625, 0.05109977722167969, 0.05849456787109375, 0.06588935852050781, 0.07328414916992188, 0.08067893981933594, 0.08807373046875, 0.09546852111816406, 0.10286331176757812, 0.11025810241699219, 0.11765289306640625, 0.1250476837158203, 0.13244247436523438, 0.13983726501464844, 0.1472320556640625, 0.15462684631347656, 0.16202163696289062, 0.1694164276123047, 0.17681121826171875, 0.1842060089111328, 0.19160079956054688, 0.19899559020996094, 0.206390380859375, 0.21378517150878906, 0.22117996215820312, 0.2285747528076172, 0.23596954345703125, 0.2433643341064453, 0.2507591247558594, 0.25815391540527344, 0.2655487060546875, 0.27294349670410156, 0.2803382873535156, 0.2877330780029297, 0.29512786865234375, 0.3025226593017578, 0.3099174499511719, 0.31731224060058594, 0.32470703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 13.0, 20.0, 46.0, 102.0, 197.0, 383.0, 929.0, 3065.0, 20925.0, 3953860.0, 203971.0, 7952.0, 1615.0, 599.0, 272.0, 150.0, 75.0, 58.0, 26.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.0278778076171875, -0.986419677734375, -0.9449615478515625, -0.90350341796875, -0.8620452880859375, -0.820587158203125, -0.7791290283203125, -0.7376708984375, -0.6962127685546875, -0.654754638671875, -0.6132965087890625, -0.57183837890625, -0.5303802490234375, -0.488922119140625, -0.4474639892578125, -0.406005859375, -0.3645477294921875, -0.323089599609375, -0.2816314697265625, -0.24017333984375, -0.1987152099609375, -0.157257080078125, -0.1157989501953125, -0.0743408203125, -0.0328826904296875, 0.008575439453125, 0.0500335693359375, 0.09149169921875, 0.1329498291015625, 0.174407958984375, 0.2158660888671875, 0.25732421875, 0.2987823486328125, 0.340240478515625, 0.3816986083984375, 0.42315673828125, 0.4646148681640625, 0.506072998046875, 0.5475311279296875, 0.5889892578125, 0.6304473876953125, 0.671905517578125, 0.7133636474609375, 0.75482177734375, 0.7962799072265625, 0.837738037109375, 0.8791961669921875, 0.920654296875, 0.9621124267578125, 1.003570556640625, 1.0450286865234375, 1.08648681640625, 1.1279449462890625, 1.169403076171875, 1.2108612060546875, 1.2523193359375, 1.2937774658203125, 1.335235595703125, 1.3766937255859375, 1.41815185546875, 1.4596099853515625, 1.501068115234375, 1.5425262451171875, 1.583984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 13.0, 22.0, 26.0, 65.0, 203.0, 2129.0, 1280.0, 172.0, 58.0, 36.0, 23.0, 14.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5027847290039062, -0.4865264892578125, -0.47026824951171875, -0.454010009765625, -0.43775177001953125, -0.4214935302734375, -0.40523529052734375, -0.38897705078125, -0.37271881103515625, -0.3564605712890625, -0.34020233154296875, -0.323944091796875, -0.30768585205078125, -0.2914276123046875, -0.27516937255859375, -0.2589111328125, -0.24265289306640625, -0.2263946533203125, -0.21013641357421875, -0.193878173828125, -0.17761993408203125, -0.1613616943359375, -0.14510345458984375, -0.12884521484375, -0.11258697509765625, -0.0963287353515625, -0.08007049560546875, -0.063812255859375, -0.04755401611328125, -0.0312957763671875, -0.01503753662109375, 0.001220703125, 0.01747894287109375, 0.0337371826171875, 0.04999542236328125, 0.066253662109375, 0.08251190185546875, 0.0987701416015625, 0.11502838134765625, 0.13128662109375, 0.14754486083984375, 0.1638031005859375, 0.18006134033203125, 0.196319580078125, 0.21257781982421875, 0.2288360595703125, 0.24509429931640625, 0.2613525390625, 0.27761077880859375, 0.2938690185546875, 0.31012725830078125, 0.326385498046875, 0.34264373779296875, 0.3589019775390625, 0.37516021728515625, 0.39141845703125, 0.40767669677734375, 0.4239349365234375, 0.44019317626953125, 0.456451416015625, 0.47270965576171875, 0.4889678955078125, 0.5052261352539062, 0.521484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 28.0, 201.0, 637.0, 116.0, 16.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-11.237338066101074, -11.038126945495605, -10.838916778564453, -10.639705657958984, -10.440495491027832, -10.241284370422363, -10.042074203491211, -9.842863082885742, -9.643651962280273, -9.444440841674805, -9.245230674743652, -9.046019554138184, -8.846809387207031, -8.647598266601562, -8.44838809967041, -8.249176979064941, -8.049966812133789, -7.8507561683654785, -7.651545524597168, -7.452334880828857, -7.253124237060547, -7.053913116455078, -6.854702472686768, -6.655491828918457, -6.4562811851501465, -6.257070541381836, -6.057859897613525, -5.858649253845215, -5.659438133239746, -5.4602274894714355, -5.261016845703125, -5.0618062019348145, -4.862595081329346, -4.663384437561035, -4.464173793792725, -4.264963150024414, -4.065752029418945, -3.866541624069214, -3.667330741882324, -3.4681200981140137, -3.268909454345703, -3.0696988105773926, -2.870488166809082, -2.6712772846221924, -2.472066640853882, -2.2728559970855713, -2.0736451148986816, -1.874434471130371, -1.6752238273620605, -1.47601318359375, -1.27680242061615, -1.0775916576385498, -0.8783810138702393, -0.6791703104972839, -0.4799596071243286, -0.2807488441467285, -0.08153820037841797, 0.11767250299453735, 0.3168832063674927, 0.516093909740448, 0.7153046131134033, 0.9145153164863586, 1.113726019859314, 1.312936782836914, 1.5121474266052246]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 10.0, 6.0, 23.0, 21.0, 24.0, 34.0, 24.0, 31.0, 42.0, 51.0, 46.0, 64.0, 52.0, 60.0, 58.0, 50.0, 56.0, 50.0, 51.0, 46.0, 32.0, 28.0, 26.0, 27.0, 17.0, 18.0, 9.0, 8.0, 10.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.520456075668335, -1.4812712669372559, -1.4420864582061768, -1.4029016494750977, -1.3637168407440186, -1.3245320320129395, -1.2853472232818604, -1.2461625337600708, -1.2069777250289917, -1.1677929162979126, -1.1286081075668335, -1.0894232988357544, -1.0502384901046753, -1.0110538005828857, -0.9718689322471619, -0.9326841831207275, -0.8934993147850037, -0.8543145060539246, -0.8151296973228455, -0.7759449481964111, -0.736760139465332, -0.6975753307342529, -0.6583905220031738, -0.6192057132720947, -0.5800209045410156, -0.5408360958099365, -0.5016512870788574, -0.4624665081501007, -0.423281729221344, -0.3840969204902649, -0.3449121117591858, -0.3057273328304291, -0.26654261350631714, -0.22735781967639923, -0.18817302584648132, -0.14898821711540222, -0.10980342328548431, -0.0706186294555664, -0.031433820724487305, 0.007750958204269409, 0.04693576693534851, 0.08612056076526642, 0.12530535459518433, 0.16449016332626343, 0.20367495715618134, 0.24285975098609924, 0.28204455971717834, 0.32122933864593506, 0.36041414737701416, 0.39959895610809326, 0.43878373503685, 0.4779685437679291, 0.5171533226966858, 0.5563381314277649, 0.595522940158844, 0.6347076892852783, 0.6738924980163574, 0.7130773067474365, 0.7522621154785156, 0.7914469242095947, 0.830631673336029, 0.8698164820671082, 0.9090012907981873, 0.9481860399246216, 0.9873709082603455]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 2.0, 11.0, 11.0, 23.0, 27.0, 44.0, 84.0, 115.0, 179.0, 251.0, 468.0, 890.0, 1895.0, 4348.0, 10882.0, 33016.0, 120173.0, 529693.0, 258169.0, 58105.0, 18112.0, 6599.0, 2611.0, 1290.0, 661.0, 347.0, 207.0, 106.0, 74.0, 42.0, 34.0, 35.0, 14.0, 12.0, 13.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5654296875, -0.54345703125, -0.521484375, -0.49951171875, -0.4775390625, -0.45556640625, -0.43359375, -0.41162109375, -0.3896484375, -0.36767578125, -0.345703125, -0.32373046875, -0.3017578125, -0.27978515625, -0.2578125, -0.23583984375, -0.2138671875, -0.19189453125, -0.169921875, -0.14794921875, -0.1259765625, -0.10400390625, -0.08203125, -0.06005859375, -0.0380859375, -0.01611328125, 0.005859375, 0.02783203125, 0.0498046875, 0.07177734375, 0.09375, 0.11572265625, 0.1376953125, 0.15966796875, 0.181640625, 0.20361328125, 0.2255859375, 0.24755859375, 0.26953125, 0.29150390625, 0.3134765625, 0.33544921875, 0.357421875, 0.37939453125, 0.4013671875, 0.42333984375, 0.4453125, 0.46728515625, 0.4892578125, 0.51123046875, 0.533203125, 0.55517578125, 0.5771484375, 0.59912109375, 0.62109375, 0.64306640625, 0.6650390625, 0.68701171875, 0.708984375, 0.73095703125, 0.7529296875, 0.77490234375, 0.796875, 0.81884765625, 0.8408203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 22.0, 34.0, 25.0, 23.0, 28.0, 35.0, 35.0, 40.0, 59.0, 52.0, 55.0, 55.0, 62.0, 56.0, 58.0, 57.0, 39.0, 35.0, 45.0, 29.0, 32.0, 17.0, 13.0, 20.0, 9.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.151611328125, -0.14554595947265625, -0.1394805908203125, -0.13341522216796875, -0.127349853515625, -0.12128448486328125, -0.1152191162109375, -0.10915374755859375, -0.10308837890625, -0.09702301025390625, -0.0909576416015625, -0.08489227294921875, -0.078826904296875, -0.07276153564453125, -0.0666961669921875, -0.06063079833984375, -0.0545654296875, -0.04850006103515625, -0.0424346923828125, -0.03636932373046875, -0.030303955078125, -0.02423858642578125, -0.0181732177734375, -0.01210784912109375, -0.00604248046875, 2.288818359375e-05, 0.0060882568359375, 0.01215362548828125, 0.018218994140625, 0.02428436279296875, 0.0303497314453125, 0.03641510009765625, 0.04248046875, 0.04854583740234375, 0.0546112060546875, 0.06067657470703125, 0.066741943359375, 0.07280731201171875, 0.0788726806640625, 0.08493804931640625, 0.09100341796875, 0.09706878662109375, 0.1031341552734375, 0.10919952392578125, 0.115264892578125, 0.12133026123046875, 0.1273956298828125, 0.13346099853515625, 0.1395263671875, 0.14559173583984375, 0.1516571044921875, 0.15772247314453125, 0.163787841796875, 0.16985321044921875, 0.1759185791015625, 0.18198394775390625, 0.18804931640625, 0.19411468505859375, 0.2001800537109375, 0.20624542236328125, 0.212310791015625, 0.21837615966796875, 0.2244415283203125, 0.23050689697265625, 0.236572265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 3.0, 7.0, 7.0, 7.0, 14.0, 7.0, 12.0, 23.0, 30.0, 40.0, 58.0, 77.0, 118.0, 255.0, 414.0, 785.0, 1736.0, 4224.0, 12335.0, 43323.0, 217363.0, 600549.0, 124059.0, 28368.0, 8643.0, 3155.0, 1398.0, 639.0, 317.0, 207.0, 135.0, 76.0, 40.0, 34.0, 15.0, 14.0, 14.0, 13.0, 8.0, 7.0, 7.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67578125, -0.6535110473632812, -0.6312408447265625, -0.6089706420898438, -0.586700439453125, -0.5644302368164062, -0.5421600341796875, -0.5198898315429688, -0.49761962890625, -0.47534942626953125, -0.4530792236328125, -0.43080902099609375, -0.408538818359375, -0.38626861572265625, -0.3639984130859375, -0.34172821044921875, -0.3194580078125, -0.29718780517578125, -0.2749176025390625, -0.25264739990234375, -0.230377197265625, -0.20810699462890625, -0.1858367919921875, -0.16356658935546875, -0.14129638671875, -0.11902618408203125, -0.0967559814453125, -0.07448577880859375, -0.052215576171875, -0.02994537353515625, -0.0076751708984375, 0.01459503173828125, 0.036865234375, 0.05913543701171875, 0.0814056396484375, 0.10367584228515625, 0.125946044921875, 0.14821624755859375, 0.1704864501953125, 0.19275665283203125, 0.21502685546875, 0.23729705810546875, 0.2595672607421875, 0.28183746337890625, 0.304107666015625, 0.32637786865234375, 0.3486480712890625, 0.37091827392578125, 0.3931884765625, 0.41545867919921875, 0.4377288818359375, 0.45999908447265625, 0.482269287109375, 0.5045394897460938, 0.5268096923828125, 0.5490798950195312, 0.57135009765625, 0.5936203002929688, 0.6158905029296875, 0.6381607055664062, 0.660430908203125, 0.6827011108398438, 0.7049713134765625, 0.7272415161132812, 0.74951171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 10.0, 11.0, 13.0, 18.0, 24.0, 16.0, 25.0, 28.0, 37.0, 41.0, 43.0, 59.0, 39.0, 48.0, 57.0, 55.0, 51.0, 51.0, 40.0, 40.0, 38.0, 45.0, 33.0, 31.0, 22.0, 18.0, 24.0, 12.0, 8.0, 7.0, 10.0, 9.0, 2.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.78955078125, -0.7642898559570312, -0.7390289306640625, -0.7137680053710938, -0.688507080078125, -0.6632461547851562, -0.6379852294921875, -0.6127243041992188, -0.58746337890625, -0.5622024536132812, -0.5369415283203125, -0.5116806030273438, -0.486419677734375, -0.46115875244140625, -0.4358978271484375, -0.41063690185546875, -0.3853759765625, -0.36011505126953125, -0.3348541259765625, -0.30959320068359375, -0.284332275390625, -0.25907135009765625, -0.2338104248046875, -0.20854949951171875, -0.18328857421875, -0.15802764892578125, -0.1327667236328125, -0.10750579833984375, -0.082244873046875, -0.05698394775390625, -0.0317230224609375, -0.00646209716796875, 0.018798828125, 0.04405975341796875, 0.0693206787109375, 0.09458160400390625, 0.119842529296875, 0.14510345458984375, 0.1703643798828125, 0.19562530517578125, 0.22088623046875, 0.24614715576171875, 0.2714080810546875, 0.29666900634765625, 0.321929931640625, 0.34719085693359375, 0.3724517822265625, 0.39771270751953125, 0.4229736328125, 0.44823455810546875, 0.4734954833984375, 0.49875640869140625, 0.524017333984375, 0.5492782592773438, 0.5745391845703125, 0.5998001098632812, 0.62506103515625, 0.6503219604492188, 0.6755828857421875, 0.7008438110351562, 0.726104736328125, 0.7513656616210938, 0.7766265869140625, 0.8018875122070312, 0.8271484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 5.0, 12.0, 13.0, 45.0, 145.0, 375.0, 1438.0, 20299.0, 1013143.0, 11538.0, 1061.0, 278.0, 120.0, 43.0, 14.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.230377197265625, -1.19122314453125, -1.152069091796875, -1.1129150390625, -1.073760986328125, -1.03460693359375, -0.995452880859375, -0.956298828125, -0.917144775390625, -0.87799072265625, -0.838836669921875, -0.7996826171875, -0.760528564453125, -0.72137451171875, -0.682220458984375, -0.64306640625, -0.603912353515625, -0.56475830078125, -0.525604248046875, -0.4864501953125, -0.447296142578125, -0.40814208984375, -0.368988037109375, -0.329833984375, -0.290679931640625, -0.25152587890625, -0.212371826171875, -0.1732177734375, -0.134063720703125, -0.09490966796875, -0.055755615234375, -0.0166015625, 0.022552490234375, 0.06170654296875, 0.100860595703125, 0.1400146484375, 0.179168701171875, 0.21832275390625, 0.257476806640625, 0.296630859375, 0.335784912109375, 0.37493896484375, 0.414093017578125, 0.4532470703125, 0.492401123046875, 0.53155517578125, 0.570709228515625, 0.60986328125, 0.649017333984375, 0.68817138671875, 0.727325439453125, 0.7664794921875, 0.805633544921875, 0.84478759765625, 0.883941650390625, 0.923095703125, 0.962249755859375, 1.00140380859375, 1.040557861328125, 1.0797119140625, 1.118865966796875, 1.15802001953125, 1.197174072265625, 1.236328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 26.0, 37.0, 48.0, 88.0, 135.0, 168.0, 166.0, 104.0, 78.0, 51.0, 20.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1975250244140625e-05, -5.034264177083969e-05, -4.871003329753876e-05, -4.7077424824237823e-05, -4.544481635093689e-05, -4.3812207877635956e-05, -4.217959940433502e-05, -4.054699093103409e-05, -3.8914382457733154e-05, -3.728177398443222e-05, -3.564916551113129e-05, -3.401655703783035e-05, -3.238394856452942e-05, -3.0751340091228485e-05, -2.911873161792755e-05, -2.7486123144626617e-05, -2.5853514671325684e-05, -2.422090619802475e-05, -2.2588297724723816e-05, -2.0955689251422882e-05, -1.9323080778121948e-05, -1.7690472304821014e-05, -1.605786383152008e-05, -1.4425255358219147e-05, -1.2792646884918213e-05, -1.1160038411617279e-05, -9.527429938316345e-06, -7.894821465015411e-06, -6.2622129917144775e-06, -4.629604518413544e-06, -2.99699604511261e-06, -1.364387571811676e-06, 2.682209014892578e-07, 1.9008293747901917e-06, 3.5334378480911255e-06, 5.166046321392059e-06, 6.798654794692993e-06, 8.431263267993927e-06, 1.006387174129486e-05, 1.1696480214595795e-05, 1.3329088687896729e-05, 1.4961697161197662e-05, 1.6594305634498596e-05, 1.822691410779953e-05, 1.9859522581100464e-05, 2.1492131054401398e-05, 2.312473952770233e-05, 2.4757348001003265e-05, 2.63899564743042e-05, 2.8022564947605133e-05, 2.9655173420906067e-05, 3.1287781894207e-05, 3.2920390367507935e-05, 3.455299884080887e-05, 3.61856073141098e-05, 3.7818215787410736e-05, 3.945082426071167e-05, 4.1083432734012604e-05, 4.271604120731354e-05, 4.434864968061447e-05, 4.5981258153915405e-05, 4.761386662721634e-05, 4.924647510051727e-05, 5.087908357381821e-05, 5.251169204711914e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 19.0, 35.0, 60.0, 94.0, 159.0, 282.0, 1059.0, 31374.0, 1009323.0, 5096.0, 505.0, 211.0, 117.0, 86.0, 41.0, 24.0, 23.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.115234375, -1.0758209228515625, -1.036407470703125, -0.9969940185546875, -0.95758056640625, -0.9181671142578125, -0.878753662109375, -0.8393402099609375, -0.7999267578125, -0.7605133056640625, -0.721099853515625, -0.6816864013671875, -0.64227294921875, -0.6028594970703125, -0.563446044921875, -0.5240325927734375, -0.484619140625, -0.4452056884765625, -0.405792236328125, -0.3663787841796875, -0.32696533203125, -0.2875518798828125, -0.248138427734375, -0.2087249755859375, -0.1693115234375, -0.1298980712890625, -0.090484619140625, -0.0510711669921875, -0.01165771484375, 0.0277557373046875, 0.067169189453125, 0.1065826416015625, 0.14599609375, 0.1854095458984375, 0.224822998046875, 0.2642364501953125, 0.30364990234375, 0.3430633544921875, 0.382476806640625, 0.4218902587890625, 0.4613037109375, 0.5007171630859375, 0.540130615234375, 0.5795440673828125, 0.61895751953125, 0.6583709716796875, 0.697784423828125, 0.7371978759765625, 0.776611328125, 0.8160247802734375, 0.855438232421875, 0.8948516845703125, 0.93426513671875, 0.9736785888671875, 1.013092041015625, 1.0525054931640625, 1.0919189453125, 1.1313323974609375, 1.170745849609375, 1.2101593017578125, 1.24957275390625, 1.2889862060546875, 1.328399658203125, 1.3678131103515625, 1.4072265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 35.0, 212.0, 530.0, 171.0, 35.0, 8.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.21875, -1.172760009765625, -1.12677001953125, -1.080780029296875, -1.0347900390625, -0.988800048828125, -0.94281005859375, -0.896820068359375, -0.850830078125, -0.804840087890625, -0.75885009765625, -0.712860107421875, -0.6668701171875, -0.620880126953125, -0.57489013671875, -0.528900146484375, -0.48291015625, -0.436920166015625, -0.39093017578125, -0.344940185546875, -0.2989501953125, -0.252960205078125, -0.20697021484375, -0.160980224609375, -0.114990234375, -0.069000244140625, -0.02301025390625, 0.022979736328125, 0.0689697265625, 0.114959716796875, 0.16094970703125, 0.206939697265625, 0.2529296875, 0.298919677734375, 0.34490966796875, 0.390899658203125, 0.4368896484375, 0.482879638671875, 0.52886962890625, 0.574859619140625, 0.620849609375, 0.666839599609375, 0.71282958984375, 0.758819580078125, 0.8048095703125, 0.850799560546875, 0.89678955078125, 0.942779541015625, 0.98876953125, 1.034759521484375, 1.08074951171875, 1.126739501953125, 1.1727294921875, 1.218719482421875, 1.26470947265625, 1.310699462890625, 1.356689453125, 1.402679443359375, 1.44866943359375, 1.494659423828125, 1.5406494140625, 1.586639404296875, 1.63262939453125, 1.678619384765625, 1.724609375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 19.0, 39.0, 93.0, 336.0, 335.0, 134.0, 33.0, 10.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6794753074645996, -3.3204543590545654, -2.9614334106445312, -2.602412223815918, -2.243391275405884, -1.8843703269958496, -1.5253491401672363, -1.1663281917572021, -0.807307243347168, -0.448286235332489, -0.08926522731781006, 0.26975584030151367, 0.6287767887115479, 0.987797737121582, 1.3468189239501953, 1.7058398723602295, 2.0648608207702637, 2.423881769180298, 2.782902717590332, 3.1419239044189453, 3.5009448528289795, 3.8599658012390137, 4.218986988067627, 4.578007698059082, 4.937028884887695, 5.296050071716309, 5.655070781707764, 6.014091968536377, 6.373112678527832, 6.732133865356445, 7.091155052185059, 7.450176239013672, 7.809196472167969, 8.168217658996582, 8.527238845825195, 8.886259078979492, 9.245280265808105, 9.604301452636719, 9.963322639465332, 10.322343826293945, 10.681364059448242, 11.040385246276855, 11.399406433105469, 11.758426666259766, 12.117447853088379, 12.476469039916992, 12.835490226745605, 13.194511413574219, 13.553532600402832, 13.912553787231445, 14.271574974060059, 14.630596160888672, 14.989616394042969, 15.348637580871582, 15.707658767700195, 16.066679000854492, 16.425701141357422, 16.78472137451172, 17.14374351501465, 17.502763748168945, 17.861785888671875, 18.220806121826172, 18.57982635498047, 18.9388484954834, 19.297868728637695]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 3.0, 9.0, 9.0, 11.0, 13.0, 15.0, 13.0, 14.0, 20.0, 36.0, 33.0, 41.0, 39.0, 32.0, 43.0, 37.0, 57.0, 46.0, 47.0, 42.0, 39.0, 41.0, 50.0, 30.0, 33.0, 28.0, 21.0, 39.0, 25.0, 25.0, 17.0, 21.0, 13.0, 10.0, 3.0, 8.0, 3.0, 2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.138191223144531, -4.019832134246826, -3.901472806930542, -3.783113479614258, -3.6647541522979736, -3.5463948249816895, -3.4280357360839844, -3.3096764087677, -3.191317081451416, -3.072957754135132, -2.9545986652374268, -2.8362393379211426, -2.7178800106048584, -2.599520683288574, -2.481161594390869, -2.362802267074585, -2.24444317817688, -2.1260838508605957, -2.0077247619628906, -1.8893654346466064, -1.7710061073303223, -1.6526468992233276, -1.534287691116333, -1.4159283638000488, -1.2975691556930542, -1.1792099475860596, -1.0608506202697754, -0.9424914121627808, -0.8241321444511414, -0.705772876739502, -0.5874136686325073, -0.4690544009208679, -0.3506953716278076, -0.2323361188173294, -0.1139768660068512, 0.00438237190246582, 0.12274163961410522, 0.24110090732574463, 0.35946011543273926, 0.47781938314437866, 0.5961786508560181, 0.7145379185676575, 0.8328971862792969, 0.9512563943862915, 1.0696156024932861, 1.1879749298095703, 1.306334137916565, 1.4246933460235596, 1.5430526733398438, 1.6614118814468384, 1.7797712087631226, 1.8981304168701172, 2.0164897441864014, 2.1348490715026855, 2.2532081604003906, 2.371567487716675, 2.489926815032959, 2.608286142349243, 2.7266452312469482, 2.8450045585632324, 2.9633638858795166, 3.081723213195801, 3.200082302093506, 3.31844162940979, 3.436800718307495]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 16.0, 19.0, 35.0, 56.0, 56.0, 78.0, 132.0, 169.0, 290.0, 436.0, 732.0, 1358.0, 2491.0, 5211.0, 13318.0, 43272.0, 374223.0, 3620227.0, 93592.0, 22271.0, 8065.0, 3622.0, 1888.0, 1034.0, 554.0, 347.0, 247.0, 159.0, 107.0, 67.0, 59.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.5380859375, -0.5228157043457031, -0.5075454711914062, -0.4922752380371094, -0.4770050048828125, -0.4617347717285156, -0.44646453857421875, -0.4311943054199219, -0.415924072265625, -0.4006538391113281, -0.38538360595703125, -0.3701133728027344, -0.3548431396484375, -0.3395729064941406, -0.32430267333984375, -0.3090324401855469, -0.29376220703125, -0.2784919738769531, -0.26322174072265625, -0.24795150756835938, -0.2326812744140625, -0.21741104125976562, -0.20214080810546875, -0.18687057495117188, -0.171600341796875, -0.15633010864257812, -0.14105987548828125, -0.12578964233398438, -0.1105194091796875, -0.09524917602539062, -0.07997894287109375, -0.06470870971679688, -0.0494384765625, -0.034168243408203125, -0.01889801025390625, -0.003627777099609375, 0.0116424560546875, 0.026912689208984375, 0.04218292236328125, 0.057453155517578125, 0.072723388671875, 0.08799362182617188, 0.10326385498046875, 0.11853408813476562, 0.1338043212890625, 0.14907455444335938, 0.16434478759765625, 0.17961502075195312, 0.19488525390625, 0.21015548706054688, 0.22542572021484375, 0.24069595336914062, 0.2559661865234375, 0.2712364196777344, 0.28650665283203125, 0.3017768859863281, 0.317047119140625, 0.3323173522949219, 0.34758758544921875, 0.3628578186035156, 0.3781280517578125, 0.3933982849121094, 0.40866851806640625, 0.4239387512207031, 0.439208984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 11.0, 14.0, 22.0, 24.0, 29.0, 36.0, 36.0, 42.0, 62.0, 55.0, 45.0, 48.0, 56.0, 39.0, 62.0, 51.0, 34.0, 43.0, 36.0, 33.0, 42.0, 32.0, 25.0, 15.0, 17.0, 14.0, 15.0, 7.0, 11.0, 14.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.15790748596191406, -0.15114212036132812, -0.1443767547607422, -0.13761138916015625, -0.1308460235595703, -0.12408065795898438, -0.11731529235839844, -0.1105499267578125, -0.10378456115722656, -0.09701919555664062, -0.09025382995605469, -0.08348846435546875, -0.07672309875488281, -0.06995773315429688, -0.06319236755371094, -0.056427001953125, -0.04966163635253906, -0.042896270751953125, -0.03613090515136719, -0.02936553955078125, -0.022600173950195312, -0.015834808349609375, -0.009069442749023438, -0.0023040771484375, 0.0044612884521484375, 0.011226654052734375, 0.017992019653320312, 0.02475738525390625, 0.03152275085449219, 0.038288116455078125, 0.04505348205566406, 0.05181884765625, 0.05858421325683594, 0.06534957885742188, 0.07211494445800781, 0.07888031005859375, 0.08564567565917969, 0.09241104125976562, 0.09917640686035156, 0.1059417724609375, 0.11270713806152344, 0.11947250366210938, 0.1262378692626953, 0.13300323486328125, 0.1397686004638672, 0.14653396606445312, 0.15329933166503906, 0.160064697265625, 0.16683006286621094, 0.17359542846679688, 0.1803607940673828, 0.18712615966796875, 0.1938915252685547, 0.20065689086914062, 0.20742225646972656, 0.2141876220703125, 0.22095298767089844, 0.22771835327148438, 0.2344837188720703, 0.24124908447265625, 0.2480144500732422, 0.2547798156738281, 0.26154518127441406, 0.268310546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 11.0, 22.0, 17.0, 27.0, 35.0, 62.0, 76.0, 122.0, 235.0, 391.0, 962.0, 3668.0, 30723.0, 4049555.0, 99334.0, 6509.0, 1340.0, 474.0, 242.0, 145.0, 83.0, 75.0, 63.0, 38.0, 23.0, 14.0, 7.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.039093017578125, -0.99517822265625, -0.951263427734375, -0.9073486328125, -0.863433837890625, -0.81951904296875, -0.775604248046875, -0.731689453125, -0.687774658203125, -0.64385986328125, -0.599945068359375, -0.5560302734375, -0.512115478515625, -0.46820068359375, -0.424285888671875, -0.38037109375, -0.336456298828125, -0.29254150390625, -0.248626708984375, -0.2047119140625, -0.160797119140625, -0.11688232421875, -0.072967529296875, -0.029052734375, 0.014862060546875, 0.05877685546875, 0.102691650390625, 0.1466064453125, 0.190521240234375, 0.23443603515625, 0.278350830078125, 0.322265625, 0.366180419921875, 0.41009521484375, 0.454010009765625, 0.4979248046875, 0.541839599609375, 0.58575439453125, 0.629669189453125, 0.673583984375, 0.717498779296875, 0.76141357421875, 0.805328369140625, 0.8492431640625, 0.893157958984375, 0.93707275390625, 0.980987548828125, 1.02490234375, 1.068817138671875, 1.11273193359375, 1.156646728515625, 1.2005615234375, 1.244476318359375, 1.28839111328125, 1.332305908203125, 1.376220703125, 1.420135498046875, 1.46405029296875, 1.507965087890625, 1.5518798828125, 1.595794677734375, 1.63970947265625, 1.683624267578125, 1.7275390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 26.0, 64.0, 430.0, 3240.0, 198.0, 52.0, 18.0, 12.0, 9.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5546875, -0.5309219360351562, -0.5071563720703125, -0.48339080810546875, -0.459625244140625, -0.43585968017578125, -0.4120941162109375, -0.38832855224609375, -0.36456298828125, -0.34079742431640625, -0.3170318603515625, -0.29326629638671875, -0.269500732421875, -0.24573516845703125, -0.2219696044921875, -0.19820404052734375, -0.1744384765625, -0.15067291259765625, -0.1269073486328125, -0.10314178466796875, -0.079376220703125, -0.05561065673828125, -0.0318450927734375, -0.00807952880859375, 0.01568603515625, 0.03945159912109375, 0.0632171630859375, 0.08698272705078125, 0.110748291015625, 0.13451385498046875, 0.1582794189453125, 0.18204498291015625, 0.205810546875, 0.22957611083984375, 0.2533416748046875, 0.27710723876953125, 0.300872802734375, 0.32463836669921875, 0.3484039306640625, 0.37216949462890625, 0.39593505859375, 0.41970062255859375, 0.4434661865234375, 0.46723175048828125, 0.490997314453125, 0.5147628784179688, 0.5385284423828125, 0.5622940063476562, 0.5860595703125, 0.6098251342773438, 0.6335906982421875, 0.6573562622070312, 0.681121826171875, 0.7048873901367188, 0.7286529541015625, 0.7524185180664062, 0.77618408203125, 0.7999496459960938, 0.8237152099609375, 0.8474807739257812, 0.871246337890625, 0.8950119018554688, 0.9187774658203125, 0.9425430297851562, 0.96630859375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 27.0, 138.0, 365.0, 346.0, 84.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.105861186981201, -5.992343425750732, -5.8788251876831055, -5.765307426452637, -5.651789665222168, -5.538271903991699, -5.424753665924072, -5.3112359046936035, -5.197718143463135, -5.084200382232666, -4.970682144165039, -4.85716438293457, -4.743646621704102, -4.630128860473633, -4.516610622406006, -4.403092861175537, -4.28957462310791, -4.176056861877441, -4.0625386238098145, -3.9490208625793457, -3.835503101348877, -3.721985101699829, -3.6084671020507812, -3.4949493408203125, -3.3814315795898438, -3.267913579940796, -3.154395818710327, -3.0408778190612793, -2.9273600578308105, -2.8138420581817627, -2.700324058532715, -2.586806297302246, -2.4732885360717773, -2.3597705364227295, -2.2462527751922607, -2.132734775543213, -2.019217014312744, -1.9056990146636963, -1.792181134223938, -1.6786632537841797, -1.5651453733444214, -1.451627492904663, -1.3381096124649048, -1.2245917320251465, -1.1110737323760986, -0.9975559115409851, -0.884037971496582, -0.7705200910568237, -0.6570022106170654, -0.5434843301773071, -0.42996641993522644, -0.31644850969314575, -0.20293062925338745, -0.08941274881362915, 0.024105191230773926, 0.13762307167053223, 0.2511409521102905, 0.36465883255004883, 0.4781767427921295, 0.5916946530342102, 0.7052125334739685, 0.8187304139137268, 0.9322483539581299, 1.0457662343978882, 1.1592841148376465]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 2.0, 2.0, 6.0, 8.0, 11.0, 9.0, 19.0, 23.0, 22.0, 27.0, 37.0, 41.0, 40.0, 48.0, 52.0, 51.0, 64.0, 62.0, 51.0, 73.0, 43.0, 43.0, 43.0, 43.0, 50.0, 21.0, 22.0, 20.0, 17.0, 10.0, 10.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.045449137687683, -1.0140300989151, -0.9826111197471619, -0.9511920809745789, -0.9197731018066406, -0.8883540630340576, -0.8569350242614746, -0.8255160450935364, -0.7940970659255981, -0.7626780271530151, -0.7312590479850769, -0.6998400092124939, -0.6684210300445557, -0.6370019912719727, -0.6055829524993896, -0.5741639733314514, -0.5427449345588684, -0.5113258957862854, -0.47990691661834717, -0.44848787784576416, -0.4170688986778259, -0.3856498599052429, -0.3542308509349823, -0.3228118419647217, -0.29139283299446106, -0.25997382402420044, -0.22855481505393982, -0.197135791182518, -0.16571678221225739, -0.13429777324199677, -0.10287874937057495, -0.07145974040031433, -0.040040671825408936, -0.008621659129858017, 0.0227973535656929, 0.05421636998653412, 0.08563537895679474, 0.11705438792705536, 0.14847341179847717, 0.1798924207687378, 0.2113114297389984, 0.24273043870925903, 0.27414944767951965, 0.3055684566497803, 0.3369874954223633, 0.3684064745903015, 0.3998255133628845, 0.43124452233314514, 0.46266353130340576, 0.4940825402736664, 0.525501549243927, 0.55692058801651, 0.5883395671844482, 0.6197586059570312, 0.6511776447296143, 0.6825966238975525, 0.7140156030654907, 0.7454346418380737, 0.776853621006012, 0.808272659778595, 0.8396916389465332, 0.8711106777191162, 0.9025297164916992, 0.9339486956596375, 0.9653677344322205]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 12.0, 9.0, 12.0, 18.0, 21.0, 41.0, 49.0, 94.0, 158.0, 271.0, 465.0, 913.0, 1873.0, 4215.0, 10009.0, 26018.0, 80193.0, 301120.0, 435571.0, 125442.0, 37700.0, 13792.0, 5429.0, 2516.0, 1142.0, 614.0, 327.0, 170.0, 116.0, 70.0, 45.0, 40.0, 16.0, 19.0, 11.0, 17.0, 3.0, 12.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6953125, -0.6755447387695312, -0.6557769775390625, -0.6360092163085938, -0.616241455078125, -0.5964736938476562, -0.5767059326171875, -0.5569381713867188, -0.53717041015625, -0.5174026489257812, -0.4976348876953125, -0.47786712646484375, -0.458099365234375, -0.43833160400390625, -0.4185638427734375, -0.39879608154296875, -0.3790283203125, -0.35926055908203125, -0.3394927978515625, -0.31972503662109375, -0.299957275390625, -0.28018951416015625, -0.2604217529296875, -0.24065399169921875, -0.22088623046875, -0.20111846923828125, -0.1813507080078125, -0.16158294677734375, -0.141815185546875, -0.12204742431640625, -0.1022796630859375, -0.08251190185546875, -0.062744140625, -0.04297637939453125, -0.0232086181640625, -0.00344085693359375, 0.016326904296875, 0.03609466552734375, 0.0558624267578125, 0.07563018798828125, 0.09539794921875, 0.11516571044921875, 0.1349334716796875, 0.15470123291015625, 0.174468994140625, 0.19423675537109375, 0.2140045166015625, 0.23377227783203125, 0.2535400390625, 0.27330780029296875, 0.2930755615234375, 0.31284332275390625, 0.332611083984375, 0.35237884521484375, 0.3721466064453125, 0.39191436767578125, 0.41168212890625, 0.43144989013671875, 0.4512176513671875, 0.47098541259765625, 0.490753173828125, 0.5105209350585938, 0.5302886962890625, 0.5500564575195312, 0.56982421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 1.0, 5.0, 2.0, 3.0, 9.0, 11.0, 18.0, 18.0, 30.0, 32.0, 32.0, 37.0, 52.0, 49.0, 50.0, 54.0, 49.0, 49.0, 43.0, 51.0, 47.0, 36.0, 49.0, 37.0, 32.0, 29.0, 31.0, 28.0, 18.0, 26.0, 9.0, 11.0, 12.0, 11.0, 8.0, 5.0, 9.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1771240234375, -0.17061233520507812, -0.16410064697265625, -0.15758895874023438, -0.1510772705078125, -0.14456558227539062, -0.13805389404296875, -0.13154220581054688, -0.125030517578125, -0.11851882934570312, -0.11200714111328125, -0.10549545288085938, -0.0989837646484375, -0.09247207641601562, -0.08596038818359375, -0.07944869995117188, -0.07293701171875, -0.06642532348632812, -0.05991363525390625, -0.053401947021484375, -0.0468902587890625, -0.040378570556640625, -0.03386688232421875, -0.027355194091796875, -0.020843505859375, -0.014331817626953125, -0.00782012939453125, -0.001308441162109375, 0.0052032470703125, 0.011714935302734375, 0.01822662353515625, 0.024738311767578125, 0.03125, 0.037761688232421875, 0.04427337646484375, 0.050785064697265625, 0.0572967529296875, 0.06380844116210938, 0.07032012939453125, 0.07683181762695312, 0.083343505859375, 0.08985519409179688, 0.09636688232421875, 0.10287857055664062, 0.1093902587890625, 0.11590194702148438, 0.12241363525390625, 0.12892532348632812, 0.13543701171875, 0.14194869995117188, 0.14846038818359375, 0.15497207641601562, 0.1614837646484375, 0.16799545288085938, 0.17450714111328125, 0.18101882934570312, 0.187530517578125, 0.19404220581054688, 0.20055389404296875, 0.20706558227539062, 0.2135772705078125, 0.22008895874023438, 0.22660064697265625, 0.23311233520507812, 0.2396240234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 12.0, 17.0, 31.0, 23.0, 41.0, 69.0, 79.0, 148.0, 246.0, 484.0, 1146.0, 2982.0, 9075.0, 32433.0, 147508.0, 574759.0, 216300.0, 44788.0, 11868.0, 3782.0, 1422.0, 596.0, 289.0, 142.0, 95.0, 45.0, 40.0, 37.0, 17.0, 14.0, 13.0, 8.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.693359375, -0.6699447631835938, -0.6465301513671875, -0.6231155395507812, -0.599700927734375, -0.5762863159179688, -0.5528717041015625, -0.5294570922851562, -0.50604248046875, -0.48262786865234375, -0.4592132568359375, -0.43579864501953125, -0.412384033203125, -0.38896942138671875, -0.3655548095703125, -0.34214019775390625, -0.3187255859375, -0.29531097412109375, -0.2718963623046875, -0.24848175048828125, -0.225067138671875, -0.20165252685546875, -0.1782379150390625, -0.15482330322265625, -0.13140869140625, -0.10799407958984375, -0.0845794677734375, -0.06116485595703125, -0.037750244140625, -0.01433563232421875, 0.0090789794921875, 0.03249359130859375, 0.055908203125, 0.07932281494140625, 0.1027374267578125, 0.12615203857421875, 0.149566650390625, 0.17298126220703125, 0.1963958740234375, 0.21981048583984375, 0.24322509765625, 0.26663970947265625, 0.2900543212890625, 0.31346893310546875, 0.336883544921875, 0.36029815673828125, 0.3837127685546875, 0.40712738037109375, 0.4305419921875, 0.45395660400390625, 0.4773712158203125, 0.5007858276367188, 0.524200439453125, 0.5476150512695312, 0.5710296630859375, 0.5944442749023438, 0.61785888671875, 0.6412734985351562, 0.6646881103515625, 0.6881027221679688, 0.711517333984375, 0.7349319458007812, 0.7583465576171875, 0.7817611694335938, 0.80517578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 10.0, 10.0, 8.0, 17.0, 15.0, 28.0, 20.0, 27.0, 31.0, 34.0, 31.0, 31.0, 44.0, 54.0, 47.0, 46.0, 46.0, 38.0, 45.0, 40.0, 44.0, 37.0, 34.0, 31.0, 30.0, 31.0, 29.0, 21.0, 15.0, 15.0, 16.0, 23.0, 7.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.7900390625, -0.7654495239257812, -0.7408599853515625, -0.7162704467773438, -0.691680908203125, -0.6670913696289062, -0.6425018310546875, -0.6179122924804688, -0.59332275390625, -0.5687332153320312, -0.5441436767578125, -0.5195541381835938, -0.494964599609375, -0.47037506103515625, -0.4457855224609375, -0.42119598388671875, -0.3966064453125, -0.37201690673828125, -0.3474273681640625, -0.32283782958984375, -0.298248291015625, -0.27365875244140625, -0.2490692138671875, -0.22447967529296875, -0.19989013671875, -0.17530059814453125, -0.1507110595703125, -0.12612152099609375, -0.101531982421875, -0.07694244384765625, -0.0523529052734375, -0.02776336669921875, -0.003173828125, 0.02141571044921875, 0.0460052490234375, 0.07059478759765625, 0.095184326171875, 0.11977386474609375, 0.1443634033203125, 0.16895294189453125, 0.19354248046875, 0.21813201904296875, 0.2427215576171875, 0.26731109619140625, 0.291900634765625, 0.31649017333984375, 0.3410797119140625, 0.36566925048828125, 0.3902587890625, 0.41484832763671875, 0.4394378662109375, 0.46402740478515625, 0.488616943359375, 0.5132064819335938, 0.5377960205078125, 0.5623855590820312, 0.58697509765625, 0.6115646362304688, 0.6361541748046875, 0.6607437133789062, 0.685333251953125, 0.7099227905273438, 0.7345123291015625, 0.7591018676757812, 0.78369140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 10.0, 6.0, 17.0, 17.0, 28.0, 32.0, 47.0, 106.0, 176.0, 266.0, 601.0, 1358.0, 3752.0, 14470.0, 92496.0, 581781.0, 303688.0, 37969.0, 7517.0, 2215.0, 943.0, 408.0, 247.0, 125.0, 91.0, 51.0, 40.0, 22.0, 23.0, 12.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2413330078125, -0.23232078552246094, -0.22330856323242188, -0.2142963409423828, -0.20528411865234375, -0.1962718963623047, -0.18725967407226562, -0.17824745178222656, -0.1692352294921875, -0.16022300720214844, -0.15121078491210938, -0.1421985626220703, -0.13318634033203125, -0.12417411804199219, -0.11516189575195312, -0.10614967346191406, -0.097137451171875, -0.08812522888183594, -0.07911300659179688, -0.07010078430175781, -0.06108856201171875, -0.05207633972167969, -0.043064117431640625, -0.03405189514160156, -0.0250396728515625, -0.016027450561523438, -0.007015228271484375, 0.0019969940185546875, 0.01100921630859375, 0.020021438598632812, 0.029033660888671875, 0.03804588317871094, 0.04705810546875, 0.05607032775878906, 0.06508255004882812, 0.07409477233886719, 0.08310699462890625, 0.09211921691894531, 0.10113143920898438, 0.11014366149902344, 0.1191558837890625, 0.12816810607910156, 0.13718032836914062, 0.1461925506591797, 0.15520477294921875, 0.1642169952392578, 0.17322921752929688, 0.18224143981933594, 0.191253662109375, 0.20026588439941406, 0.20927810668945312, 0.2182903289794922, 0.22730255126953125, 0.2363147735595703, 0.24532699584960938, 0.25433921813964844, 0.2633514404296875, 0.27236366271972656, 0.2813758850097656, 0.2903881072998047, 0.29940032958984375, 0.3084125518798828, 0.3174247741699219, 0.32643699645996094, 0.33544921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 20.0, 17.0, 22.0, 42.0, 59.0, 100.0, 124.0, 123.0, 129.0, 111.0, 69.0, 60.0, 32.0, 22.0, 14.0, 8.0, 15.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.849102020263672e-05, -2.6963651180267334e-05, -2.543628215789795e-05, -2.3908913135528564e-05, -2.238154411315918e-05, -2.0854175090789795e-05, -1.932680606842041e-05, -1.7799437046051025e-05, -1.627206802368164e-05, -1.4744699001312256e-05, -1.3217329978942871e-05, -1.1689960956573486e-05, -1.0162591934204102e-05, -8.635222911834717e-06, -7.107853889465332e-06, -5.580484867095947e-06, -4.0531158447265625e-06, -2.5257468223571777e-06, -9.98377799987793e-07, 5.289912223815918e-07, 2.0563602447509766e-06, 3.5837292671203613e-06, 5.111098289489746e-06, 6.638467311859131e-06, 8.165836334228516e-06, 9.6932053565979e-06, 1.1220574378967285e-05, 1.274794340133667e-05, 1.4275312423706055e-05, 1.580268144607544e-05, 1.7330050468444824e-05, 1.885741949081421e-05, 2.0384788513183594e-05, 2.191215753555298e-05, 2.3439526557922363e-05, 2.4966895580291748e-05, 2.6494264602661133e-05, 2.8021633625030518e-05, 2.9549002647399902e-05, 3.107637166976929e-05, 3.260374069213867e-05, 3.413110971450806e-05, 3.565847873687744e-05, 3.7185847759246826e-05, 3.871321678161621e-05, 4.0240585803985596e-05, 4.176795482635498e-05, 4.3295323848724365e-05, 4.482269287109375e-05, 4.6350061893463135e-05, 4.787743091583252e-05, 4.9404799938201904e-05, 5.093216896057129e-05, 5.2459537982940674e-05, 5.398690700531006e-05, 5.551427602767944e-05, 5.704164505004883e-05, 5.856901407241821e-05, 6.00963830947876e-05, 6.162375211715698e-05, 6.315112113952637e-05, 6.467849016189575e-05, 6.620585918426514e-05, 6.773322820663452e-05, 6.92605972290039e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 6.0, 13.0, 21.0, 21.0, 40.0, 71.0, 138.0, 332.0, 910.0, 3882.0, 27952.0, 410564.0, 558445.0, 39473.0, 4929.0, 1028.0, 346.0, 187.0, 91.0, 42.0, 26.0, 12.0, 11.0, 6.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.442626953125, -0.43068695068359375, -0.4187469482421875, -0.40680694580078125, -0.394866943359375, -0.38292694091796875, -0.3709869384765625, -0.35904693603515625, -0.34710693359375, -0.33516693115234375, -0.3232269287109375, -0.31128692626953125, -0.299346923828125, -0.28740692138671875, -0.2754669189453125, -0.26352691650390625, -0.2515869140625, -0.23964691162109375, -0.2277069091796875, -0.21576690673828125, -0.203826904296875, -0.19188690185546875, -0.1799468994140625, -0.16800689697265625, -0.15606689453125, -0.14412689208984375, -0.1321868896484375, -0.12024688720703125, -0.108306884765625, -0.09636688232421875, -0.0844268798828125, -0.07248687744140625, -0.060546875, -0.04860687255859375, -0.0366668701171875, -0.02472686767578125, -0.012786865234375, -0.00084686279296875, 0.0110931396484375, 0.02303314208984375, 0.03497314453125, 0.04691314697265625, 0.0588531494140625, 0.07079315185546875, 0.082733154296875, 0.09467315673828125, 0.1066131591796875, 0.11855316162109375, 0.1304931640625, 0.14243316650390625, 0.1543731689453125, 0.16631317138671875, 0.178253173828125, 0.19019317626953125, 0.2021331787109375, 0.21407318115234375, 0.22601318359375, 0.23795318603515625, 0.2498931884765625, 0.26183319091796875, 0.273773193359375, 0.28571319580078125, 0.2976531982421875, 0.30959320068359375, 0.321533203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 4.0, 14.0, 15.0, 25.0, 38.0, 49.0, 63.0, 95.0, 115.0, 122.0, 120.0, 92.0, 76.0, 68.0, 31.0, 29.0, 18.0, 11.0, 8.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.4816303253173828, -0.4700965881347656, -0.45856285095214844, -0.44702911376953125, -0.43549537658691406, -0.4239616394042969, -0.4124279022216797, -0.4008941650390625, -0.3893604278564453, -0.3778266906738281, -0.36629295349121094, -0.35475921630859375, -0.34322547912597656, -0.3316917419433594, -0.3201580047607422, -0.308624267578125, -0.2970905303955078, -0.2855567932128906, -0.27402305603027344, -0.26248931884765625, -0.25095558166503906, -0.23942184448242188, -0.2278881072998047, -0.2163543701171875, -0.2048206329345703, -0.19328689575195312, -0.18175315856933594, -0.17021942138671875, -0.15868568420410156, -0.14715194702148438, -0.1356182098388672, -0.12408447265625, -0.11255073547363281, -0.10101699829101562, -0.08948326110839844, -0.07794952392578125, -0.06641578674316406, -0.054882049560546875, -0.04334831237792969, -0.0318145751953125, -0.020280838012695312, -0.008747100830078125, 0.0027866363525390625, 0.01432037353515625, 0.025854110717773438, 0.037387847900390625, 0.04892158508300781, 0.060455322265625, 0.07198905944824219, 0.08352279663085938, 0.09505653381347656, 0.10659027099609375, 0.11812400817871094, 0.12965774536132812, 0.1411914825439453, 0.1527252197265625, 0.1642589569091797, 0.17579269409179688, 0.18732643127441406, 0.19886016845703125, 0.21039390563964844, 0.22192764282226562, 0.2334613800048828, 0.2449951171875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 14.0, 14.0, 29.0, 64.0, 135.0, 270.0, 237.0, 146.0, 51.0, 23.0, 13.0, 11.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.018630027770996, -11.787850379943848, -11.557071685791016, -11.326292037963867, -11.095513343811035, -10.864733695983887, -10.633955001831055, -10.403175354003906, -10.172395706176758, -9.94161605834961, -9.710837364196777, -9.480057716369629, -9.249279022216797, -9.018499374389648, -8.787720680236816, -8.556941032409668, -8.326162338256836, -8.095382690429688, -7.8646039962768555, -7.633824825286865, -7.403045654296875, -7.172266006469727, -6.941486835479736, -6.710707664489746, -6.479928493499756, -6.249149322509766, -6.018370151519775, -5.787590980529785, -5.556811332702637, -5.326032638549805, -5.095252990722656, -4.864473819732666, -4.633694171905518, -4.402915000915527, -4.172135829925537, -3.9413564205169678, -3.7105772495269775, -3.4797980785369873, -3.249018669128418, -3.0182394981384277, -2.7874603271484375, -2.5566811561584473, -2.325901985168457, -2.0951225757598877, -1.8643434047698975, -1.6335642337799072, -1.4027849435806274, -1.1720056533813477, -0.9412264823913574, -0.7104472517967224, -0.4796680212020874, -0.2488887906074524, -0.018109560012817383, 0.21266961097717285, 0.44344890117645264, 0.6742281913757324, 0.9050073623657227, 1.135786533355713, 1.3665658235549927, 1.5973451137542725, 1.8281242847442627, 2.058903455734253, 2.2896828651428223, 2.5204620361328125, 2.7512412071228027]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 9.0, 11.0, 11.0, 15.0, 13.0, 21.0, 15.0, 25.0, 28.0, 30.0, 31.0, 39.0, 45.0, 48.0, 50.0, 52.0, 51.0, 36.0, 45.0, 60.0, 47.0, 44.0, 38.0, 41.0, 42.0, 27.0, 21.0, 26.0, 9.0, 15.0, 13.0, 8.0, 4.0, 3.0, 7.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.715194225311279, -4.5851969718933105, -4.455199241638184, -4.325201988220215, -4.195204734802246, -4.065207481384277, -3.9352097511291504, -3.8052124977111816, -3.675215005874634, -3.545217514038086, -3.415220260620117, -3.2852227687835693, -3.1552252769470215, -3.0252280235290527, -2.895230531692505, -2.765233039855957, -2.6352357864379883, -2.5052382946014404, -2.3752410411834717, -2.245243549346924, -2.115246295928955, -1.9852488040924072, -1.8552513122558594, -1.725253939628601, -1.5952565670013428, -1.4652591943740845, -1.3352618217468262, -1.2052643299102783, -1.07526695728302, -0.9452695846557617, -0.8152721524238586, -0.6852747201919556, -0.5552773475646973, -0.4252799451351166, -0.2952825427055359, -0.1652851402759552, -0.03528773784637451, 0.09470963478088379, 0.22470706701278687, 0.35470449924468994, 0.48470187187194824, 0.6146992444992065, 0.7446966767311096, 0.8746941089630127, 1.004691481590271, 1.1346888542175293, 1.2646863460540771, 1.3946837186813354, 1.5246810913085938, 1.654678463935852, 1.7846758365631104, 1.9146733283996582, 2.044670581817627, 2.174668073654175, 2.3046655654907227, 2.4346628189086914, 2.5646603107452393, 2.694657802581787, 2.824655055999756, 2.9546525478363037, 3.0846500396728516, 3.2146472930908203, 3.344644784927368, 3.474642276763916, 3.6046395301818848]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 9.0, 9.0, 8.0, 16.0, 17.0, 32.0, 35.0, 52.0, 73.0, 110.0, 165.0, 235.0, 349.0, 517.0, 868.0, 1490.0, 2905.0, 6534.0, 18435.0, 131393.0, 3931024.0, 74163.0, 14468.0, 5376.0, 2470.0, 1404.0, 776.0, 438.0, 290.0, 206.0, 134.0, 81.0, 45.0, 45.0, 34.0, 19.0, 20.0, 12.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-1.0478515625, -1.0198287963867188, -0.9918060302734375, -0.9637832641601562, -0.935760498046875, -0.9077377319335938, -0.8797149658203125, -0.8516921997070312, -0.82366943359375, -0.7956466674804688, -0.7676239013671875, -0.7396011352539062, -0.711578369140625, -0.6835556030273438, -0.6555328369140625, -0.6275100708007812, -0.5994873046875, -0.5714645385742188, -0.5434417724609375, -0.5154190063476562, -0.487396240234375, -0.45937347412109375, -0.4313507080078125, -0.40332794189453125, -0.37530517578125, -0.34728240966796875, -0.3192596435546875, -0.29123687744140625, -0.263214111328125, -0.23519134521484375, -0.2071685791015625, -0.17914581298828125, -0.151123046875, -0.12310028076171875, -0.0950775146484375, -0.06705474853515625, -0.039031982421875, -0.01100921630859375, 0.0170135498046875, 0.04503631591796875, 0.07305908203125, 0.10108184814453125, 0.1291046142578125, 0.15712738037109375, 0.185150146484375, 0.21317291259765625, 0.2411956787109375, 0.26921844482421875, 0.2972412109375, 0.32526397705078125, 0.3532867431640625, 0.38130950927734375, 0.409332275390625, 0.43735504150390625, 0.4653778076171875, 0.49340057373046875, 0.52142333984375, 0.5494461059570312, 0.5774688720703125, 0.6054916381835938, 0.633514404296875, 0.6615371704101562, 0.6895599365234375, 0.7175827026367188, 0.74560546875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 1.0, 4.0, 12.0, 11.0, 10.0, 20.0, 17.0, 24.0, 34.0, 33.0, 36.0, 39.0, 40.0, 48.0, 34.0, 47.0, 46.0, 53.0, 47.0, 48.0, 46.0, 42.0, 35.0, 42.0, 32.0, 24.0, 39.0, 24.0, 27.0, 15.0, 14.0, 11.0, 9.0, 7.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246337890625, -0.23920059204101562, -0.23206329345703125, -0.22492599487304688, -0.2177886962890625, -0.21065139770507812, -0.20351409912109375, -0.19637680053710938, -0.189239501953125, -0.18210220336914062, -0.17496490478515625, -0.16782760620117188, -0.1606903076171875, -0.15355300903320312, -0.14641571044921875, -0.13927841186523438, -0.13214111328125, -0.12500381469726562, -0.11786651611328125, -0.11072921752929688, -0.1035919189453125, -0.09645462036132812, -0.08931732177734375, -0.08218002319335938, -0.075042724609375, -0.06790542602539062, -0.06076812744140625, -0.053630828857421875, -0.0464935302734375, -0.039356231689453125, -0.03221893310546875, -0.025081634521484375, -0.0179443359375, -0.010807037353515625, -0.00366973876953125, 0.003467559814453125, 0.0106048583984375, 0.017742156982421875, 0.02487945556640625, 0.032016754150390625, 0.039154052734375, 0.046291351318359375, 0.05342864990234375, 0.060565948486328125, 0.0677032470703125, 0.07484054565429688, 0.08197784423828125, 0.08911514282226562, 0.09625244140625, 0.10338973999023438, 0.11052703857421875, 0.11766433715820312, 0.1248016357421875, 0.13193893432617188, 0.13907623291015625, 0.14621353149414062, 0.153350830078125, 0.16048812866210938, 0.16762542724609375, 0.17476272583007812, 0.1819000244140625, 0.18903732299804688, 0.19617462158203125, 0.20331192016601562, 0.21044921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 11.0, 13.0, 18.0, 20.0, 37.0, 43.0, 46.0, 73.0, 114.0, 164.0, 297.0, 1068.0, 8642.0, 4046995.0, 131870.0, 3483.0, 718.0, 259.0, 120.0, 62.0, 69.0, 47.0, 30.0, 34.0, 24.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.0960235595703125, -3.016265869140625, -2.9365081787109375, -2.85675048828125, -2.7769927978515625, -2.697235107421875, -2.6174774169921875, -2.5377197265625, -2.4579620361328125, -2.378204345703125, -2.2984466552734375, -2.21868896484375, -2.1389312744140625, -2.059173583984375, -1.9794158935546875, -1.899658203125, -1.8199005126953125, -1.740142822265625, -1.6603851318359375, -1.58062744140625, -1.5008697509765625, -1.421112060546875, -1.3413543701171875, -1.2615966796875, -1.1818389892578125, -1.102081298828125, -1.0223236083984375, -0.94256591796875, -0.8628082275390625, -0.783050537109375, -0.7032928466796875, -0.62353515625, -0.5437774658203125, -0.464019775390625, -0.3842620849609375, -0.30450439453125, -0.2247467041015625, -0.144989013671875, -0.0652313232421875, 0.0145263671875, 0.0942840576171875, 0.174041748046875, 0.2537994384765625, 0.33355712890625, 0.4133148193359375, 0.493072509765625, 0.5728302001953125, 0.652587890625, 0.7323455810546875, 0.812103271484375, 0.8918609619140625, 0.97161865234375, 1.0513763427734375, 1.131134033203125, 1.2108917236328125, 1.2906494140625, 1.3704071044921875, 1.450164794921875, 1.5299224853515625, 1.60968017578125, 1.6894378662109375, 1.769195556640625, 1.8489532470703125, 1.9287109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 14.0, 29.0, 170.0, 3608.0, 197.0, 36.0, 10.0, 9.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.7155685424804688, -1.6743011474609375, -1.6330337524414062, -1.591766357421875, -1.5504989624023438, -1.5092315673828125, -1.4679641723632812, -1.42669677734375, -1.3854293823242188, -1.3441619873046875, -1.3028945922851562, -1.261627197265625, -1.2203598022460938, -1.1790924072265625, -1.1378250122070312, -1.0965576171875, -1.0552902221679688, -1.0140228271484375, -0.9727554321289062, -0.931488037109375, -0.8902206420898438, -0.8489532470703125, -0.8076858520507812, -0.76641845703125, -0.7251510620117188, -0.6838836669921875, -0.6426162719726562, -0.601348876953125, -0.5600814819335938, -0.5188140869140625, -0.47754669189453125, -0.436279296875, -0.39501190185546875, -0.3537445068359375, -0.31247711181640625, -0.271209716796875, -0.22994232177734375, -0.1886749267578125, -0.14740753173828125, -0.10614013671875, -0.06487274169921875, -0.0236053466796875, 0.01766204833984375, 0.058929443359375, 0.10019683837890625, 0.1414642333984375, 0.18273162841796875, 0.2239990234375, 0.26526641845703125, 0.3065338134765625, 0.34780120849609375, 0.389068603515625, 0.43033599853515625, 0.4716033935546875, 0.5128707885742188, 0.55413818359375, 0.5954055786132812, 0.6366729736328125, 0.6779403686523438, 0.719207763671875, 0.7604751586914062, 0.8017425537109375, 0.8430099487304688, 0.88427734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 14.0, 25.0, 81.0, 233.0, 374.0, 184.0, 51.0, 18.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.567192077636719, -5.452269077301025, -5.33734655380249, -5.222423553466797, -5.1075005531311035, -4.99257755279541, -4.877655029296875, -4.762732028961182, -4.647809028625488, -4.532886028289795, -4.41796350479126, -4.303040504455566, -4.188117504119873, -4.07319450378418, -3.9582719802856445, -3.843348979949951, -3.728426218032837, -3.6135034561157227, -3.4985804557800293, -3.383657693862915, -3.2687346935272217, -3.1538119316101074, -3.038888931274414, -2.9239661693573, -2.8090434074401855, -2.6941206455230713, -2.579197645187378, -2.4642748832702637, -2.3493518829345703, -2.234429121017456, -2.119506359100342, -2.0045833587646484, -1.8896605968475342, -1.7747377157211304, -1.6598148345947266, -1.5448920726776123, -1.429969072341919, -1.3150463104248047, -1.2001234292984009, -1.085200548171997, -0.9702776670455933, -0.8553547859191895, -0.7404319047927856, -0.6255090832710266, -0.5105862021446228, -0.395663321018219, -0.28074049949645996, -0.16581761837005615, -0.050894737243652344, 0.06402812898159027, 0.17895099520683289, 0.2938738465309143, 0.4087967276573181, 0.5237196087837219, 0.638642430305481, 0.7535653114318848, 0.8684881925582886, 0.9834110736846924, 1.0983339548110962, 1.2132568359375, 1.3281795978546143, 1.4431025981903076, 1.5580253601074219, 1.6729482412338257, 1.7878711223602295]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 13.0, 18.0, 16.0, 22.0, 27.0, 33.0, 49.0, 43.0, 42.0, 53.0, 53.0, 59.0, 61.0, 68.0, 65.0, 46.0, 55.0, 44.0, 39.0, 34.0, 34.0, 25.0, 22.0, 16.0, 11.0, 9.0, 12.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7369763851165771, -1.688307523727417, -1.6396386623382568, -1.5909698009490967, -1.542301058769226, -1.493632197380066, -1.4449633359909058, -1.3962944746017456, -1.347625732421875, -1.2989568710327148, -1.2502880096435547, -1.2016191482543945, -1.152950406074524, -1.1042815446853638, -1.0556126832962036, -1.0069438219070435, -0.9582749605178833, -0.9096060991287231, -0.8609372973442078, -0.8122684359550476, -0.7635996341705322, -0.7149307727813721, -0.6662619113922119, -0.6175930500030518, -0.5689242482185364, -0.5202553868293762, -0.47158658504486084, -0.4229177236557007, -0.3742488920688629, -0.32558006048202515, -0.276911199092865, -0.22824236750602722, -0.17957353591918945, -0.13090470433235168, -0.08223585784435272, -0.03356701135635376, 0.015101820230484009, 0.06377065181732178, 0.11243951320648193, 0.1611083447933197, 0.20977717638015747, 0.25844600796699524, 0.307114839553833, 0.35578370094299316, 0.40445253252983093, 0.4531213641166687, 0.5017902255058289, 0.5504590272903442, 0.5991278886795044, 0.6477967500686646, 0.6964655518531799, 0.7451344132423401, 0.7938032150268555, 0.8424720764160156, 0.8911409378051758, 0.9398097991943359, 0.9884786009788513, 1.0371474027633667, 1.0858162641525269, 1.134485125541687, 1.1831539869308472, 1.2318227291107178, 1.280491590499878, 1.329160451889038, 1.3778293132781982]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 5.0, 14.0, 25.0, 27.0, 42.0, 62.0, 101.0, 157.0, 198.0, 305.0, 469.0, 749.0, 1106.0, 1860.0, 3004.0, 5051.0, 8424.0, 14055.0, 24676.0, 45371.0, 88630.0, 182522.0, 278690.0, 190445.0, 93278.0, 46930.0, 25539.0, 14580.0, 8642.0, 5055.0, 3179.0, 1929.0, 1154.0, 824.0, 490.0, 310.0, 213.0, 143.0, 103.0, 58.0, 35.0, 29.0, 22.0, 11.0, 11.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.414306640625, -0.4019508361816406, -0.38959503173828125, -0.3772392272949219, -0.3648834228515625, -0.3525276184082031, -0.34017181396484375, -0.3278160095214844, -0.315460205078125, -0.3031044006347656, -0.29074859619140625, -0.2783927917480469, -0.2660369873046875, -0.2536811828613281, -0.24132537841796875, -0.22896957397460938, -0.21661376953125, -0.20425796508789062, -0.19190216064453125, -0.17954635620117188, -0.1671905517578125, -0.15483474731445312, -0.14247894287109375, -0.13012313842773438, -0.117767333984375, -0.10541152954101562, -0.09305572509765625, -0.08069992065429688, -0.0683441162109375, -0.055988311767578125, -0.04363250732421875, -0.031276702880859375, -0.0189208984375, -0.006565093994140625, 0.00579071044921875, 0.018146514892578125, 0.0305023193359375, 0.042858123779296875, 0.05521392822265625, 0.06756973266601562, 0.079925537109375, 0.09228134155273438, 0.10463714599609375, 0.11699295043945312, 0.1293487548828125, 0.14170455932617188, 0.15406036376953125, 0.16641616821289062, 0.17877197265625, 0.19112777709960938, 0.20348358154296875, 0.21583938598632812, 0.2281951904296875, 0.24055099487304688, 0.25290679931640625, 0.2652626037597656, 0.277618408203125, 0.2899742126464844, 0.30233001708984375, 0.3146858215332031, 0.3270416259765625, 0.3393974304199219, 0.35175323486328125, 0.3641090393066406, 0.37646484375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 11.0, 5.0, 9.0, 4.0, 14.0, 18.0, 12.0, 16.0, 16.0, 23.0, 28.0, 35.0, 25.0, 26.0, 53.0, 56.0, 55.0, 52.0, 42.0, 37.0, 47.0, 43.0, 40.0, 57.0, 36.0, 40.0, 24.0, 27.0, 28.0, 26.0, 22.0, 15.0, 17.0, 15.0, 11.0, 3.0, 7.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.276123046875, -0.26850128173828125, -0.2608795166015625, -0.25325775146484375, -0.245635986328125, -0.23801422119140625, -0.2303924560546875, -0.22277069091796875, -0.21514892578125, -0.20752716064453125, -0.1999053955078125, -0.19228363037109375, -0.184661865234375, -0.17704010009765625, -0.1694183349609375, -0.16179656982421875, -0.1541748046875, -0.14655303955078125, -0.1389312744140625, -0.13130950927734375, -0.123687744140625, -0.11606597900390625, -0.1084442138671875, -0.10082244873046875, -0.09320068359375, -0.08557891845703125, -0.0779571533203125, -0.07033538818359375, -0.062713623046875, -0.05509185791015625, -0.0474700927734375, -0.03984832763671875, -0.0322265625, -0.02460479736328125, -0.0169830322265625, -0.00936126708984375, -0.001739501953125, 0.00588226318359375, 0.0135040283203125, 0.02112579345703125, 0.02874755859375, 0.03636932373046875, 0.0439910888671875, 0.05161285400390625, 0.059234619140625, 0.06685638427734375, 0.0744781494140625, 0.08209991455078125, 0.0897216796875, 0.09734344482421875, 0.1049652099609375, 0.11258697509765625, 0.120208740234375, 0.12783050537109375, 0.1354522705078125, 0.14307403564453125, 0.15069580078125, 0.15831756591796875, 0.1659393310546875, 0.17356109619140625, 0.181182861328125, 0.18880462646484375, 0.1964263916015625, 0.20404815673828125, 0.211669921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 11.0, 28.0, 27.0, 54.0, 56.0, 113.0, 168.0, 231.0, 400.0, 689.0, 1268.0, 2467.0, 5210.0, 12077.0, 32922.0, 112516.0, 426444.0, 328512.0, 81379.0, 25347.0, 9715.0, 4175.0, 2035.0, 1103.0, 582.0, 392.0, 225.0, 137.0, 92.0, 47.0, 31.0, 25.0, 20.0, 10.0, 5.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.697265625, -0.6753921508789062, -0.6535186767578125, -0.6316452026367188, -0.609771728515625, -0.5878982543945312, -0.5660247802734375, -0.5441513061523438, -0.52227783203125, -0.5004043579101562, -0.4785308837890625, -0.45665740966796875, -0.434783935546875, -0.41291046142578125, -0.3910369873046875, -0.36916351318359375, -0.3472900390625, -0.32541656494140625, -0.3035430908203125, -0.28166961669921875, -0.259796142578125, -0.23792266845703125, -0.2160491943359375, -0.19417572021484375, -0.17230224609375, -0.15042877197265625, -0.1285552978515625, -0.10668182373046875, -0.084808349609375, -0.06293487548828125, -0.0410614013671875, -0.01918792724609375, 0.002685546875, 0.02455902099609375, 0.0464324951171875, 0.06830596923828125, 0.090179443359375, 0.11205291748046875, 0.1339263916015625, 0.15579986572265625, 0.17767333984375, 0.19954681396484375, 0.2214202880859375, 0.24329376220703125, 0.265167236328125, 0.28704071044921875, 0.3089141845703125, 0.33078765869140625, 0.3526611328125, 0.37453460693359375, 0.3964080810546875, 0.41828155517578125, 0.440155029296875, 0.46202850341796875, 0.4839019775390625, 0.5057754516601562, 0.52764892578125, 0.5495223999023438, 0.5713958740234375, 0.5932693481445312, 0.615142822265625, 0.6370162963867188, 0.6588897705078125, 0.6807632446289062, 0.70263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 2.0, 7.0, 15.0, 8.0, 10.0, 14.0, 19.0, 19.0, 34.0, 45.0, 47.0, 50.0, 52.0, 51.0, 56.0, 54.0, 60.0, 56.0, 60.0, 71.0, 47.0, 37.0, 43.0, 25.0, 26.0, 19.0, 18.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4541015625, -1.409881591796875, -1.36566162109375, -1.321441650390625, -1.2772216796875, -1.233001708984375, -1.18878173828125, -1.144561767578125, -1.100341796875, -1.056121826171875, -1.01190185546875, -0.967681884765625, -0.9234619140625, -0.879241943359375, -0.83502197265625, -0.790802001953125, -0.74658203125, -0.702362060546875, -0.65814208984375, -0.613922119140625, -0.5697021484375, -0.525482177734375, -0.48126220703125, -0.437042236328125, -0.392822265625, -0.348602294921875, -0.30438232421875, -0.260162353515625, -0.2159423828125, -0.171722412109375, -0.12750244140625, -0.083282470703125, -0.0390625, 0.005157470703125, 0.04937744140625, 0.093597412109375, 0.1378173828125, 0.182037353515625, 0.22625732421875, 0.270477294921875, 0.314697265625, 0.358917236328125, 0.40313720703125, 0.447357177734375, 0.4915771484375, 0.535797119140625, 0.58001708984375, 0.624237060546875, 0.66845703125, 0.712677001953125, 0.75689697265625, 0.801116943359375, 0.8453369140625, 0.889556884765625, 0.93377685546875, 0.977996826171875, 1.022216796875, 1.066436767578125, 1.11065673828125, 1.154876708984375, 1.1990966796875, 1.243316650390625, 1.28753662109375, 1.331756591796875, 1.3759765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 10.0, 14.0, 20.0, 36.0, 58.0, 123.0, 224.0, 537.0, 1238.0, 3678.0, 17622.0, 189456.0, 722939.0, 96710.0, 11240.0, 2732.0, 1005.0, 442.0, 220.0, 101.0, 60.0, 32.0, 18.0, 14.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.482177734375, -0.4705238342285156, -0.45886993408203125, -0.4472160339355469, -0.4355621337890625, -0.4239082336425781, -0.41225433349609375, -0.4006004333496094, -0.388946533203125, -0.3772926330566406, -0.36563873291015625, -0.3539848327636719, -0.3423309326171875, -0.3306770324707031, -0.31902313232421875, -0.3073692321777344, -0.29571533203125, -0.2840614318847656, -0.27240753173828125, -0.2607536315917969, -0.2490997314453125, -0.23744583129882812, -0.22579193115234375, -0.21413803100585938, -0.202484130859375, -0.19083023071289062, -0.17917633056640625, -0.16752243041992188, -0.1558685302734375, -0.14421463012695312, -0.13256072998046875, -0.12090682983398438, -0.1092529296875, -0.09759902954101562, -0.08594512939453125, -0.07429122924804688, -0.0626373291015625, -0.050983428955078125, -0.03932952880859375, -0.027675628662109375, -0.016021728515625, -0.004367828369140625, 0.00728607177734375, 0.018939971923828125, 0.0305938720703125, 0.042247772216796875, 0.05390167236328125, 0.06555557250976562, 0.07720947265625, 0.08886337280273438, 0.10051727294921875, 0.11217117309570312, 0.1238250732421875, 0.13547897338867188, 0.14713287353515625, 0.15878677368164062, 0.170440673828125, 0.18209457397460938, 0.19374847412109375, 0.20540237426757812, 0.2170562744140625, 0.22871017456054688, 0.24036407470703125, 0.2520179748535156, 0.263671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 6.0, 5.0, 12.0, 18.0, 15.0, 28.0, 58.0, 57.0, 83.0, 115.0, 109.0, 122.0, 93.0, 79.0, 53.0, 41.0, 33.0, 15.0, 15.0, 11.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.023313522338867e-05, -3.877934068441391e-05, -3.732554614543915e-05, -3.5871751606464386e-05, -3.4417957067489624e-05, -3.296416252851486e-05, -3.15103679895401e-05, -3.0056573450565338e-05, -2.8602778911590576e-05, -2.7148984372615814e-05, -2.5695189833641052e-05, -2.424139529466629e-05, -2.278760075569153e-05, -2.1333806216716766e-05, -1.9880011677742004e-05, -1.8426217138767242e-05, -1.697242259979248e-05, -1.551862806081772e-05, -1.4064833521842957e-05, -1.2611038982868195e-05, -1.1157244443893433e-05, -9.70344990491867e-06, -8.249655365943909e-06, -6.795860826969147e-06, -5.342066287994385e-06, -3.888271749019623e-06, -2.434477210044861e-06, -9.806826710700989e-07, 4.731118679046631e-07, 1.926906406879425e-06, 3.380700945854187e-06, 4.834495484828949e-06, 6.288290023803711e-06, 7.742084562778473e-06, 9.195879101753235e-06, 1.0649673640727997e-05, 1.2103468179702759e-05, 1.355726271867752e-05, 1.5011057257652283e-05, 1.6464851796627045e-05, 1.7918646335601807e-05, 1.937244087457657e-05, 2.082623541355133e-05, 2.2280029952526093e-05, 2.3733824491500854e-05, 2.5187619030475616e-05, 2.664141356945038e-05, 2.809520810842514e-05, 2.9549002647399902e-05, 3.1002797186374664e-05, 3.2456591725349426e-05, 3.391038626432419e-05, 3.536418080329895e-05, 3.681797534227371e-05, 3.8271769881248474e-05, 3.9725564420223236e-05, 4.1179358959198e-05, 4.263315349817276e-05, 4.408694803714752e-05, 4.5540742576122284e-05, 4.6994537115097046e-05, 4.844833165407181e-05, 4.990212619304657e-05, 5.135592073202133e-05, 5.2809715270996094e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 6.0, 11.0, 23.0, 27.0, 46.0, 59.0, 99.0, 142.0, 283.0, 477.0, 943.0, 2229.0, 6490.0, 25430.0, 131253.0, 491219.0, 309384.0, 60746.0, 12963.0, 3784.0, 1384.0, 638.0, 363.0, 214.0, 126.0, 72.0, 44.0, 27.0, 19.0, 9.0, 8.0, 11.0, 7.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2508888244628906, -0.24323272705078125, -0.23557662963867188, -0.2279205322265625, -0.22026443481445312, -0.21260833740234375, -0.20495223999023438, -0.197296142578125, -0.18964004516601562, -0.18198394775390625, -0.17432785034179688, -0.1666717529296875, -0.15901565551757812, -0.15135955810546875, -0.14370346069335938, -0.13604736328125, -0.12839126586914062, -0.12073516845703125, -0.11307907104492188, -0.1054229736328125, -0.09776687622070312, -0.09011077880859375, -0.08245468139648438, -0.074798583984375, -0.06714248657226562, -0.05948638916015625, -0.051830291748046875, -0.0441741943359375, -0.036518096923828125, -0.02886199951171875, -0.021205902099609375, -0.0135498046875, -0.005893707275390625, 0.00176239013671875, 0.009418487548828125, 0.0170745849609375, 0.024730682373046875, 0.03238677978515625, 0.040042877197265625, 0.047698974609375, 0.055355072021484375, 0.06301116943359375, 0.07066726684570312, 0.0783233642578125, 0.08597946166992188, 0.09363555908203125, 0.10129165649414062, 0.10894775390625, 0.11660385131835938, 0.12425994873046875, 0.13191604614257812, 0.1395721435546875, 0.14722824096679688, 0.15488433837890625, 0.16254043579101562, 0.170196533203125, 0.17785263061523438, 0.18550872802734375, 0.19316482543945312, 0.2008209228515625, 0.20847702026367188, 0.21613311767578125, 0.22378921508789062, 0.2314453125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 13.0, 15.0, 23.0, 36.0, 58.0, 54.0, 84.0, 99.0, 93.0, 104.0, 98.0, 79.0, 69.0, 44.0, 37.0, 24.0, 16.0, 12.0, 11.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.449951171875, -0.43747711181640625, -0.4250030517578125, -0.41252899169921875, -0.400054931640625, -0.38758087158203125, -0.3751068115234375, -0.36263275146484375, -0.35015869140625, -0.33768463134765625, -0.3252105712890625, -0.31273651123046875, -0.300262451171875, -0.28778839111328125, -0.2753143310546875, -0.26284027099609375, -0.2503662109375, -0.23789215087890625, -0.2254180908203125, -0.21294403076171875, -0.200469970703125, -0.18799591064453125, -0.1755218505859375, -0.16304779052734375, -0.15057373046875, -0.13809967041015625, -0.1256256103515625, -0.11315155029296875, -0.100677490234375, -0.08820343017578125, -0.0757293701171875, -0.06325531005859375, -0.05078125, -0.03830718994140625, -0.0258331298828125, -0.01335906982421875, -0.000885009765625, 0.01158905029296875, 0.0240631103515625, 0.03653717041015625, 0.04901123046875, 0.06148529052734375, 0.0739593505859375, 0.08643341064453125, 0.098907470703125, 0.11138153076171875, 0.1238555908203125, 0.13632965087890625, 0.1488037109375, 0.16127777099609375, 0.1737518310546875, 0.18622589111328125, 0.198699951171875, 0.21117401123046875, 0.2236480712890625, 0.23612213134765625, 0.24859619140625, 0.26107025146484375, 0.2735443115234375, 0.28601837158203125, 0.298492431640625, 0.31096649169921875, 0.3234405517578125, 0.33591461181640625, 0.348388671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 8.0, 17.0, 29.0, 61.0, 134.0, 216.0, 278.0, 161.0, 50.0, 28.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.122644901275635, -6.786108493804932, -6.449572563171387, -6.113036155700684, -5.776500225067139, -5.4399638175964355, -5.103427886962891, -4.7668914794921875, -4.430355072021484, -4.093818664550781, -3.7572827339172363, -3.420746326446533, -3.0842103958129883, -2.747673988342285, -2.411137819290161, -2.074601650238037, -1.7380657196044922, -1.4015295505523682, -1.0649933815002441, -0.7284570932388306, -0.39192092418670654, -0.05538475513458252, 0.28115153312683105, 0.6176877021789551, 0.9542238712310791, 1.2907600402832031, 1.6272962093353271, 1.9638324975967407, 2.3003687858581543, 2.636904716491699, 2.9734411239624023, 3.3099772930145264, 3.646512985229492, 3.983049154281616, 4.31958532333374, 4.656121730804443, 4.992657661437988, 5.329194068908691, 5.6657304763793945, 6.0022664070129395, 6.338802337646484, 6.6753387451171875, 7.011874675750732, 7.3484110832214355, 7.6849470138549805, 8.021483421325684, 8.358019828796387, 8.694555282592773, 9.031091690063477, 9.36762809753418, 9.704164505004883, 10.04069995880127, 10.377236366271973, 10.713772773742676, 11.050309181213379, 11.386844635009766, 11.723381996154785, 12.059918403625488, 12.396454811096191, 12.732990264892578, 13.069526672363281, 13.406063079833984, 13.742599487304688, 14.07913589477539, 14.415671348571777]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 14.0, 5.0, 8.0, 17.0, 29.0, 13.0, 23.0, 22.0, 17.0, 25.0, 29.0, 39.0, 22.0, 41.0, 39.0, 51.0, 38.0, 39.0, 34.0, 49.0, 31.0, 34.0, 44.0, 37.0, 31.0, 35.0, 25.0, 12.0, 23.0, 23.0, 10.0, 19.0, 18.0, 14.0, 8.0, 10.0, 7.0, 11.0, 8.0, 1.0, 8.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 3.0], "bins": [-5.70883321762085, -5.541421413421631, -5.374009132385254, -5.206597328186035, -5.039185047149658, -4.8717732429504395, -4.7043609619140625, -4.536949157714844, -4.369537353515625, -4.202125549316406, -4.034713268280029, -3.8673014640808105, -3.6998894214630127, -3.532477378845215, -3.365065336227417, -3.197653293609619, -3.0302412509918213, -2.8628292083740234, -2.6954171657562256, -2.5280051231384277, -2.360593318939209, -2.193181276321411, -2.0257692337036133, -1.858357310295105, -1.6909452676773071, -1.5235332250595093, -1.356121301651001, -1.1887092590332031, -1.0212972164154053, -0.853885293006897, -0.6864732503890991, -0.5190613269805908, -0.35164928436279297, -0.1842372864484787, -0.01682528853416443, 0.15058672428131104, 0.3179987072944641, 0.4854106903076172, 0.652822732925415, 0.8202346563339233, 0.9876466989517212, 1.155058741569519, 1.3224706649780273, 1.4898827075958252, 1.657294750213623, 1.8247066736221313, 1.9921187162399292, 2.1595306396484375, 2.3269426822662354, 2.494354724884033, 2.661766767501831, 2.829178810119629, 2.9965906143188477, 3.1640026569366455, 3.3314146995544434, 3.498826503753662, 3.666238784790039, 3.833650827407837, 4.001062870025635, 4.1684746742248535, 4.3358869552612305, 4.503298759460449, 4.670710563659668, 4.838122844696045, 5.005534648895264]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 3.0, 7.0, 6.0, 8.0, 7.0, 12.0, 28.0, 44.0, 31.0, 58.0, 82.0, 105.0, 132.0, 215.0, 317.0, 431.0, 599.0, 985.0, 1446.0, 2431.0, 4020.0, 7956.0, 18302.0, 68608.0, 3794607.0, 236065.0, 31690.0, 11480.0, 5830.0, 3123.0, 1941.0, 1229.0, 804.0, 536.0, 351.0, 238.0, 178.0, 109.0, 85.0, 63.0, 30.0, 30.0, 21.0, 14.0, 7.0, 5.0, 9.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8818359375, -0.8557052612304688, -0.8295745849609375, -0.8034439086914062, -0.777313232421875, -0.7511825561523438, -0.7250518798828125, -0.6989212036132812, -0.67279052734375, -0.6466598510742188, -0.6205291748046875, -0.5943984985351562, -0.568267822265625, -0.5421371459960938, -0.5160064697265625, -0.48987579345703125, -0.4637451171875, -0.43761444091796875, -0.4114837646484375, -0.38535308837890625, -0.359222412109375, -0.33309173583984375, -0.3069610595703125, -0.28083038330078125, -0.25469970703125, -0.22856903076171875, -0.2024383544921875, -0.17630767822265625, -0.150177001953125, -0.12404632568359375, -0.0979156494140625, -0.07178497314453125, -0.045654296875, -0.01952362060546875, 0.0066070556640625, 0.03273773193359375, 0.058868408203125, 0.08499908447265625, 0.1111297607421875, 0.13726043701171875, 0.16339111328125, 0.18952178955078125, 0.2156524658203125, 0.24178314208984375, 0.267913818359375, 0.29404449462890625, 0.3201751708984375, 0.34630584716796875, 0.3724365234375, 0.39856719970703125, 0.4246978759765625, 0.45082855224609375, 0.476959228515625, 0.5030899047851562, 0.5292205810546875, 0.5553512573242188, 0.58148193359375, 0.6076126098632812, 0.6337432861328125, 0.6598739624023438, 0.686004638671875, 0.7121353149414062, 0.7382659912109375, 0.7643966674804688, 0.79052734375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 4.0, 8.0, 13.0, 9.0, 16.0, 23.0, 23.0, 29.0, 24.0, 37.0, 39.0, 38.0, 35.0, 52.0, 48.0, 52.0, 54.0, 47.0, 38.0, 41.0, 50.0, 38.0, 36.0, 29.0, 32.0, 35.0, 25.0, 26.0, 11.0, 12.0, 14.0, 20.0, 8.0, 7.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.32505035400390625, -0.3151397705078125, -0.30522918701171875, -0.295318603515625, -0.28540802001953125, -0.2754974365234375, -0.26558685302734375, -0.25567626953125, -0.24576568603515625, -0.2358551025390625, -0.22594451904296875, -0.216033935546875, -0.20612335205078125, -0.1962127685546875, -0.18630218505859375, -0.1763916015625, -0.16648101806640625, -0.1565704345703125, -0.14665985107421875, -0.136749267578125, -0.12683868408203125, -0.1169281005859375, -0.10701751708984375, -0.09710693359375, -0.08719635009765625, -0.0772857666015625, -0.06737518310546875, -0.057464599609375, -0.04755401611328125, -0.0376434326171875, -0.02773284912109375, -0.017822265625, -0.00791168212890625, 0.0019989013671875, 0.01190948486328125, 0.021820068359375, 0.03173065185546875, 0.0416412353515625, 0.05155181884765625, 0.06146240234375, 0.07137298583984375, 0.0812835693359375, 0.09119415283203125, 0.101104736328125, 0.11101531982421875, 0.1209259033203125, 0.13083648681640625, 0.1407470703125, 0.15065765380859375, 0.1605682373046875, 0.17047882080078125, 0.180389404296875, 0.19029998779296875, 0.2002105712890625, 0.21012115478515625, 0.22003173828125, 0.22994232177734375, 0.2398529052734375, 0.24976348876953125, 0.259674072265625, 0.26958465576171875, 0.2794952392578125, 0.28940582275390625, 0.29931640625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 23.0, 20.0, 23.0, 39.0, 43.0, 79.0, 95.0, 156.0, 252.0, 436.0, 944.0, 2410.0, 7841.0, 34619.0, 821932.0, 3270736.0, 40730.0, 8878.0, 2709.0, 1062.0, 477.0, 233.0, 138.0, 109.0, 59.0, 46.0, 35.0, 35.0, 16.0, 22.0, 17.0, 11.0, 6.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.359375, -1.320587158203125, -1.28179931640625, -1.243011474609375, -1.2042236328125, -1.165435791015625, -1.12664794921875, -1.087860107421875, -1.049072265625, -1.010284423828125, -0.97149658203125, -0.932708740234375, -0.8939208984375, -0.855133056640625, -0.81634521484375, -0.777557373046875, -0.73876953125, -0.699981689453125, -0.66119384765625, -0.622406005859375, -0.5836181640625, -0.544830322265625, -0.50604248046875, -0.467254638671875, -0.428466796875, -0.389678955078125, -0.35089111328125, -0.312103271484375, -0.2733154296875, -0.234527587890625, -0.19573974609375, -0.156951904296875, -0.1181640625, -0.079376220703125, -0.04058837890625, -0.001800537109375, 0.0369873046875, 0.075775146484375, 0.11456298828125, 0.153350830078125, 0.192138671875, 0.230926513671875, 0.26971435546875, 0.308502197265625, 0.3472900390625, 0.386077880859375, 0.42486572265625, 0.463653564453125, 0.50244140625, 0.541229248046875, 0.58001708984375, 0.618804931640625, 0.6575927734375, 0.696380615234375, 0.73516845703125, 0.773956298828125, 0.812744140625, 0.851531982421875, 0.89031982421875, 0.929107666015625, 0.9678955078125, 1.006683349609375, 1.04547119140625, 1.084259033203125, 1.123046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 13.0, 20.0, 29.0, 44.0, 108.0, 681.0, 2889.0, 135.0, 60.0, 37.0, 23.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2607421875, -1.2293243408203125, -1.197906494140625, -1.1664886474609375, -1.13507080078125, -1.1036529541015625, -1.072235107421875, -1.0408172607421875, -1.0093994140625, -0.9779815673828125, -0.946563720703125, -0.9151458740234375, -0.88372802734375, -0.8523101806640625, -0.820892333984375, -0.7894744873046875, -0.758056640625, -0.7266387939453125, -0.695220947265625, -0.6638031005859375, -0.63238525390625, -0.6009674072265625, -0.569549560546875, -0.5381317138671875, -0.5067138671875, -0.4752960205078125, -0.443878173828125, -0.4124603271484375, -0.38104248046875, -0.3496246337890625, -0.318206787109375, -0.2867889404296875, -0.25537109375, -0.2239532470703125, -0.192535400390625, -0.1611175537109375, -0.12969970703125, -0.0982818603515625, -0.066864013671875, -0.0354461669921875, -0.0040283203125, 0.0273895263671875, 0.058807373046875, 0.0902252197265625, 0.12164306640625, 0.1530609130859375, 0.184478759765625, 0.2158966064453125, 0.247314453125, 0.2787322998046875, 0.310150146484375, 0.3415679931640625, 0.37298583984375, 0.4044036865234375, 0.435821533203125, 0.4672393798828125, 0.4986572265625, 0.5300750732421875, 0.561492919921875, 0.5929107666015625, 0.62432861328125, 0.6557464599609375, 0.687164306640625, 0.7185821533203125, 0.75]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 23.0, 48.0, 131.0, 276.0, 283.0, 148.0, 50.0, 15.0, 11.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9765621423721313, -1.8348950147628784, -1.693228006362915, -1.551560878753662, -1.4098937511444092, -1.2682267427444458, -1.1265596151351929, -0.9848925471305847, -0.8432254791259766, -0.7015584111213684, -0.5598913431167603, -0.4182242155075073, -0.27655714750289917, -0.13489007949829102, 0.006777048110961914, 0.14844411611557007, 0.2901111841201782, 0.4317782521247864, 0.5734453201293945, 0.7151124477386475, 0.8567795157432556, 0.9984465837478638, 1.1401137113571167, 1.28178071975708, 1.423447847366333, 1.565114974975586, 1.7067819833755493, 1.8484491109848022, 1.9901161193847656, 2.1317832469940186, 2.2734503746032715, 2.4151175022125244, 2.5567846298217773, 2.6984517574310303, 2.840118885040283, 2.981785774230957, 3.12345290184021, 3.265120029449463, 3.406787157058716, 3.5484542846679688, 3.6901211738586426, 3.8317883014678955, 3.9734554290771484, 4.115122318267822, 4.256789684295654, 4.398456573486328, 4.54012393951416, 4.681790828704834, 4.823457717895508, 4.965124607086182, 5.106791973114014, 5.2484588623046875, 5.3901262283325195, 5.531793117523193, 5.673460006713867, 5.815127372741699, 5.956794738769531, 6.098461627960205, 6.240128993988037, 6.381795883178711, 6.523463249206543, 6.665130138397217, 6.806797027587891, 6.948464393615723, 7.0901312828063965]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 11.0, 14.0, 16.0, 17.0, 23.0, 14.0, 25.0, 29.0, 39.0, 46.0, 49.0, 40.0, 53.0, 48.0, 40.0, 51.0, 47.0, 60.0, 46.0, 49.0, 41.0, 37.0, 41.0, 22.0, 16.0, 20.0, 18.0, 17.0, 12.0, 7.0, 6.0, 13.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4657471179962158, -1.4160938262939453, -1.3664405345916748, -1.3167871236801147, -1.2671338319778442, -1.2174805402755737, -1.1678271293640137, -1.1181738376617432, -1.0685205459594727, -1.0188672542572021, -0.9692139029502869, -0.9195605516433716, -0.8699072599411011, -0.8202539682388306, -0.7706006169319153, -0.720947265625, -0.6712939739227295, -0.621640682220459, -0.5719873309135437, -0.5223339796066284, -0.4726806879043579, -0.423027366399765, -0.3733740448951721, -0.3237207233905792, -0.27406740188598633, -0.22441408038139343, -0.17476075887680054, -0.12510743737220764, -0.07545411586761475, -0.02580079436302185, 0.023852527141571045, 0.07350584864616394, 0.12315917015075684, 0.17281249165534973, 0.22246581315994263, 0.2721191346645355, 0.3217724561691284, 0.3714257776737213, 0.4210790991783142, 0.4707324206829071, 0.5203857421875, 0.5700390338897705, 0.6196923851966858, 0.6693457365036011, 0.7189990282058716, 0.7686523199081421, 0.8183056712150574, 0.8679590225219727, 0.9176123142242432, 0.9672656059265137, 1.0169188976287842, 1.0665723085403442, 1.1162256002426147, 1.1658788919448853, 1.2155323028564453, 1.2651855945587158, 1.3148388862609863, 1.3644921779632568, 1.4141454696655273, 1.4637988805770874, 1.513452172279358, 1.5631054639816284, 1.6127588748931885, 1.662412166595459, 1.7120654582977295]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 11.0, 9.0, 12.0, 20.0, 30.0, 36.0, 47.0, 66.0, 72.0, 120.0, 187.0, 307.0, 477.0, 855.0, 1560.0, 3109.0, 6440.0, 13781.0, 32801.0, 91299.0, 312042.0, 392365.0, 119401.0, 41268.0, 16610.0, 7623.0, 3635.0, 1806.0, 982.0, 547.0, 325.0, 206.0, 147.0, 93.0, 64.0, 46.0, 35.0, 32.0, 16.0, 18.0, 14.0, 8.0, 8.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0263671875, -0.9971389770507812, -0.9679107666015625, -0.9386825561523438, -0.909454345703125, -0.8802261352539062, -0.8509979248046875, -0.8217697143554688, -0.79254150390625, -0.7633132934570312, -0.7340850830078125, -0.7048568725585938, -0.675628662109375, -0.6464004516601562, -0.6171722412109375, -0.5879440307617188, -0.5587158203125, -0.5294876098632812, -0.5002593994140625, -0.47103118896484375, -0.441802978515625, -0.41257476806640625, -0.3833465576171875, -0.35411834716796875, -0.32489013671875, -0.29566192626953125, -0.2664337158203125, -0.23720550537109375, -0.207977294921875, -0.17874908447265625, -0.1495208740234375, -0.12029266357421875, -0.091064453125, -0.06183624267578125, -0.0326080322265625, -0.00337982177734375, 0.025848388671875, 0.05507659912109375, 0.0843048095703125, 0.11353302001953125, 0.14276123046875, 0.17198944091796875, 0.2012176513671875, 0.23044586181640625, 0.259674072265625, 0.28890228271484375, 0.3181304931640625, 0.34735870361328125, 0.3765869140625, 0.40581512451171875, 0.4350433349609375, 0.46427154541015625, 0.493499755859375, 0.5227279663085938, 0.5519561767578125, 0.5811843872070312, 0.61041259765625, 0.6396408081054688, 0.6688690185546875, 0.6980972290039062, 0.727325439453125, 0.7565536499023438, 0.7857818603515625, 0.8150100708007812, 0.84423828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 6.0, 8.0, 6.0, 5.0, 13.0, 15.0, 18.0, 18.0, 25.0, 19.0, 35.0, 27.0, 34.0, 44.0, 41.0, 49.0, 45.0, 45.0, 51.0, 48.0, 54.0, 49.0, 32.0, 47.0, 38.0, 37.0, 38.0, 27.0, 29.0, 20.0, 12.0, 12.0, 8.0, 17.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3818359375, -0.37113189697265625, -0.3604278564453125, -0.34972381591796875, -0.339019775390625, -0.32831573486328125, -0.3176116943359375, -0.30690765380859375, -0.29620361328125, -0.28549957275390625, -0.2747955322265625, -0.26409149169921875, -0.253387451171875, -0.24268341064453125, -0.2319793701171875, -0.22127532958984375, -0.2105712890625, -0.19986724853515625, -0.1891632080078125, -0.17845916748046875, -0.167755126953125, -0.15705108642578125, -0.1463470458984375, -0.13564300537109375, -0.12493896484375, -0.11423492431640625, -0.1035308837890625, -0.09282684326171875, -0.082122802734375, -0.07141876220703125, -0.0607147216796875, -0.05001068115234375, -0.039306640625, -0.02860260009765625, -0.0178985595703125, -0.00719451904296875, 0.003509521484375, 0.01421356201171875, 0.0249176025390625, 0.03562164306640625, 0.04632568359375, 0.05702972412109375, 0.0677337646484375, 0.07843780517578125, 0.089141845703125, 0.09984588623046875, 0.1105499267578125, 0.12125396728515625, 0.1319580078125, 0.14266204833984375, 0.1533660888671875, 0.16407012939453125, 0.174774169921875, 0.18547821044921875, 0.1961822509765625, 0.20688629150390625, 0.21759033203125, 0.22829437255859375, 0.2389984130859375, 0.24970245361328125, 0.260406494140625, 0.27111053466796875, 0.2818145751953125, 0.29251861572265625, 0.30322265625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 3.0, 2.0, 16.0, 21.0, 28.0, 32.0, 82.0, 166.0, 295.0, 630.0, 1471.0, 3809.0, 11562.0, 43396.0, 300229.0, 585061.0, 75343.0, 17160.0, 5560.0, 1979.0, 867.0, 390.0, 196.0, 93.0, 56.0, 30.0, 24.0, 13.0, 15.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.73828125, -1.6915130615234375, -1.644744873046875, -1.5979766845703125, -1.55120849609375, -1.5044403076171875, -1.457672119140625, -1.4109039306640625, -1.3641357421875, -1.3173675537109375, -1.270599365234375, -1.2238311767578125, -1.17706298828125, -1.1302947998046875, -1.083526611328125, -1.0367584228515625, -0.989990234375, -0.9432220458984375, -0.896453857421875, -0.8496856689453125, -0.80291748046875, -0.7561492919921875, -0.709381103515625, -0.6626129150390625, -0.6158447265625, -0.5690765380859375, -0.522308349609375, -0.4755401611328125, -0.42877197265625, -0.3820037841796875, -0.335235595703125, -0.2884674072265625, -0.24169921875, -0.1949310302734375, -0.148162841796875, -0.1013946533203125, -0.05462646484375, -0.0078582763671875, 0.038909912109375, 0.0856781005859375, 0.1324462890625, 0.1792144775390625, 0.225982666015625, 0.2727508544921875, 0.31951904296875, 0.3662872314453125, 0.413055419921875, 0.4598236083984375, 0.506591796875, 0.5533599853515625, 0.600128173828125, 0.6468963623046875, 0.69366455078125, 0.7404327392578125, 0.787200927734375, 0.8339691162109375, 0.8807373046875, 0.9275054931640625, 0.974273681640625, 1.0210418701171875, 1.06781005859375, 1.1145782470703125, 1.161346435546875, 1.2081146240234375, 1.2548828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 6.0, 10.0, 18.0, 17.0, 29.0, 30.0, 30.0, 27.0, 32.0, 40.0, 50.0, 55.0, 46.0, 53.0, 55.0, 68.0, 55.0, 45.0, 55.0, 42.0, 39.0, 29.0, 27.0, 30.0, 21.0, 17.0, 16.0, 16.0, 9.0, 3.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.802642822265625, -1.74200439453125, -1.681365966796875, -1.6207275390625, -1.560089111328125, -1.49945068359375, -1.438812255859375, -1.378173828125, -1.317535400390625, -1.25689697265625, -1.196258544921875, -1.1356201171875, -1.074981689453125, -1.01434326171875, -0.953704833984375, -0.89306640625, -0.832427978515625, -0.77178955078125, -0.711151123046875, -0.6505126953125, -0.589874267578125, -0.52923583984375, -0.468597412109375, -0.407958984375, -0.347320556640625, -0.28668212890625, -0.226043701171875, -0.1654052734375, -0.104766845703125, -0.04412841796875, 0.016510009765625, 0.0771484375, 0.137786865234375, 0.19842529296875, 0.259063720703125, 0.3197021484375, 0.380340576171875, 0.44097900390625, 0.501617431640625, 0.562255859375, 0.622894287109375, 0.68353271484375, 0.744171142578125, 0.8048095703125, 0.865447998046875, 0.92608642578125, 0.986724853515625, 1.04736328125, 1.108001708984375, 1.16864013671875, 1.229278564453125, 1.2899169921875, 1.350555419921875, 1.41119384765625, 1.471832275390625, 1.532470703125, 1.593109130859375, 1.65374755859375, 1.714385986328125, 1.7750244140625, 1.835662841796875, 1.89630126953125, 1.956939697265625, 2.017578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 14.0, 23.0, 26.0, 32.0, 46.0, 72.0, 124.0, 172.0, 256.0, 546.0, 926.0, 1984.0, 5488.0, 29126.0, 722163.0, 264476.0, 15608.0, 3946.0, 1615.0, 764.0, 393.0, 264.0, 161.0, 96.0, 59.0, 51.0, 30.0, 18.0, 15.0, 12.0, 9.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9462890625, -0.9191360473632812, -0.8919830322265625, -0.8648300170898438, -0.837677001953125, -0.8105239868164062, -0.7833709716796875, -0.7562179565429688, -0.72906494140625, -0.7019119262695312, -0.6747589111328125, -0.6476058959960938, -0.620452880859375, -0.5932998657226562, -0.5661468505859375, -0.5389938354492188, -0.5118408203125, -0.48468780517578125, -0.4575347900390625, -0.43038177490234375, -0.403228759765625, -0.37607574462890625, -0.3489227294921875, -0.32176971435546875, -0.29461669921875, -0.26746368408203125, -0.2403106689453125, -0.21315765380859375, -0.186004638671875, -0.15885162353515625, -0.1316986083984375, -0.10454559326171875, -0.077392578125, -0.05023956298828125, -0.0230865478515625, 0.00406646728515625, 0.031219482421875, 0.05837249755859375, 0.0855255126953125, 0.11267852783203125, 0.13983154296875, 0.16698455810546875, 0.1941375732421875, 0.22129058837890625, 0.248443603515625, 0.27559661865234375, 0.3027496337890625, 0.32990264892578125, 0.3570556640625, 0.38420867919921875, 0.4113616943359375, 0.43851470947265625, 0.465667724609375, 0.49282073974609375, 0.5199737548828125, 0.5471267700195312, 0.57427978515625, 0.6014328002929688, 0.6285858154296875, 0.6557388305664062, 0.682891845703125, 0.7100448608398438, 0.7371978759765625, 0.7643508911132812, 0.79150390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 13.0, 24.0, 58.0, 124.0, 259.0, 247.0, 143.0, 58.0, 28.0, 15.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.249243885278702e-05, -8.765049278736115e-05, -8.280854672193527e-05, -7.79666006565094e-05, -7.312465459108353e-05, -6.828270852565765e-05, -6.344076246023178e-05, -5.859881639480591e-05, -5.3756870329380035e-05, -4.891492426395416e-05, -4.407297819852829e-05, -3.923103213310242e-05, -3.4389086067676544e-05, -2.954714000225067e-05, -2.47051939368248e-05, -1.9863247871398926e-05, -1.5021301805973053e-05, -1.017935574054718e-05, -5.337409675121307e-06, -4.954636096954346e-07, 4.346482455730438e-06, 9.188428521156311e-06, 1.4030374586582184e-05, 1.8872320652008057e-05, 2.371426671743393e-05, 2.8556212782859802e-05, 3.3398158848285675e-05, 3.824010491371155e-05, 4.308205097913742e-05, 4.7923997044563293e-05, 5.2765943109989166e-05, 5.760788917541504e-05, 6.244983524084091e-05, 6.729178130626678e-05, 7.213372737169266e-05, 7.697567343711853e-05, 8.18176195025444e-05, 8.665956556797028e-05, 9.150151163339615e-05, 9.634345769882202e-05, 0.0001011854037642479, 0.00010602734982967377, 0.00011086929589509964, 0.00011571124196052551, 0.00012055318802595139, 0.00012539513409137726, 0.00013023708015680313, 0.000135079026222229, 0.00013992097228765488, 0.00014476291835308075, 0.00014960486441850662, 0.0001544468104839325, 0.00015928875654935837, 0.00016413070261478424, 0.0001689726486802101, 0.00017381459474563599, 0.00017865654081106186, 0.00018349848687648773, 0.0001883404329419136, 0.00019318237900733948, 0.00019802432507276535, 0.00020286627113819122, 0.0002077082172036171, 0.00021255016326904297]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 16.0, 21.0, 22.0, 31.0, 51.0, 77.0, 132.0, 209.0, 415.0, 727.0, 1610.0, 4331.0, 26443.0, 823529.0, 176325.0, 9458.0, 2589.0, 1141.0, 599.0, 329.0, 181.0, 113.0, 61.0, 50.0, 25.0, 18.0, 14.0, 14.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.884765625, -0.85504150390625, -0.8253173828125, -0.79559326171875, -0.765869140625, -0.73614501953125, -0.7064208984375, -0.67669677734375, -0.64697265625, -0.61724853515625, -0.5875244140625, -0.55780029296875, -0.528076171875, -0.49835205078125, -0.4686279296875, -0.43890380859375, -0.4091796875, -0.37945556640625, -0.3497314453125, -0.32000732421875, -0.290283203125, -0.26055908203125, -0.2308349609375, -0.20111083984375, -0.17138671875, -0.14166259765625, -0.1119384765625, -0.08221435546875, -0.052490234375, -0.02276611328125, 0.0069580078125, 0.03668212890625, 0.06640625, 0.09613037109375, 0.1258544921875, 0.15557861328125, 0.185302734375, 0.21502685546875, 0.2447509765625, 0.27447509765625, 0.30419921875, 0.33392333984375, 0.3636474609375, 0.39337158203125, 0.423095703125, 0.45281982421875, 0.4825439453125, 0.51226806640625, 0.5419921875, 0.57171630859375, 0.6014404296875, 0.63116455078125, 0.660888671875, 0.69061279296875, 0.7203369140625, 0.75006103515625, 0.77978515625, 0.80950927734375, 0.8392333984375, 0.86895751953125, 0.898681640625, 0.92840576171875, 0.9581298828125, 0.98785400390625, 1.017578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 8.0, 13.0, 15.0, 32.0, 94.0, 213.0, 281.0, 176.0, 88.0, 34.0, 15.0, 8.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85400390625, -0.8074569702148438, -0.7609100341796875, -0.7143630981445312, -0.667816162109375, -0.6212692260742188, -0.5747222900390625, -0.5281753540039062, -0.48162841796875, -0.43508148193359375, -0.3885345458984375, -0.34198760986328125, -0.295440673828125, -0.24889373779296875, -0.2023468017578125, -0.15579986572265625, -0.1092529296875, -0.06270599365234375, -0.0161590576171875, 0.03038787841796875, 0.076934814453125, 0.12348175048828125, 0.1700286865234375, 0.21657562255859375, 0.26312255859375, 0.30966949462890625, 0.3562164306640625, 0.40276336669921875, 0.449310302734375, 0.49585723876953125, 0.5424041748046875, 0.5889511108398438, 0.635498046875, 0.6820449829101562, 0.7285919189453125, 0.7751388549804688, 0.821685791015625, 0.8682327270507812, 0.9147796630859375, 0.9613265991210938, 1.00787353515625, 1.0544204711914062, 1.1009674072265625, 1.1475143432617188, 1.194061279296875, 1.2406082153320312, 1.2871551513671875, 1.3337020874023438, 1.3802490234375, 1.4267959594726562, 1.4733428955078125, 1.5198898315429688, 1.566436767578125, 1.6129837036132812, 1.6595306396484375, 1.7060775756835938, 1.75262451171875, 1.7991714477539062, 1.8457183837890625, 1.8922653198242188, 1.938812255859375, 1.9853591918945312, 2.0319061279296875, 2.0784530639648438, 2.125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 19.0, 45.0, 88.0, 215.0, 259.0, 172.0, 112.0, 47.0, 10.0, 13.0, 9.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.22579574584961, -17.72553062438965, -17.225263595581055, -16.724998474121094, -16.224733352661133, -15.724466323852539, -15.224201202392578, -14.7239351272583, -14.223669052124023, -13.723402976989746, -13.223137855529785, -12.722871780395508, -12.22260570526123, -11.722339630126953, -11.222074508666992, -10.721808433532715, -10.221543312072754, -9.721277236938477, -9.221012115478516, -8.720746040344238, -8.220479965209961, -7.720214366912842, -7.219948768615723, -6.719682693481445, -6.219417095184326, -5.719151496887207, -5.21888542175293, -4.7186198234558105, -4.218354225158691, -3.718088150024414, -3.217822551727295, -2.7175567150115967, -2.2172908782958984, -1.7170250415802002, -1.2167593240737915, -0.7164936065673828, -0.21622776985168457, 0.28403806686401367, 0.7843036651611328, 1.284569501876831, 1.7848353385925293, 2.2851011753082275, 2.785367012023926, 3.285632610321045, 3.785898447036743, 4.286164283752441, 4.7864298820495605, 5.28669548034668, 5.786961555480957, 6.287227153778076, 6.7874932289123535, 7.287758827209473, 7.78802490234375, 8.288290023803711, 8.788556098937988, 9.288822174072266, 9.789087295532227, 10.289353370666504, 10.789618492126465, 11.289884567260742, 11.79015064239502, 12.290416717529297, 12.790681838989258, 13.290947914123535, 13.791213989257812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 10.0, 10.0, 10.0, 14.0, 10.0, 11.0, 18.0, 20.0, 28.0, 29.0, 36.0, 28.0, 37.0, 55.0, 51.0, 51.0, 40.0, 33.0, 51.0, 38.0, 37.0, 44.0, 47.0, 38.0, 30.0, 26.0, 29.0, 34.0, 16.0, 26.0, 20.0, 16.0, 17.0, 6.0, 5.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0], "bins": [-10.728023529052734, -10.451824188232422, -10.17562484741211, -9.899425506591797, -9.6232271194458, -9.347027778625488, -9.070828437805176, -8.794629096984863, -8.51842975616455, -8.242230415344238, -7.966031551361084, -7.6898322105407715, -7.413632869720459, -7.137434005737305, -6.861234664916992, -6.58503532409668, -6.308836460113525, -6.032637119293213, -5.756438255310059, -5.480238914489746, -5.204039573669434, -4.927840232849121, -4.651641368865967, -4.375442028045654, -4.0992431640625, -3.8230440616607666, -3.546844720840454, -3.2706456184387207, -2.994446277618408, -2.718247175216675, -2.4420480728149414, -2.165848731994629, -1.8896493911743164, -1.6134501695632935, -1.3372509479522705, -1.061051845550537, -0.7848526239395142, -0.5086534023284912, -0.2324542999267578, 0.04374492168426514, 0.3199441432952881, 0.596143364906311, 0.8723425269126892, 1.1485416889190674, 1.4247409105300903, 1.7009401321411133, 1.9771392345428467, 2.25333833694458, 2.5295376777648926, 2.805736780166626, 3.0819361209869385, 3.358135223388672, 3.6343345642089844, 3.9105336666107178, 4.186732769012451, 4.462932109832764, 4.739130973815918, 5.0153303146362305, 5.291529178619385, 5.567728519439697, 5.84392786026001, 6.120126724243164, 6.396326065063477, 6.672525405883789, 6.948724746704102]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 12.0, 14.0, 12.0, 20.0, 22.0, 36.0, 42.0, 48.0, 54.0, 83.0, 97.0, 137.0, 141.0, 195.0, 297.0, 425.0, 669.0, 1185.0, 2582.0, 14315.0, 4146562.0, 20518.0, 3103.0, 1244.0, 710.0, 431.0, 345.0, 239.0, 161.0, 102.0, 106.0, 83.0, 72.0, 41.0, 34.0, 27.0, 21.0, 25.0, 7.0, 10.0, 13.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.52734375, -2.4542236328125, -2.381103515625, -2.3079833984375, -2.23486328125, -2.1617431640625, -2.088623046875, -2.0155029296875, -1.9423828125, -1.8692626953125, -1.796142578125, -1.7230224609375, -1.64990234375, -1.5767822265625, -1.503662109375, -1.4305419921875, -1.357421875, -1.2843017578125, -1.211181640625, -1.1380615234375, -1.06494140625, -0.9918212890625, -0.918701171875, -0.8455810546875, -0.7724609375, -0.6993408203125, -0.626220703125, -0.5531005859375, -0.47998046875, -0.4068603515625, -0.333740234375, -0.2606201171875, -0.1875, -0.1143798828125, -0.041259765625, 0.0318603515625, 0.10498046875, 0.1781005859375, 0.251220703125, 0.3243408203125, 0.3974609375, 0.4705810546875, 0.543701171875, 0.6168212890625, 0.68994140625, 0.7630615234375, 0.836181640625, 0.9093017578125, 0.982421875, 1.0555419921875, 1.128662109375, 1.2017822265625, 1.27490234375, 1.3480224609375, 1.421142578125, 1.4942626953125, 1.5673828125, 1.6405029296875, 1.713623046875, 1.7867431640625, 1.85986328125, 1.9329833984375, 2.006103515625, 2.0792236328125, 2.15234375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 13.0, 14.0, 15.0, 20.0, 14.0, 23.0, 21.0, 33.0, 36.0, 27.0, 38.0, 42.0, 45.0, 44.0, 51.0, 39.0, 41.0, 42.0, 53.0, 23.0, 44.0, 24.0, 33.0, 32.0, 30.0, 21.0, 29.0, 18.0, 20.0, 16.0, 9.0, 9.0, 10.0, 7.0, 5.0, 6.0, 3.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.431640625, -0.4192352294921875, -0.406829833984375, -0.3944244384765625, -0.38201904296875, -0.3696136474609375, -0.357208251953125, -0.3448028564453125, -0.3323974609375, -0.3199920654296875, -0.307586669921875, -0.2951812744140625, -0.28277587890625, -0.2703704833984375, -0.257965087890625, -0.2455596923828125, -0.233154296875, -0.2207489013671875, -0.208343505859375, -0.1959381103515625, -0.18353271484375, -0.1711273193359375, -0.158721923828125, -0.1463165283203125, -0.1339111328125, -0.1215057373046875, -0.109100341796875, -0.0966949462890625, -0.08428955078125, -0.0718841552734375, -0.059478759765625, -0.0470733642578125, -0.03466796875, -0.0222625732421875, -0.009857177734375, 0.0025482177734375, 0.01495361328125, 0.0273590087890625, 0.039764404296875, 0.0521697998046875, 0.0645751953125, 0.0769805908203125, 0.089385986328125, 0.1017913818359375, 0.11419677734375, 0.1266021728515625, 0.139007568359375, 0.1514129638671875, 0.163818359375, 0.1762237548828125, 0.188629150390625, 0.2010345458984375, 0.21343994140625, 0.2258453369140625, 0.238250732421875, 0.2506561279296875, 0.2630615234375, 0.2754669189453125, 0.287872314453125, 0.3002777099609375, 0.31268310546875, 0.3250885009765625, 0.337493896484375, 0.3498992919921875, 0.3623046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 7.0, 11.0, 13.0, 10.0, 15.0, 20.0, 32.0, 34.0, 53.0, 60.0, 107.0, 120.0, 142.0, 211.0, 279.0, 377.0, 561.0, 828.0, 1255.0, 2232.0, 5159.0, 17769.0, 4053889.0, 92173.0, 10007.0, 3560.0, 1786.0, 1064.0, 734.0, 453.0, 339.0, 254.0, 181.0, 148.0, 104.0, 67.0, 62.0, 39.0, 39.0, 23.0, 18.0, 10.0, 13.0, 11.0, 12.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.857421875, -1.7990264892578125, -1.740631103515625, -1.6822357177734375, -1.62384033203125, -1.5654449462890625, -1.507049560546875, -1.4486541748046875, -1.3902587890625, -1.3318634033203125, -1.273468017578125, -1.2150726318359375, -1.15667724609375, -1.0982818603515625, -1.039886474609375, -0.9814910888671875, -0.923095703125, -0.8647003173828125, -0.806304931640625, -0.7479095458984375, -0.68951416015625, -0.6311187744140625, -0.572723388671875, -0.5143280029296875, -0.4559326171875, -0.3975372314453125, -0.339141845703125, -0.2807464599609375, -0.22235107421875, -0.1639556884765625, -0.105560302734375, -0.0471649169921875, 0.01123046875, 0.0696258544921875, 0.128021240234375, 0.1864166259765625, 0.24481201171875, 0.3032073974609375, 0.361602783203125, 0.4199981689453125, 0.4783935546875, 0.5367889404296875, 0.595184326171875, 0.6535797119140625, 0.71197509765625, 0.7703704833984375, 0.828765869140625, 0.8871612548828125, 0.945556640625, 1.0039520263671875, 1.062347412109375, 1.1207427978515625, 1.17913818359375, 1.2375335693359375, 1.295928955078125, 1.3543243408203125, 1.4127197265625, 1.4711151123046875, 1.529510498046875, 1.5879058837890625, 1.64630126953125, 1.7046966552734375, 1.763092041015625, 1.8214874267578125, 1.8798828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 22.0, 141.0, 3818.0, 41.0, 16.0, 12.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7828445434570312, -0.7585601806640625, -0.7342758178710938, -0.709991455078125, -0.6857070922851562, -0.6614227294921875, -0.6371383666992188, -0.61285400390625, -0.5885696411132812, -0.5642852783203125, -0.5400009155273438, -0.515716552734375, -0.49143218994140625, -0.4671478271484375, -0.44286346435546875, -0.4185791015625, -0.39429473876953125, -0.3700103759765625, -0.34572601318359375, -0.321441650390625, -0.29715728759765625, -0.2728729248046875, -0.24858856201171875, -0.22430419921875, -0.20001983642578125, -0.1757354736328125, -0.15145111083984375, -0.127166748046875, -0.10288238525390625, -0.0785980224609375, -0.05431365966796875, -0.030029296875, -0.00574493408203125, 0.0185394287109375, 0.04282379150390625, 0.067108154296875, 0.09139251708984375, 0.1156768798828125, 0.13996124267578125, 0.16424560546875, 0.18852996826171875, 0.2128143310546875, 0.23709869384765625, 0.261383056640625, 0.28566741943359375, 0.3099517822265625, 0.33423614501953125, 0.3585205078125, 0.38280487060546875, 0.4070892333984375, 0.43137359619140625, 0.455657958984375, 0.47994232177734375, 0.5042266845703125, 0.5285110473632812, 0.55279541015625, 0.5770797729492188, 0.6013641357421875, 0.6256484985351562, 0.649932861328125, 0.6742172241210938, 0.6985015869140625, 0.7227859497070312, 0.7470703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 6.0, 23.0, 18.0, 38.0, 64.0, 81.0, 121.0, 162.0, 160.0, 126.0, 73.0, 51.0, 25.0, 14.0, 10.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1238667964935303, -1.0766856670379639, -1.029504418373108, -0.9823232889175415, -0.9351420998573303, -0.8879609107971191, -0.8407797813415527, -0.7935985922813416, -0.7464174032211304, -0.6992362141609192, -0.652055025100708, -0.6048738956451416, -0.5576927065849304, -0.5105115175247192, -0.46333035826683044, -0.41614919900894165, -0.36896800994873047, -0.3217868208885193, -0.2746056616306305, -0.2274244874715805, -0.18024331331253052, -0.13306213915348053, -0.08588096499443054, -0.03869980573654175, 0.008481383323669434, 0.05566255748271942, 0.10284373164176941, 0.1500249058008194, 0.19720607995986938, 0.24438725411891937, 0.29156842827796936, 0.33874958753585815, 0.3859308958053589, 0.43311208486557007, 0.48029324412345886, 0.5274744033813477, 0.5746555924415588, 0.62183678150177, 0.6690179109573364, 0.7161991000175476, 0.7633802890777588, 0.81056147813797, 0.8577426671981812, 0.9049237966537476, 0.9521049857139587, 0.9992861747741699, 1.0464673042297363, 1.0936484336853027, 1.1408296823501587, 1.188010811805725, 1.235192060470581, 1.2823731899261475, 1.3295543193817139, 1.3767355680465698, 1.4239166975021362, 1.4710979461669922, 1.5182790756225586, 1.565460205078125, 1.612641453742981, 1.6598225831985474, 1.7070038318634033, 1.7541849613189697, 1.8013660907745361, 1.8485472202301025, 1.8957284688949585]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 6.0, 5.0, 8.0, 12.0, 10.0, 21.0, 19.0, 21.0, 22.0, 30.0, 43.0, 45.0, 39.0, 38.0, 57.0, 48.0, 51.0, 62.0, 51.0, 42.0, 47.0, 39.0, 33.0, 43.0, 33.0, 35.0, 25.0, 27.0, 22.0, 16.0, 11.0, 10.0, 12.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0886290073394775, -1.0520042181015015, -1.0153794288635254, -0.9787546396255493, -0.9421297907829285, -0.9055050015449524, -0.8688802123069763, -0.8322553634643555, -0.7956305742263794, -0.7590057849884033, -0.7223809957504272, -0.6857562065124512, -0.6491313576698303, -0.6125065684318542, -0.5758817791938782, -0.5392569303512573, -0.502632200717926, -0.46600741147994995, -0.4293825924396515, -0.3927578032016754, -0.35613298416137695, -0.3195081949234009, -0.2828834056854248, -0.24625858664512634, -0.20963379740715027, -0.173008993268013, -0.13638418912887573, -0.09975939989089966, -0.06313459575176239, -0.026509791612625122, 0.010114997625350952, 0.046739816665649414, 0.08336460590362549, 0.11998941004276276, 0.15661421418190002, 0.1932390034198761, 0.22986380755901337, 0.26648861169815063, 0.3031134009361267, 0.33973821997642517, 0.37636300921440125, 0.4129877984523773, 0.4496126174926758, 0.48623740673065186, 0.5228621959686279, 0.559486985206604, 0.5961117744445801, 0.6327366232872009, 0.669361412525177, 0.7059862017631531, 0.7426109910011292, 0.77923583984375, 0.8158606290817261, 0.8524854183197021, 0.8891102075576782, 0.9257349967956543, 0.9623597860336304, 0.9989845752716064, 1.0356093645095825, 1.0722341537475586, 1.1088589429855347, 1.1454837322235107, 1.1821086406707764, 1.2187334299087524, 1.2553582191467285]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 10.0, 4.0, 12.0, 8.0, 18.0, 30.0, 32.0, 63.0, 84.0, 102.0, 171.0, 203.0, 369.0, 525.0, 864.0, 1235.0, 1960.0, 3221.0, 5181.0, 8589.0, 14497.0, 25269.0, 46626.0, 92741.0, 202872.0, 298189.0, 170851.0, 78779.0, 40597.0, 22292.0, 12845.0, 7558.0, 4728.0, 2787.0, 1804.0, 1145.0, 756.0, 509.0, 334.0, 211.0, 145.0, 100.0, 72.0, 54.0, 31.0, 24.0, 20.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 3.0], "bins": [-0.70458984375, -0.6834869384765625, -0.662384033203125, -0.6412811279296875, -0.62017822265625, -0.5990753173828125, -0.577972412109375, -0.5568695068359375, -0.5357666015625, -0.5146636962890625, -0.493560791015625, -0.4724578857421875, -0.45135498046875, -0.4302520751953125, -0.409149169921875, -0.3880462646484375, -0.366943359375, -0.3458404541015625, -0.324737548828125, -0.3036346435546875, -0.28253173828125, -0.2614288330078125, -0.240325927734375, -0.2192230224609375, -0.1981201171875, -0.1770172119140625, -0.155914306640625, -0.1348114013671875, -0.11370849609375, -0.0926055908203125, -0.071502685546875, -0.0503997802734375, -0.029296875, -0.0081939697265625, 0.012908935546875, 0.0340118408203125, 0.05511474609375, 0.0762176513671875, 0.097320556640625, 0.1184234619140625, 0.1395263671875, 0.1606292724609375, 0.181732177734375, 0.2028350830078125, 0.22393798828125, 0.2450408935546875, 0.266143798828125, 0.2872467041015625, 0.308349609375, 0.3294525146484375, 0.350555419921875, 0.3716583251953125, 0.39276123046875, 0.4138641357421875, 0.434967041015625, 0.4560699462890625, 0.4771728515625, 0.4982757568359375, 0.519378662109375, 0.5404815673828125, 0.56158447265625, 0.5826873779296875, 0.603790283203125, 0.6248931884765625, 0.64599609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 9.0, 7.0, 5.0, 7.0, 9.0, 14.0, 16.0, 12.0, 17.0, 20.0, 15.0, 35.0, 35.0, 30.0, 31.0, 45.0, 37.0, 52.0, 44.0, 55.0, 50.0, 34.0, 32.0, 44.0, 40.0, 34.0, 36.0, 24.0, 28.0, 30.0, 23.0, 17.0, 21.0, 20.0, 16.0, 8.0, 12.0, 9.0, 5.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5107421875, -0.495849609375, -0.48095703125, -0.466064453125, -0.451171875, -0.436279296875, -0.42138671875, -0.406494140625, -0.3916015625, -0.376708984375, -0.36181640625, -0.346923828125, -0.33203125, -0.317138671875, -0.30224609375, -0.287353515625, -0.2724609375, -0.257568359375, -0.24267578125, -0.227783203125, -0.212890625, -0.197998046875, -0.18310546875, -0.168212890625, -0.1533203125, -0.138427734375, -0.12353515625, -0.108642578125, -0.09375, -0.078857421875, -0.06396484375, -0.049072265625, -0.0341796875, -0.019287109375, -0.00439453125, 0.010498046875, 0.025390625, 0.040283203125, 0.05517578125, 0.070068359375, 0.0849609375, 0.099853515625, 0.11474609375, 0.129638671875, 0.14453125, 0.159423828125, 0.17431640625, 0.189208984375, 0.2041015625, 0.218994140625, 0.23388671875, 0.248779296875, 0.263671875, 0.278564453125, 0.29345703125, 0.308349609375, 0.3232421875, 0.338134765625, 0.35302734375, 0.367919921875, 0.3828125, 0.397705078125, 0.41259765625, 0.427490234375, 0.4423828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 13.0, 13.0, 20.0, 35.0, 37.0, 39.0, 58.0, 125.0, 212.0, 409.0, 917.0, 2196.0, 6318.0, 21465.0, 91138.0, 546609.0, 304387.0, 53108.0, 14038.0, 4383.0, 1544.0, 684.0, 318.0, 174.0, 82.0, 61.0, 47.0, 26.0, 28.0, 18.0, 8.0, 9.0, 7.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.001953125, -1.946075439453125, -1.89019775390625, -1.834320068359375, -1.7784423828125, -1.722564697265625, -1.66668701171875, -1.610809326171875, -1.554931640625, -1.499053955078125, -1.44317626953125, -1.387298583984375, -1.3314208984375, -1.275543212890625, -1.21966552734375, -1.163787841796875, -1.10791015625, -1.052032470703125, -0.99615478515625, -0.940277099609375, -0.8843994140625, -0.828521728515625, -0.77264404296875, -0.716766357421875, -0.660888671875, -0.605010986328125, -0.54913330078125, -0.493255615234375, -0.4373779296875, -0.381500244140625, -0.32562255859375, -0.269744873046875, -0.2138671875, -0.157989501953125, -0.10211181640625, -0.046234130859375, 0.0096435546875, 0.065521240234375, 0.12139892578125, 0.177276611328125, 0.233154296875, 0.289031982421875, 0.34490966796875, 0.400787353515625, 0.4566650390625, 0.512542724609375, 0.56842041015625, 0.624298095703125, 0.68017578125, 0.736053466796875, 0.79193115234375, 0.847808837890625, 0.9036865234375, 0.959564208984375, 1.01544189453125, 1.071319580078125, 1.127197265625, 1.183074951171875, 1.23895263671875, 1.294830322265625, 1.3507080078125, 1.406585693359375, 1.46246337890625, 1.518341064453125, 1.57421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 4.0, 9.0, 11.0, 18.0, 17.0, 23.0, 23.0, 29.0, 23.0, 30.0, 47.0, 40.0, 49.0, 39.0, 57.0, 45.0, 45.0, 31.0, 52.0, 48.0, 54.0, 46.0, 41.0, 37.0, 33.0, 23.0, 19.0, 16.0, 18.0, 12.0, 9.0, 13.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.103515625, -3.010284423828125, -2.91705322265625, -2.823822021484375, -2.7305908203125, -2.637359619140625, -2.54412841796875, -2.450897216796875, -2.357666015625, -2.264434814453125, -2.17120361328125, -2.077972412109375, -1.9847412109375, -1.891510009765625, -1.79827880859375, -1.705047607421875, -1.61181640625, -1.518585205078125, -1.42535400390625, -1.332122802734375, -1.2388916015625, -1.145660400390625, -1.05242919921875, -0.959197998046875, -0.865966796875, -0.772735595703125, -0.67950439453125, -0.586273193359375, -0.4930419921875, -0.399810791015625, -0.30657958984375, -0.213348388671875, -0.1201171875, -0.026885986328125, 0.06634521484375, 0.159576416015625, 0.2528076171875, 0.346038818359375, 0.43927001953125, 0.532501220703125, 0.625732421875, 0.718963623046875, 0.81219482421875, 0.905426025390625, 0.9986572265625, 1.091888427734375, 1.18511962890625, 1.278350830078125, 1.37158203125, 1.464813232421875, 1.55804443359375, 1.651275634765625, 1.7445068359375, 1.837738037109375, 1.93096923828125, 2.024200439453125, 2.117431640625, 2.210662841796875, 2.30389404296875, 2.397125244140625, 2.4903564453125, 2.583587646484375, 2.67681884765625, 2.770050048828125, 2.86328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 12.0, 14.0, 19.0, 46.0, 85.0, 265.0, 720.0, 2837.0, 24508.0, 737815.0, 268202.0, 11408.0, 1827.0, 451.0, 155.0, 78.0, 41.0, 21.0, 14.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8729629516601562, -0.8391876220703125, -0.8054122924804688, -0.771636962890625, -0.7378616333007812, -0.7040863037109375, -0.6703109741210938, -0.63653564453125, -0.6027603149414062, -0.5689849853515625, -0.5352096557617188, -0.501434326171875, -0.46765899658203125, -0.4338836669921875, -0.40010833740234375, -0.3663330078125, -0.33255767822265625, -0.2987823486328125, -0.26500701904296875, -0.231231689453125, -0.19745635986328125, -0.1636810302734375, -0.12990570068359375, -0.09613037109375, -0.06235504150390625, -0.0285797119140625, 0.00519561767578125, 0.038970947265625, 0.07274627685546875, 0.1065216064453125, 0.14029693603515625, 0.174072265625, 0.20784759521484375, 0.2416229248046875, 0.27539825439453125, 0.309173583984375, 0.34294891357421875, 0.3767242431640625, 0.41049957275390625, 0.44427490234375, 0.47805023193359375, 0.5118255615234375, 0.5456008911132812, 0.579376220703125, 0.6131515502929688, 0.6469268798828125, 0.6807022094726562, 0.7144775390625, 0.7482528686523438, 0.7820281982421875, 0.8158035278320312, 0.849578857421875, 0.8833541870117188, 0.9171295166015625, 0.9509048461914062, 0.98468017578125, 1.0184555053710938, 1.0522308349609375, 1.0860061645507812, 1.119781494140625, 1.1535568237304688, 1.1873321533203125, 1.2211074829101562, 1.2548828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 6.0, 9.0, 26.0, 26.0, 63.0, 95.0, 117.0, 146.0, 155.0, 118.0, 89.0, 57.0, 33.0, 24.0, 13.0, 9.0, 8.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010907649993896484, -0.0001053251326084137, -0.00010157376527786255, -9.78223979473114e-05, -9.407103061676025e-05, -9.03196632862091e-05, -8.656829595565796e-05, -8.281692862510681e-05, -7.906556129455566e-05, -7.531419396400452e-05, -7.156282663345337e-05, -6.781145930290222e-05, -6.406009197235107e-05, -6.030872464179993e-05, -5.655735731124878e-05, -5.280598998069763e-05, -4.9054622650146484e-05, -4.530325531959534e-05, -4.155188798904419e-05, -3.780052065849304e-05, -3.4049153327941895e-05, -3.0297785997390747e-05, -2.65464186668396e-05, -2.2795051336288452e-05, -1.9043684005737305e-05, -1.5292316675186157e-05, -1.154094934463501e-05, -7.789582014083862e-06, -4.038214683532715e-06, -2.868473529815674e-07, 3.46451997756958e-06, 7.2158873081207275e-06, 1.0967254638671875e-05, 1.4718621969223022e-05, 1.846998929977417e-05, 2.2221356630325317e-05, 2.5972723960876465e-05, 2.9724091291427612e-05, 3.347545862197876e-05, 3.722682595252991e-05, 4.0978193283081055e-05, 4.47295606136322e-05, 4.848092794418335e-05, 5.22322952747345e-05, 5.5983662605285645e-05, 5.973502993583679e-05, 6.348639726638794e-05, 6.723776459693909e-05, 7.098913192749023e-05, 7.474049925804138e-05, 7.849186658859253e-05, 8.224323391914368e-05, 8.599460124969482e-05, 8.974596858024597e-05, 9.349733591079712e-05, 9.724870324134827e-05, 0.00010100007057189941, 0.00010475143790245056, 0.00010850280523300171, 0.00011225417256355286, 0.000116005539894104, 0.00011975690722465515, 0.0001235082745552063, 0.00012725964188575745, 0.0001310110092163086]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 10.0, 7.0, 9.0, 27.0, 43.0, 54.0, 122.0, 304.0, 904.0, 4352.0, 37119.0, 608022.0, 370969.0, 22481.0, 2976.0, 685.0, 231.0, 101.0, 57.0, 36.0, 23.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43053436279296875, -0.4064788818359375, -0.38242340087890625, -0.358367919921875, -0.33431243896484375, -0.3102569580078125, -0.28620147705078125, -0.26214599609375, -0.23809051513671875, -0.2140350341796875, -0.18997955322265625, -0.165924072265625, -0.14186859130859375, -0.1178131103515625, -0.09375762939453125, -0.0697021484375, -0.04564666748046875, -0.0215911865234375, 0.00246429443359375, 0.026519775390625, 0.05057525634765625, 0.0746307373046875, 0.09868621826171875, 0.12274169921875, 0.14679718017578125, 0.1708526611328125, 0.19490814208984375, 0.218963623046875, 0.24301910400390625, 0.2670745849609375, 0.29113006591796875, 0.315185546875, 0.33924102783203125, 0.3632965087890625, 0.38735198974609375, 0.411407470703125, 0.43546295166015625, 0.4595184326171875, 0.48357391357421875, 0.50762939453125, 0.5316848754882812, 0.5557403564453125, 0.5797958374023438, 0.603851318359375, 0.6279067993164062, 0.6519622802734375, 0.6760177612304688, 0.7000732421875, 0.7241287231445312, 0.7481842041015625, 0.7722396850585938, 0.796295166015625, 0.8203506469726562, 0.8444061279296875, 0.8684616088867188, 0.89251708984375, 0.9165725708007812, 0.9406280517578125, 0.9646835327148438, 0.988739013671875, 1.0127944946289062, 1.0368499755859375, 1.0609054565429688, 1.0849609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 10.0, 8.0, 22.0, 26.0, 38.0, 43.0, 50.0, 73.0, 89.0, 91.0, 105.0, 80.0, 97.0, 59.0, 44.0, 38.0, 39.0, 19.0, 10.0, 9.0, 9.0, 9.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.462646484375, -0.4397773742675781, -0.41690826416015625, -0.3940391540527344, -0.3711700439453125, -0.3483009338378906, -0.32543182373046875, -0.3025627136230469, -0.279693603515625, -0.2568244934082031, -0.23395538330078125, -0.21108627319335938, -0.1882171630859375, -0.16534805297851562, -0.14247894287109375, -0.11960983276367188, -0.09674072265625, -0.07387161254882812, -0.05100250244140625, -0.028133392333984375, -0.0052642822265625, 0.017604827880859375, 0.04047393798828125, 0.06334304809570312, 0.086212158203125, 0.10908126831054688, 0.13195037841796875, 0.15481948852539062, 0.1776885986328125, 0.20055770874023438, 0.22342681884765625, 0.24629592895507812, 0.2691650390625, 0.2920341491699219, 0.31490325927734375, 0.3377723693847656, 0.3606414794921875, 0.3835105895996094, 0.40637969970703125, 0.4292488098144531, 0.452117919921875, 0.4749870300292969, 0.49785614013671875, 0.5207252502441406, 0.5435943603515625, 0.5664634704589844, 0.5893325805664062, 0.6122016906738281, 0.63507080078125, 0.6579399108886719, 0.6808090209960938, 0.7036781311035156, 0.7265472412109375, 0.7494163513183594, 0.7722854614257812, 0.7951545715332031, 0.818023681640625, 0.8408927917480469, 0.8637619018554688, 0.8866310119628906, 0.9095001220703125, 0.9323692321777344, 0.9552383422851562, 0.9781074523925781, 1.0009765625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 10.0, 18.0, 34.0, 65.0, 179.0, 327.0, 221.0, 77.0, 49.0, 18.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.836753845214844, -6.047939777374268, -5.259125709533691, -4.470311164855957, -3.68149733543396, -2.892683267593384, -2.1038689613342285, -1.3150548934936523, -0.5262408256530762, 0.2625733017921448, 1.0513874292373657, 1.8402016162872314, 2.6290156841278076, 3.417829751968384, 4.206644058227539, 4.995458126068115, 5.784272193908691, 6.573086261749268, 7.361900329589844, 8.150714874267578, 8.939528465270996, 9.72834300994873, 10.517156600952148, 11.305971145629883, 12.094785690307617, 12.883600234985352, 13.67241382598877, 14.461228370666504, 15.250041961669922, 16.038856506347656, 16.82767105102539, 17.616485595703125, 18.405298233032227, 19.19411277770996, 19.982927322387695, 20.771739959716797, 21.56055450439453, 22.349369049072266, 23.13818359375, 23.926998138427734, 24.715810775756836, 25.50462532043457, 26.293439865112305, 27.082252502441406, 27.87106704711914, 28.659881591796875, 29.44869613647461, 30.237510681152344, 31.026325225830078, 31.815139770507812, 32.60395431518555, 33.39276885986328, 34.181583404541016, 34.970394134521484, 35.75920867919922, 36.54802322387695, 37.33683776855469, 38.12565231323242, 38.914466857910156, 39.70328140258789, 40.492095947265625, 41.280906677246094, 42.06972122192383, 42.85853576660156, 43.6473503112793]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 9.0, 6.0, 7.0, 11.0, 15.0, 21.0, 18.0, 16.0, 28.0, 30.0, 54.0, 42.0, 36.0, 54.0, 71.0, 65.0, 62.0, 62.0, 56.0, 43.0, 35.0, 44.0, 34.0, 22.0, 20.0, 28.0, 24.0, 18.0, 19.0, 5.0, 11.0, 5.0, 5.0, 11.0, 4.0, 2.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.14488983154297, -15.629015922546387, -15.113142967224121, -14.597269058227539, -14.081395149230957, -13.565521240234375, -13.04964828491211, -12.533774375915527, -12.017900466918945, -11.502026557922363, -10.986153602600098, -10.470279693603516, -9.954405784606934, -9.438531875610352, -8.922658920288086, -8.406785011291504, -7.890912055969238, -7.3750386238098145, -6.859164714813232, -6.343291282653809, -5.827417373657227, -5.311543941497803, -4.795670509338379, -4.279796600341797, -3.763923168182373, -3.24804949760437, -2.732175827026367, -2.2163023948669434, -1.7004287242889404, -1.1845550537109375, -0.6686816215515137, -0.15280795097351074, 0.3630657196044922, 0.8789393305778503, 1.3948129415512085, 1.9106864929199219, 2.426560163497925, 2.9424338340759277, 3.4583072662353516, 3.9741809368133545, 4.490054607391357, 5.005928039550781, 5.521801948547363, 6.037675380706787, 6.553548812866211, 7.069422721862793, 7.585296154022217, 8.10116958618164, 8.617043495178223, 9.132917404174805, 9.64879035949707, 10.164664268493652, 10.680538177490234, 11.1964111328125, 11.712285041809082, 12.228158950805664, 12.74403190612793, 13.259905815124512, 13.775778770446777, 14.29165267944336, 14.807526588439941, 15.323400497436523, 15.839273452758789, 16.355146408081055, 16.871021270751953]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 12.0, 11.0, 16.0, 32.0, 26.0, 36.0, 48.0, 75.0, 110.0, 151.0, 248.0, 346.0, 570.0, 943.0, 1746.0, 3912.0, 11646.0, 264044.0, 3888578.0, 13006.0, 3973.0, 1892.0, 1013.0, 594.0, 407.0, 225.0, 189.0, 112.0, 87.0, 51.0, 34.0, 31.0, 19.0, 19.0, 15.0, 23.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-1.3076171875, -1.2667999267578125, -1.225982666015625, -1.1851654052734375, -1.14434814453125, -1.1035308837890625, -1.062713623046875, -1.0218963623046875, -0.9810791015625, -0.9402618408203125, -0.899444580078125, -0.8586273193359375, -0.81781005859375, -0.7769927978515625, -0.736175537109375, -0.6953582763671875, -0.654541015625, -0.6137237548828125, -0.572906494140625, -0.5320892333984375, -0.49127197265625, -0.4504547119140625, -0.409637451171875, -0.3688201904296875, -0.3280029296875, -0.2871856689453125, -0.246368408203125, -0.2055511474609375, -0.16473388671875, -0.1239166259765625, -0.083099365234375, -0.0422821044921875, -0.00146484375, 0.0393524169921875, 0.080169677734375, 0.1209869384765625, 0.16180419921875, 0.2026214599609375, 0.243438720703125, 0.2842559814453125, 0.3250732421875, 0.3658905029296875, 0.406707763671875, 0.4475250244140625, 0.48834228515625, 0.5291595458984375, 0.569976806640625, 0.6107940673828125, 0.651611328125, 0.6924285888671875, 0.733245849609375, 0.7740631103515625, 0.81488037109375, 0.8556976318359375, 0.896514892578125, 0.9373321533203125, 0.9781494140625, 1.0189666748046875, 1.059783935546875, 1.1006011962890625, 1.14141845703125, 1.1822357177734375, 1.223052978515625, 1.2638702392578125, 1.3046875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 9.0, 11.0, 16.0, 11.0, 12.0, 15.0, 32.0, 21.0, 27.0, 51.0, 37.0, 38.0, 49.0, 56.0, 59.0, 57.0, 66.0, 66.0, 57.0, 47.0, 33.0, 34.0, 39.0, 31.0, 19.0, 20.0, 9.0, 10.0, 20.0, 5.0, 6.0, 7.0, 8.0, 6.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7090606689453125, -0.685211181640625, -0.6613616943359375, -0.63751220703125, -0.6136627197265625, -0.589813232421875, -0.5659637451171875, -0.5421142578125, -0.5182647705078125, -0.494415283203125, -0.4705657958984375, -0.44671630859375, -0.4228668212890625, -0.399017333984375, -0.3751678466796875, -0.351318359375, -0.3274688720703125, -0.303619384765625, -0.2797698974609375, -0.25592041015625, -0.2320709228515625, -0.208221435546875, -0.1843719482421875, -0.1605224609375, -0.1366729736328125, -0.112823486328125, -0.0889739990234375, -0.06512451171875, -0.0412750244140625, -0.017425537109375, 0.0064239501953125, 0.0302734375, 0.0541229248046875, 0.077972412109375, 0.1018218994140625, 0.12567138671875, 0.1495208740234375, 0.173370361328125, 0.1972198486328125, 0.2210693359375, 0.2449188232421875, 0.268768310546875, 0.2926177978515625, 0.31646728515625, 0.3403167724609375, 0.364166259765625, 0.3880157470703125, 0.411865234375, 0.4357147216796875, 0.459564208984375, 0.4834136962890625, 0.50726318359375, 0.5311126708984375, 0.554962158203125, 0.5788116455078125, 0.6026611328125, 0.6265106201171875, 0.650360107421875, 0.6742095947265625, 0.69805908203125, 0.7219085693359375, 0.745758056640625, 0.7696075439453125, 0.79345703125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 10.0, 5.0, 5.0, 7.0, 17.0, 13.0, 23.0, 34.0, 41.0, 45.0, 69.0, 97.0, 130.0, 145.0, 207.0, 319.0, 408.0, 590.0, 1049.0, 1736.0, 3353.0, 8608.0, 36344.0, 4031026.0, 86530.0, 13033.0, 4525.0, 2129.0, 1183.0, 777.0, 530.0, 326.0, 254.0, 194.0, 123.0, 105.0, 77.0, 66.0, 41.0, 33.0, 25.0, 17.0, 10.0, 7.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2587890625, -1.2148895263671875, -1.170989990234375, -1.1270904541015625, -1.08319091796875, -1.0392913818359375, -0.995391845703125, -0.9514923095703125, -0.9075927734375, -0.8636932373046875, -0.819793701171875, -0.7758941650390625, -0.73199462890625, -0.6880950927734375, -0.644195556640625, -0.6002960205078125, -0.556396484375, -0.5124969482421875, -0.468597412109375, -0.4246978759765625, -0.38079833984375, -0.3368988037109375, -0.292999267578125, -0.2490997314453125, -0.2052001953125, -0.1613006591796875, -0.117401123046875, -0.0735015869140625, -0.02960205078125, 0.0142974853515625, 0.058197021484375, 0.1020965576171875, 0.14599609375, 0.1898956298828125, 0.233795166015625, 0.2776947021484375, 0.32159423828125, 0.3654937744140625, 0.409393310546875, 0.4532928466796875, 0.4971923828125, 0.5410919189453125, 0.584991455078125, 0.6288909912109375, 0.67279052734375, 0.7166900634765625, 0.760589599609375, 0.8044891357421875, 0.848388671875, 0.8922882080078125, 0.936187744140625, 0.9800872802734375, 1.02398681640625, 1.0678863525390625, 1.111785888671875, 1.1556854248046875, 1.1995849609375, 1.2434844970703125, 1.287384033203125, 1.3312835693359375, 1.37518310546875, 1.4190826416015625, 1.462982177734375, 1.5068817138671875, 1.55078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 8.0, 20.0, 62.0, 3318.0, 530.0, 58.0, 21.0, 21.0, 9.0, 1.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5976524353027344, -0.5805587768554688, -0.5634651184082031, -0.5463714599609375, -0.5292778015136719, -0.5121841430664062, -0.4950904846191406, -0.477996826171875, -0.4609031677246094, -0.44380950927734375, -0.4267158508300781, -0.4096221923828125, -0.3925285339355469, -0.37543487548828125, -0.3583412170410156, -0.34124755859375, -0.3241539001464844, -0.30706024169921875, -0.2899665832519531, -0.2728729248046875, -0.2557792663574219, -0.23868560791015625, -0.22159194946289062, -0.204498291015625, -0.18740463256835938, -0.17031097412109375, -0.15321731567382812, -0.1361236572265625, -0.11902999877929688, -0.10193634033203125, -0.08484268188476562, -0.0677490234375, -0.050655364990234375, -0.03356170654296875, -0.016468048095703125, 0.0006256103515625, 0.017719268798828125, 0.03481292724609375, 0.051906585693359375, 0.069000244140625, 0.08609390258789062, 0.10318756103515625, 0.12028121948242188, 0.1373748779296875, 0.15446853637695312, 0.17156219482421875, 0.18865585327148438, 0.20574951171875, 0.22284317016601562, 0.23993682861328125, 0.2570304870605469, 0.2741241455078125, 0.2912178039550781, 0.30831146240234375, 0.3254051208496094, 0.342498779296875, 0.3595924377441406, 0.37668609619140625, 0.3937797546386719, 0.4108734130859375, 0.4279670715332031, 0.44506072998046875, 0.4621543884277344, 0.479248046875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 8.0, 33.0, 87.0, 179.0, 280.0, 242.0, 105.0, 42.0, 18.0, 13.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7683079242706299, -1.677186131477356, -1.586064338684082, -1.4949424266815186, -1.4038207530975342, -1.3126988410949707, -1.2215770483016968, -1.1304552555084229, -1.039333462715149, -0.948211669921875, -0.8570898771286011, -0.7659680247306824, -0.6748462319374084, -0.5837244391441345, -0.4926025867462158, -0.4014807939529419, -0.31035900115966797, -0.21923719346523285, -0.12811538577079773, -0.036993563175201416, 0.05412822961807251, 0.14525002241134644, 0.23637187480926514, 0.32749366760253906, 0.418615460395813, 0.5097372531890869, 0.6008590459823608, 0.6919808983802795, 0.7831026911735535, 0.8742244839668274, 0.9653463363647461, 1.05646812915802, 1.147590160369873, 1.238711953163147, 1.329833745956421, 1.4209556579589844, 1.5120773315429688, 1.6031992435455322, 1.6943210363388062, 1.78544282913208, 1.876564621925354, 1.967686414718628, 2.0588083267211914, 2.149930000305176, 2.2410519123077393, 2.3321735858917236, 2.423295497894287, 2.5144171714782715, 2.605539083480835, 2.6966609954833984, 2.787782669067383, 2.8789045810699463, 2.9700262546539307, 3.061148166656494, 3.1522698402404785, 3.243391752243042, 3.3345136642456055, 3.425635576248169, 3.5167572498321533, 3.607879161834717, 3.699000835418701, 3.7901227474212646, 3.881244659423828, 3.9723663330078125, 4.063488006591797]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 9.0, 15.0, 3.0, 12.0, 10.0, 13.0, 15.0, 22.0, 21.0, 40.0, 23.0, 31.0, 41.0, 40.0, 35.0, 54.0, 39.0, 56.0, 55.0, 53.0, 52.0, 38.0, 51.0, 41.0, 31.0, 35.0, 31.0, 22.0, 22.0, 15.0, 16.0, 16.0, 10.0, 10.0, 8.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8254018425941467, -0.7982668876647949, -0.7711318731307983, -0.7439968585968018, -0.71686190366745, -0.6897269487380981, -0.6625919342041016, -0.635456919670105, -0.6083219647407532, -0.5811870098114014, -0.5540519952774048, -0.5269169807434082, -0.4997820258140564, -0.4726470410823822, -0.445512056350708, -0.4183770716190338, -0.3912420868873596, -0.3641071021556854, -0.33697211742401123, -0.30983713269233704, -0.28270214796066284, -0.25556716322898865, -0.22843217849731445, -0.20129719376564026, -0.17416220903396606, -0.14702722430229187, -0.11989223957061768, -0.09275725483894348, -0.06562227010726929, -0.03848728537559509, -0.011352300643920898, 0.015782684087753296, 0.042917728424072266, 0.07005271315574646, 0.09718769788742065, 0.12432268261909485, 0.15145766735076904, 0.17859265208244324, 0.20572763681411743, 0.23286262154579163, 0.2599976062774658, 0.28713259100914, 0.3142675757408142, 0.3414025604724884, 0.3685375452041626, 0.3956725299358368, 0.422807514667511, 0.4499424993991852, 0.4770774841308594, 0.504212498664856, 0.5313474535942078, 0.5584824085235596, 0.5856174230575562, 0.6127524375915527, 0.6398873925209045, 0.6670223474502563, 0.6941573619842529, 0.7212923765182495, 0.7484273314476013, 0.7755622863769531, 0.8026973009109497, 0.8298323154449463, 0.8569672703742981, 0.8841022253036499, 0.9112372398376465]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 6.0, 16.0, 18.0, 29.0, 45.0, 58.0, 63.0, 130.0, 157.0, 195.0, 363.0, 551.0, 836.0, 1379.0, 2377.0, 4430.0, 8048.0, 16741.0, 37775.0, 101033.0, 321511.0, 357503.0, 114955.0, 41939.0, 18208.0, 8847.0, 4687.0, 2511.0, 1451.0, 905.0, 576.0, 378.0, 246.0, 158.0, 117.0, 83.0, 58.0, 42.0, 37.0, 18.0, 16.0, 11.0, 6.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.0625, -1.028289794921875, -0.99407958984375, -0.959869384765625, -0.9256591796875, -0.891448974609375, -0.85723876953125, -0.823028564453125, -0.788818359375, -0.754608154296875, -0.72039794921875, -0.686187744140625, -0.6519775390625, -0.617767333984375, -0.58355712890625, -0.549346923828125, -0.51513671875, -0.480926513671875, -0.44671630859375, -0.412506103515625, -0.3782958984375, -0.344085693359375, -0.30987548828125, -0.275665283203125, -0.241455078125, -0.207244873046875, -0.17303466796875, -0.138824462890625, -0.1046142578125, -0.070404052734375, -0.03619384765625, -0.001983642578125, 0.0322265625, 0.066436767578125, 0.10064697265625, 0.134857177734375, 0.1690673828125, 0.203277587890625, 0.23748779296875, 0.271697998046875, 0.305908203125, 0.340118408203125, 0.37432861328125, 0.408538818359375, 0.4427490234375, 0.476959228515625, 0.51116943359375, 0.545379638671875, 0.57958984375, 0.613800048828125, 0.64801025390625, 0.682220458984375, 0.7164306640625, 0.750640869140625, 0.78485107421875, 0.819061279296875, 0.853271484375, 0.887481689453125, 0.92169189453125, 0.955902099609375, 0.9901123046875, 1.024322509765625, 1.05853271484375, 1.092742919921875, 1.126953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 12.0, 13.0, 7.0, 15.0, 25.0, 23.0, 29.0, 29.0, 36.0, 35.0, 33.0, 49.0, 63.0, 56.0, 51.0, 63.0, 71.0, 50.0, 53.0, 46.0, 28.0, 42.0, 29.0, 14.0, 18.0, 17.0, 11.0, 10.0, 14.0, 9.0, 4.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.763671875, -0.739715576171875, -0.71575927734375, -0.691802978515625, -0.6678466796875, -0.643890380859375, -0.61993408203125, -0.595977783203125, -0.572021484375, -0.548065185546875, -0.52410888671875, -0.500152587890625, -0.4761962890625, -0.452239990234375, -0.42828369140625, -0.404327392578125, -0.38037109375, -0.356414794921875, -0.33245849609375, -0.308502197265625, -0.2845458984375, -0.260589599609375, -0.23663330078125, -0.212677001953125, -0.188720703125, -0.164764404296875, -0.14080810546875, -0.116851806640625, -0.0928955078125, -0.068939208984375, -0.04498291015625, -0.021026611328125, 0.0029296875, 0.026885986328125, 0.05084228515625, 0.074798583984375, 0.0987548828125, 0.122711181640625, 0.14666748046875, 0.170623779296875, 0.194580078125, 0.218536376953125, 0.24249267578125, 0.266448974609375, 0.2904052734375, 0.314361572265625, 0.33831787109375, 0.362274169921875, 0.38623046875, 0.410186767578125, 0.43414306640625, 0.458099365234375, 0.4820556640625, 0.506011962890625, 0.52996826171875, 0.553924560546875, 0.577880859375, 0.601837158203125, 0.62579345703125, 0.649749755859375, 0.6737060546875, 0.697662353515625, 0.72161865234375, 0.745574951171875, 0.76953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 16.0, 38.0, 52.0, 77.0, 148.0, 259.0, 515.0, 1262.0, 3791.0, 17940.0, 218053.0, 747979.0, 47726.0, 7227.0, 1891.0, 750.0, 352.0, 179.0, 110.0, 48.0, 42.0, 24.0, 14.0, 8.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.2064208984375, -3.100341796875, -2.9942626953125, -2.88818359375, -2.7821044921875, -2.676025390625, -2.5699462890625, -2.4638671875, -2.3577880859375, -2.251708984375, -2.1456298828125, -2.03955078125, -1.9334716796875, -1.827392578125, -1.7213134765625, -1.615234375, -1.5091552734375, -1.403076171875, -1.2969970703125, -1.19091796875, -1.0848388671875, -0.978759765625, -0.8726806640625, -0.7666015625, -0.6605224609375, -0.554443359375, -0.4483642578125, -0.34228515625, -0.2362060546875, -0.130126953125, -0.0240478515625, 0.08203125, 0.1881103515625, 0.294189453125, 0.4002685546875, 0.50634765625, 0.6124267578125, 0.718505859375, 0.8245849609375, 0.9306640625, 1.0367431640625, 1.142822265625, 1.2489013671875, 1.35498046875, 1.4610595703125, 1.567138671875, 1.6732177734375, 1.779296875, 1.8853759765625, 1.991455078125, 2.0975341796875, 2.20361328125, 2.3096923828125, 2.415771484375, 2.5218505859375, 2.6279296875, 2.7340087890625, 2.840087890625, 2.9461669921875, 3.05224609375, 3.1583251953125, 3.264404296875, 3.3704833984375, 3.4765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 9.0, 13.0, 13.0, 22.0, 39.0, 48.0, 64.0, 65.0, 82.0, 76.0, 81.0, 98.0, 71.0, 71.0, 59.0, 58.0, 38.0, 24.0, 22.0, 11.0, 11.0, 11.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.258544921875, -5.07177734375, -4.885009765625, -4.6982421875, -4.511474609375, -4.32470703125, -4.137939453125, -3.951171875, -3.764404296875, -3.57763671875, -3.390869140625, -3.2041015625, -3.017333984375, -2.83056640625, -2.643798828125, -2.45703125, -2.270263671875, -2.08349609375, -1.896728515625, -1.7099609375, -1.523193359375, -1.33642578125, -1.149658203125, -0.962890625, -0.776123046875, -0.58935546875, -0.402587890625, -0.2158203125, -0.029052734375, 0.15771484375, 0.344482421875, 0.53125, 0.718017578125, 0.90478515625, 1.091552734375, 1.2783203125, 1.465087890625, 1.65185546875, 1.838623046875, 2.025390625, 2.212158203125, 2.39892578125, 2.585693359375, 2.7724609375, 2.959228515625, 3.14599609375, 3.332763671875, 3.51953125, 3.706298828125, 3.89306640625, 4.079833984375, 4.2666015625, 4.453369140625, 4.64013671875, 4.826904296875, 5.013671875, 5.200439453125, 5.38720703125, 5.573974609375, 5.7607421875, 5.947509765625, 6.13427734375, 6.321044921875, 6.5078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 14.0, 15.0, 23.0, 37.0, 65.0, 162.0, 365.0, 1022.0, 3618.0, 31385.0, 991660.0, 15999.0, 2682.0, 858.0, 320.0, 149.0, 67.0, 36.0, 22.0, 17.0, 11.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7268524169921875, -1.642181396484375, -1.5575103759765625, -1.47283935546875, -1.3881683349609375, -1.303497314453125, -1.2188262939453125, -1.1341552734375, -1.0494842529296875, -0.964813232421875, -0.8801422119140625, -0.79547119140625, -0.7108001708984375, -0.626129150390625, -0.5414581298828125, -0.456787109375, -0.3721160888671875, -0.287445068359375, -0.2027740478515625, -0.11810302734375, -0.0334320068359375, 0.051239013671875, 0.1359100341796875, 0.2205810546875, 0.3052520751953125, 0.389923095703125, 0.4745941162109375, 0.55926513671875, 0.6439361572265625, 0.728607177734375, 0.8132781982421875, 0.89794921875, 0.9826202392578125, 1.067291259765625, 1.1519622802734375, 1.23663330078125, 1.3213043212890625, 1.405975341796875, 1.4906463623046875, 1.5753173828125, 1.6599884033203125, 1.744659423828125, 1.8293304443359375, 1.91400146484375, 1.9986724853515625, 2.083343505859375, 2.1680145263671875, 2.252685546875, 2.3373565673828125, 2.422027587890625, 2.5066986083984375, 2.59136962890625, 2.6760406494140625, 2.760711669921875, 2.8453826904296875, 2.9300537109375, 3.0147247314453125, 3.099395751953125, 3.1840667724609375, 3.26873779296875, 3.3534088134765625, 3.438079833984375, 3.5227508544921875, 3.607421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 3.0, 7.0, 11.0, 9.0, 21.0, 29.0, 29.0, 32.0, 76.0, 138.0, 190.0, 148.0, 112.0, 63.0, 45.0, 23.0, 14.0, 11.0, 9.0, 3.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001690387725830078, -0.00016478542238473892, -0.00016053207218647003, -0.00015627872198820114, -0.00015202537178993225, -0.00014777202159166336, -0.00014351867139339447, -0.00013926532119512558, -0.0001350119709968567, -0.0001307586207985878, -0.0001265052706003189, -0.00012225192040205002, -0.00011799857020378113, -0.00011374522000551224, -0.00010949186980724335, -0.00010523851960897446, -0.00010098516941070557, -9.673181921243668e-05, -9.247846901416779e-05, -8.82251188158989e-05, -8.397176861763e-05, -7.971841841936111e-05, -7.546506822109222e-05, -7.121171802282333e-05, -6.695836782455444e-05, -6.270501762628555e-05, -5.845166742801666e-05, -5.419831722974777e-05, -4.994496703147888e-05, -4.569161683320999e-05, -4.14382666349411e-05, -3.718491643667221e-05, -3.293156623840332e-05, -2.867821604013443e-05, -2.442486584186554e-05, -2.017151564359665e-05, -1.591816544532776e-05, -1.1664815247058868e-05, -7.411465048789978e-06, -3.1581148505210876e-06, 1.0952353477478027e-06, 5.348585546016693e-06, 9.601935744285583e-06, 1.3855285942554474e-05, 1.8108636140823364e-05, 2.2361986339092255e-05, 2.6615336537361145e-05, 3.0868686735630035e-05, 3.5122036933898926e-05, 3.9375387132167816e-05, 4.3628737330436707e-05, 4.78820875287056e-05, 5.213543772697449e-05, 5.638878792524338e-05, 6.064213812351227e-05, 6.489548832178116e-05, 6.914883852005005e-05, 7.340218871831894e-05, 7.765553891658783e-05, 8.190888911485672e-05, 8.616223931312561e-05, 9.04155895113945e-05, 9.466893970966339e-05, 9.892228990793228e-05, 0.00010317564010620117]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 9.0, 6.0, 12.0, 18.0, 43.0, 48.0, 78.0, 141.0, 392.0, 1563.0, 16920.0, 1017246.0, 10140.0, 1238.0, 336.0, 148.0, 72.0, 40.0, 34.0, 18.0, 13.0, 11.0, 10.0, 5.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.224884033203125, -4.11773681640625, -4.010589599609375, -3.9034423828125, -3.796295166015625, -3.68914794921875, -3.582000732421875, -3.474853515625, -3.367706298828125, -3.26055908203125, -3.153411865234375, -3.0462646484375, -2.939117431640625, -2.83197021484375, -2.724822998046875, -2.61767578125, -2.510528564453125, -2.40338134765625, -2.296234130859375, -2.1890869140625, -2.081939697265625, -1.97479248046875, -1.867645263671875, -1.760498046875, -1.653350830078125, -1.54620361328125, -1.439056396484375, -1.3319091796875, -1.224761962890625, -1.11761474609375, -1.010467529296875, -0.9033203125, -0.796173095703125, -0.68902587890625, -0.581878662109375, -0.4747314453125, -0.367584228515625, -0.26043701171875, -0.153289794921875, -0.046142578125, 0.061004638671875, 0.16815185546875, 0.275299072265625, 0.3824462890625, 0.489593505859375, 0.59674072265625, 0.703887939453125, 0.81103515625, 0.918182373046875, 1.02532958984375, 1.132476806640625, 1.2396240234375, 1.346771240234375, 1.45391845703125, 1.561065673828125, 1.668212890625, 1.775360107421875, 1.88250732421875, 1.989654541015625, 2.0968017578125, 2.203948974609375, 2.31109619140625, 2.418243408203125, 2.525390625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 43.0, 271.0, 569.0, 77.0, 21.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4453125, -9.260955810546875, -9.07659912109375, -8.892242431640625, -8.7078857421875, -8.523529052734375, -8.33917236328125, -8.154815673828125, -7.970458984375, -7.786102294921875, -7.60174560546875, -7.417388916015625, -7.2330322265625, -7.048675537109375, -6.86431884765625, -6.679962158203125, -6.49560546875, -6.311248779296875, -6.12689208984375, -5.942535400390625, -5.7581787109375, -5.573822021484375, -5.38946533203125, -5.205108642578125, -5.020751953125, -4.836395263671875, -4.65203857421875, -4.467681884765625, -4.2833251953125, -4.098968505859375, -3.91461181640625, -3.730255126953125, -3.5458984375, -3.361541748046875, -3.17718505859375, -2.992828369140625, -2.8084716796875, -2.624114990234375, -2.43975830078125, -2.255401611328125, -2.071044921875, -1.886688232421875, -1.70233154296875, -1.517974853515625, -1.3336181640625, -1.149261474609375, -0.96490478515625, -0.780548095703125, -0.59619140625, -0.411834716796875, -0.22747802734375, -0.043121337890625, 0.1412353515625, 0.325592041015625, 0.50994873046875, 0.694305419921875, 0.878662109375, 1.063018798828125, 1.24737548828125, 1.431732177734375, 1.6160888671875, 1.800445556640625, 1.98480224609375, 2.169158935546875, 2.353515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 29.0, 51.0, 123.0, 256.0, 279.0, 156.0, 55.0, 23.0, 7.0, 5.0, 5.0, 0.0, 0.0, 1.0], "bins": [-61.468017578125, -60.33716583251953, -59.2063102722168, -58.07545852661133, -56.944602966308594, -55.813751220703125, -54.68289566040039, -53.55204391479492, -52.42118835449219, -51.29033660888672, -50.159481048583984, -49.028629302978516, -47.89777374267578, -46.76692199707031, -45.63606643676758, -44.50521469116211, -43.37436294555664, -42.24351119995117, -41.11265563964844, -39.98180389404297, -38.850948333740234, -37.720096588134766, -36.58924102783203, -35.45838928222656, -34.327537536621094, -33.196685791015625, -32.06583023071289, -30.93497657775879, -29.804122924804688, -28.67327117919922, -27.542417526245117, -26.411563873291016, -25.280712127685547, -24.149858474731445, -23.019004821777344, -21.888151168823242, -20.75729751586914, -19.626445770263672, -18.49559211730957, -17.36473846435547, -16.233882904052734, -15.103029251098633, -13.972175598144531, -12.841322898864746, -11.710469245910645, -10.579615592956543, -9.448762893676758, -8.317909240722656, -7.187056541442871, -6.0562028884887695, -4.925349712371826, -3.7944962978363037, -2.6636428833007812, -1.5327892303466797, -0.40193605422973633, 0.728917121887207, 1.8597707748413086, 2.990624189376831, 4.1214776039123535, 5.252330780029297, 6.383184432983398, 7.5140380859375, 8.644891738891602, 9.775744438171387, 10.906598091125488]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 7.0, 8.0, 12.0, 20.0, 8.0, 14.0, 21.0, 23.0, 29.0, 32.0, 36.0, 49.0, 42.0, 52.0, 43.0, 54.0, 59.0, 59.0, 47.0, 37.0, 42.0, 36.0, 45.0, 35.0, 30.0, 29.0, 19.0, 26.0, 23.0, 14.0, 6.0, 9.0, 3.0, 2.0, 5.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.26739501953125, -16.66203498840332, -16.056676864624023, -15.451316833496094, -14.84595775604248, -14.240598678588867, -13.635239601135254, -13.02988052368164, -12.424520492553711, -11.819161415100098, -11.213802337646484, -10.608442306518555, -10.003083229064941, -9.397724151611328, -8.792365074157715, -8.187005996704102, -7.581646919250488, -6.976287841796875, -6.3709282875061035, -5.76556921005249, -5.160209655761719, -4.5548505783081055, -3.949491500854492, -3.3441319465637207, -2.7387728691101074, -2.133413553237915, -1.5280543565750122, -0.9226951599121094, -0.317335844039917, 0.2880234718322754, 0.8933825492858887, 1.4987421035766602, 2.1041011810302734, 2.709460496902466, 3.314819812774658, 3.9201788902282715, 4.525538444519043, 5.130897521972656, 5.7362565994262695, 6.341616153717041, 6.946975231170654, 7.552334308624268, 8.157693862915039, 8.763052940368652, 9.368412017822266, 9.973772048950195, 10.579130172729492, 11.184490203857422, 11.789849281311035, 12.395208358764648, 13.000567436218262, 13.605926513671875, 14.211286544799805, 14.816645622253418, 15.422004699707031, 16.02736473083496, 16.632722854614258, 17.238082885742188, 17.843441009521484, 18.448801040649414, 19.05415916442871, 19.65951919555664, 20.264877319335938, 20.870237350463867, 21.475597381591797]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 11.0, 14.0, 13.0, 22.0, 31.0, 44.0, 66.0, 85.0, 111.0, 196.0, 312.0, 620.0, 1389.0, 5572.0, 4092387.0, 86698.0, 4083.0, 1232.0, 497.0, 293.0, 169.0, 124.0, 85.0, 63.0, 38.0, 39.0, 23.0, 18.0, 7.0, 15.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3671875, -3.27838134765625, -3.1895751953125, -3.10076904296875, -3.011962890625, -2.92315673828125, -2.8343505859375, -2.74554443359375, -2.65673828125, -2.56793212890625, -2.4791259765625, -2.39031982421875, -2.301513671875, -2.21270751953125, -2.1239013671875, -2.03509521484375, -1.9462890625, -1.85748291015625, -1.7686767578125, -1.67987060546875, -1.591064453125, -1.50225830078125, -1.4134521484375, -1.32464599609375, -1.23583984375, -1.14703369140625, -1.0582275390625, -0.96942138671875, -0.880615234375, -0.79180908203125, -0.7030029296875, -0.61419677734375, -0.525390625, -0.43658447265625, -0.3477783203125, -0.25897216796875, -0.170166015625, -0.08135986328125, 0.0074462890625, 0.09625244140625, 0.18505859375, 0.27386474609375, 0.3626708984375, 0.45147705078125, 0.540283203125, 0.62908935546875, 0.7178955078125, 0.80670166015625, 0.8955078125, 0.98431396484375, 1.0731201171875, 1.16192626953125, 1.250732421875, 1.33953857421875, 1.4283447265625, 1.51715087890625, 1.60595703125, 1.69476318359375, 1.7835693359375, 1.87237548828125, 1.961181640625, 2.04998779296875, 2.1387939453125, 2.22760009765625, 2.31640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 5.0, 8.0, 7.0, 7.0, 16.0, 6.0, 19.0, 24.0, 39.0, 34.0, 57.0, 55.0, 82.0, 70.0, 87.0, 71.0, 74.0, 55.0, 68.0, 49.0, 34.0, 16.0, 22.0, 25.0, 11.0, 16.0, 13.0, 9.0, 5.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2237472534179688, -1.1887054443359375, -1.1536636352539062, -1.118621826171875, -1.0835800170898438, -1.0485382080078125, -1.0134963989257812, -0.97845458984375, -0.9434127807617188, -0.9083709716796875, -0.8733291625976562, -0.838287353515625, -0.8032455444335938, -0.7682037353515625, -0.7331619262695312, -0.6981201171875, -0.6630783081054688, -0.6280364990234375, -0.5929946899414062, -0.557952880859375, -0.5229110717773438, -0.4878692626953125, -0.45282745361328125, -0.41778564453125, -0.38274383544921875, -0.3477020263671875, -0.31266021728515625, -0.277618408203125, -0.24257659912109375, -0.2075347900390625, -0.17249298095703125, -0.137451171875, -0.10240936279296875, -0.0673675537109375, -0.03232574462890625, 0.002716064453125, 0.03775787353515625, 0.0727996826171875, 0.10784149169921875, 0.14288330078125, 0.17792510986328125, 0.2129669189453125, 0.24800872802734375, 0.283050537109375, 0.31809234619140625, 0.3531341552734375, 0.38817596435546875, 0.4232177734375, 0.45825958251953125, 0.4933013916015625, 0.5283432006835938, 0.563385009765625, 0.5984268188476562, 0.6334686279296875, 0.6685104370117188, 0.70355224609375, 0.7385940551757812, 0.7736358642578125, 0.8086776733398438, 0.843719482421875, 0.8787612915039062, 0.9138031005859375, 0.9488449096679688, 0.98388671875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 7.0, 13.0, 13.0, 32.0, 26.0, 34.0, 52.0, 88.0, 92.0, 133.0, 203.0, 357.0, 586.0, 1422.0, 3668.0, 14786.0, 4081463.0, 78034.0, 8327.0, 2480.0, 1009.0, 461.0, 272.0, 185.0, 143.0, 100.0, 78.0, 67.0, 42.0, 28.0, 23.0, 16.0, 8.0, 5.0, 5.0, 5.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.07159423828125, -2.0064697265625, -1.94134521484375, -1.876220703125, -1.81109619140625, -1.7459716796875, -1.68084716796875, -1.61572265625, -1.55059814453125, -1.4854736328125, -1.42034912109375, -1.355224609375, -1.29010009765625, -1.2249755859375, -1.15985107421875, -1.0947265625, -1.02960205078125, -0.9644775390625, -0.89935302734375, -0.834228515625, -0.76910400390625, -0.7039794921875, -0.63885498046875, -0.57373046875, -0.50860595703125, -0.4434814453125, -0.37835693359375, -0.313232421875, -0.24810791015625, -0.1829833984375, -0.11785888671875, -0.052734375, 0.01239013671875, 0.0775146484375, 0.14263916015625, 0.207763671875, 0.27288818359375, 0.3380126953125, 0.40313720703125, 0.46826171875, 0.53338623046875, 0.5985107421875, 0.66363525390625, 0.728759765625, 0.79388427734375, 0.8590087890625, 0.92413330078125, 0.9892578125, 1.05438232421875, 1.1195068359375, 1.18463134765625, 1.249755859375, 1.31488037109375, 1.3800048828125, 1.44512939453125, 1.51025390625, 1.57537841796875, 1.6405029296875, 1.70562744140625, 1.770751953125, 1.83587646484375, 1.9010009765625, 1.96612548828125, 2.03125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 23.0, 77.0, 3817.0, 85.0, 27.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.2169342041015625, -0.198028564453125, -0.1791229248046875, -0.16021728515625, -0.1413116455078125, -0.122406005859375, -0.1035003662109375, -0.0845947265625, -0.0656890869140625, -0.046783447265625, -0.0278778076171875, -0.00897216796875, 0.0099334716796875, 0.028839111328125, 0.0477447509765625, 0.066650390625, 0.0855560302734375, 0.104461669921875, 0.1233673095703125, 0.14227294921875, 0.1611785888671875, 0.180084228515625, 0.1989898681640625, 0.2178955078125, 0.2368011474609375, 0.255706787109375, 0.2746124267578125, 0.29351806640625, 0.3124237060546875, 0.331329345703125, 0.3502349853515625, 0.369140625, 0.3880462646484375, 0.406951904296875, 0.4258575439453125, 0.44476318359375, 0.4636688232421875, 0.482574462890625, 0.5014801025390625, 0.5203857421875, 0.5392913818359375, 0.558197021484375, 0.5771026611328125, 0.59600830078125, 0.6149139404296875, 0.633819580078125, 0.6527252197265625, 0.671630859375, 0.6905364990234375, 0.709442138671875, 0.7283477783203125, 0.74725341796875, 0.7661590576171875, 0.785064697265625, 0.8039703369140625, 0.8228759765625, 0.8417816162109375, 0.860687255859375, 0.8795928955078125, 0.89849853515625, 0.9174041748046875, 0.936309814453125, 0.9552154541015625, 0.97412109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 130.0, 745.0, 118.0, 14.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.236989974975586, -9.93779468536377, -9.638599395751953, -9.339405059814453, -9.040209770202637, -8.74101448059082, -8.441819190979004, -8.142623901367188, -7.843428611755371, -7.544233322143555, -7.2450385093688965, -6.94584321975708, -6.646647930145264, -6.3474531173706055, -6.048257827758789, -5.749062538146973, -5.4498677253723145, -5.150672435760498, -4.85147762298584, -4.552282333374023, -4.253087043762207, -3.9538919925689697, -3.6546969413757324, -3.355501651763916, -3.0563066005706787, -2.7571115493774414, -2.457916259765625, -2.1587212085723877, -1.8595260381698608, -1.560330867767334, -1.2611358165740967, -0.9619405269622803, -0.662745475769043, -0.3635503351688385, -0.06435519456863403, 0.23483991622924805, 0.5340350866317749, 0.8332302570343018, 1.132425308227539, 1.4316205978393555, 1.7308156490325928, 2.03001070022583, 2.3292059898376465, 2.628401041030884, 2.927596092224121, 3.2267913818359375, 3.525986433029175, 3.825181722640991, 4.1243767738342285, 4.423572063446045, 4.722766876220703, 5.0219621658325195, 5.321157455444336, 5.620352745056152, 5.9195475578308105, 6.218742847442627, 6.517937660217285, 6.817132949829102, 7.11632776260376, 7.415523052215576, 7.714718341827393, 8.01391315460205, 8.313108444213867, 8.612303733825684, 8.9114990234375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 9.0, 5.0, 8.0, 11.0, 18.0, 16.0, 21.0, 27.0, 25.0, 30.0, 37.0, 36.0, 43.0, 40.0, 44.0, 54.0, 49.0, 54.0, 57.0, 51.0, 39.0, 40.0, 34.0, 35.0, 28.0, 35.0, 25.0, 26.0, 20.0, 11.0, 26.0, 14.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9321097731590271, -0.8937767744064331, -0.8554438352584839, -0.8171108365058899, -0.7787778973579407, -0.7404448986053467, -0.7021119594573975, -0.6637789607048035, -0.6254459619522095, -0.5871129631996155, -0.5487800240516663, -0.5104470252990723, -0.47211408615112305, -0.43378108739852905, -0.39544811844825745, -0.35711514949798584, -0.3187822103500366, -0.280449241399765, -0.2421162724494934, -0.2037832885980606, -0.165450319647789, -0.1271173506975174, -0.0887843668460846, -0.05045139789581299, -0.012118428945541382, 0.026214543730020523, 0.06454751640558243, 0.10288049280643463, 0.14121346175670624, 0.17954643070697784, 0.21787941455841064, 0.25621238350868225, 0.29454541206359863, 0.33287838101387024, 0.37121134996414185, 0.40954434871673584, 0.44787728786468506, 0.48621028661727905, 0.524543285369873, 0.5628762245178223, 0.6012091636657715, 0.6395421624183655, 0.6778751015663147, 0.7162081003189087, 0.7545410394668579, 0.7928740382194519, 0.8312070369720459, 0.8695399761199951, 0.9078729748725891, 0.9462059736251831, 0.9845389127731323, 1.0228718519210815, 1.0612049102783203, 1.0995378494262695, 1.1378707885742188, 1.176203727722168, 1.2145367860794067, 1.252869725227356, 1.2912027835845947, 1.329535722732544, 1.3678686618804932, 1.4062016010284424, 1.4445346593856812, 1.4828675985336304, 1.5212005376815796]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 6.0, 13.0, 19.0, 30.0, 40.0, 59.0, 67.0, 132.0, 199.0, 289.0, 474.0, 860.0, 1676.0, 3304.0, 7881.0, 21945.0, 83774.0, 503186.0, 337929.0, 57257.0, 16906.0, 6379.0, 2828.0, 1319.0, 749.0, 454.0, 254.0, 160.0, 101.0, 76.0, 62.0, 34.0, 19.0, 22.0, 10.0, 9.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.16796875, -2.103973388671875, -2.03997802734375, -1.975982666015625, -1.9119873046875, -1.847991943359375, -1.78399658203125, -1.720001220703125, -1.656005859375, -1.592010498046875, -1.52801513671875, -1.464019775390625, -1.4000244140625, -1.336029052734375, -1.27203369140625, -1.208038330078125, -1.14404296875, -1.080047607421875, -1.01605224609375, -0.952056884765625, -0.8880615234375, -0.824066162109375, -0.76007080078125, -0.696075439453125, -0.632080078125, -0.568084716796875, -0.50408935546875, -0.440093994140625, -0.3760986328125, -0.312103271484375, -0.24810791015625, -0.184112548828125, -0.1201171875, -0.056121826171875, 0.00787353515625, 0.071868896484375, 0.1358642578125, 0.199859619140625, 0.26385498046875, 0.327850341796875, 0.391845703125, 0.455841064453125, 0.51983642578125, 0.583831787109375, 0.6478271484375, 0.711822509765625, 0.77581787109375, 0.839813232421875, 0.90380859375, 0.967803955078125, 1.03179931640625, 1.095794677734375, 1.1597900390625, 1.223785400390625, 1.28778076171875, 1.351776123046875, 1.415771484375, 1.479766845703125, 1.54376220703125, 1.607757568359375, 1.6717529296875, 1.735748291015625, 1.79974365234375, 1.863739013671875, 1.927734375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 10.0, 7.0, 5.0, 20.0, 18.0, 27.0, 26.0, 30.0, 52.0, 55.0, 67.0, 72.0, 77.0, 73.0, 67.0, 68.0, 60.0, 55.0, 44.0, 30.0, 21.0, 25.0, 14.0, 19.0, 11.0, 13.0, 10.0, 2.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2490234375, -1.2147293090820312, -1.1804351806640625, -1.1461410522460938, -1.111846923828125, -1.0775527954101562, -1.0432586669921875, -1.0089645385742188, -0.97467041015625, -0.9403762817382812, -0.9060821533203125, -0.8717880249023438, -0.837493896484375, -0.8031997680664062, -0.7689056396484375, -0.7346115112304688, -0.7003173828125, -0.6660232543945312, -0.6317291259765625, -0.5974349975585938, -0.563140869140625, -0.5288467407226562, -0.4945526123046875, -0.46025848388671875, -0.42596435546875, -0.39167022705078125, -0.3573760986328125, -0.32308197021484375, -0.288787841796875, -0.25449371337890625, -0.2201995849609375, -0.18590545654296875, -0.151611328125, -0.11731719970703125, -0.0830230712890625, -0.04872894287109375, -0.014434814453125, 0.01985931396484375, 0.0541534423828125, 0.08844757080078125, 0.12274169921875, 0.15703582763671875, 0.1913299560546875, 0.22562408447265625, 0.259918212890625, 0.29421234130859375, 0.3285064697265625, 0.36280059814453125, 0.3970947265625, 0.43138885498046875, 0.4656829833984375, 0.49997711181640625, 0.534271240234375, 0.5685653686523438, 0.6028594970703125, 0.6371536254882812, 0.67144775390625, 0.7057418823242188, 0.7400360107421875, 0.7743301391601562, 0.808624267578125, 0.8429183959960938, 0.8772125244140625, 0.9115066528320312, 0.94580078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 15.0, 27.0, 38.0, 70.0, 124.0, 235.0, 432.0, 789.0, 1716.0, 4406.0, 19612.0, 333780.0, 649232.0, 28537.0, 5559.0, 1958.0, 901.0, 470.0, 247.0, 133.0, 86.0, 64.0, 37.0, 16.0, 13.0, 9.0, 9.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.619903564453125, -3.50347900390625, -3.387054443359375, -3.2706298828125, -3.154205322265625, -3.03778076171875, -2.921356201171875, -2.804931640625, -2.688507080078125, -2.57208251953125, -2.455657958984375, -2.3392333984375, -2.222808837890625, -2.10638427734375, -1.989959716796875, -1.87353515625, -1.757110595703125, -1.64068603515625, -1.524261474609375, -1.4078369140625, -1.291412353515625, -1.17498779296875, -1.058563232421875, -0.942138671875, -0.825714111328125, -0.70928955078125, -0.592864990234375, -0.4764404296875, -0.360015869140625, -0.24359130859375, -0.127166748046875, -0.0107421875, 0.105682373046875, 0.22210693359375, 0.338531494140625, 0.4549560546875, 0.571380615234375, 0.68780517578125, 0.804229736328125, 0.920654296875, 1.037078857421875, 1.15350341796875, 1.269927978515625, 1.3863525390625, 1.502777099609375, 1.61920166015625, 1.735626220703125, 1.85205078125, 1.968475341796875, 2.08489990234375, 2.201324462890625, 2.3177490234375, 2.434173583984375, 2.55059814453125, 2.667022705078125, 2.783447265625, 2.899871826171875, 3.01629638671875, 3.132720947265625, 3.2491455078125, 3.365570068359375, 3.48199462890625, 3.598419189453125, 3.71484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 7.0, 15.0, 18.0, 23.0, 32.0, 38.0, 41.0, 62.0, 57.0, 53.0, 64.0, 63.0, 79.0, 63.0, 62.0, 62.0, 44.0, 49.0, 36.0, 35.0, 20.0, 16.0, 12.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.62005615234375, -4.4471435546875, -4.27423095703125, -4.101318359375, -3.92840576171875, -3.7554931640625, -3.58258056640625, -3.40966796875, -3.23675537109375, -3.0638427734375, -2.89093017578125, -2.718017578125, -2.54510498046875, -2.3721923828125, -2.19927978515625, -2.0263671875, -1.85345458984375, -1.6805419921875, -1.50762939453125, -1.334716796875, -1.16180419921875, -0.9888916015625, -0.81597900390625, -0.64306640625, -0.47015380859375, -0.2972412109375, -0.12432861328125, 0.048583984375, 0.22149658203125, 0.3944091796875, 0.56732177734375, 0.740234375, 0.91314697265625, 1.0860595703125, 1.25897216796875, 1.431884765625, 1.60479736328125, 1.7777099609375, 1.95062255859375, 2.12353515625, 2.29644775390625, 2.4693603515625, 2.64227294921875, 2.815185546875, 2.98809814453125, 3.1610107421875, 3.33392333984375, 3.5068359375, 3.67974853515625, 3.8526611328125, 4.02557373046875, 4.198486328125, 4.37139892578125, 4.5443115234375, 4.71722412109375, 4.89013671875, 5.06304931640625, 5.2359619140625, 5.40887451171875, 5.581787109375, 5.75469970703125, 5.9276123046875, 6.10052490234375, 6.2734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 11.0, 14.0, 32.0, 102.0, 341.0, 1446.0, 13347.0, 1020230.0, 11188.0, 1394.0, 271.0, 92.0, 50.0, 13.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.53125, -6.36578369140625, -6.2003173828125, -6.03485107421875, -5.869384765625, -5.70391845703125, -5.5384521484375, -5.37298583984375, -5.20751953125, -5.04205322265625, -4.8765869140625, -4.71112060546875, -4.545654296875, -4.38018798828125, -4.2147216796875, -4.04925537109375, -3.8837890625, -3.71832275390625, -3.5528564453125, -3.38739013671875, -3.221923828125, -3.05645751953125, -2.8909912109375, -2.72552490234375, -2.56005859375, -2.39459228515625, -2.2291259765625, -2.06365966796875, -1.898193359375, -1.73272705078125, -1.5672607421875, -1.40179443359375, -1.236328125, -1.07086181640625, -0.9053955078125, -0.73992919921875, -0.574462890625, -0.40899658203125, -0.2435302734375, -0.07806396484375, 0.08740234375, 0.25286865234375, 0.4183349609375, 0.58380126953125, 0.749267578125, 0.91473388671875, 1.0802001953125, 1.24566650390625, 1.4111328125, 1.57659912109375, 1.7420654296875, 1.90753173828125, 2.072998046875, 2.23846435546875, 2.4039306640625, 2.56939697265625, 2.73486328125, 2.90032958984375, 3.0657958984375, 3.23126220703125, 3.396728515625, 3.56219482421875, 3.7276611328125, 3.89312744140625, 4.05859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 7.0, 16.0, 33.0, 70.0, 189.0, 274.0, 205.0, 112.0, 45.0, 12.0, 10.0, 10.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022149085998535156, -0.0002125091850757599, -0.0002035275101661682, -0.00019454583525657654, -0.00018556416034698486, -0.0001765824854373932, -0.00016760081052780151, -0.00015861913561820984, -0.00014963746070861816, -0.0001406557857990265, -0.00013167411088943481, -0.00012269243597984314, -0.00011371076107025146, -0.00010472908616065979, -9.574741125106812e-05, -8.676573634147644e-05, -7.778406143188477e-05, -6.880238652229309e-05, -5.9820711612701416e-05, -5.083903670310974e-05, -4.1857361793518066e-05, -3.287568688392639e-05, -2.3894011974334717e-05, -1.4912337064743042e-05, -5.930662155151367e-06, 3.0510127544403076e-06, 1.2032687664031982e-05, 2.1014362573623657e-05, 2.9996037483215332e-05, 3.897771239280701e-05, 4.795938730239868e-05, 5.6941062211990356e-05, 6.592273712158203e-05, 7.49044120311737e-05, 8.388608694076538e-05, 9.286776185035706e-05, 0.00010184943675994873, 0.0001108311116695404, 0.00011981278657913208, 0.00012879446148872375, 0.00013777613639831543, 0.0001467578113079071, 0.00015573948621749878, 0.00016472116112709045, 0.00017370283603668213, 0.0001826845109462738, 0.00019166618585586548, 0.00020064786076545715, 0.00020962953567504883, 0.0002186112105846405, 0.00022759288549423218, 0.00023657456040382385, 0.00024555623531341553, 0.0002545379102230072, 0.0002635195851325989, 0.00027250126004219055, 0.0002814829349517822, 0.0002904646098613739, 0.0002994462847709656, 0.00030842795968055725, 0.0003174096345901489, 0.0003263913094997406, 0.0003353729844093323, 0.00034435465931892395, 0.0003533363342285156]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 11.0, 4.0, 13.0, 12.0, 16.0, 39.0, 46.0, 73.0, 144.0, 279.0, 543.0, 1326.0, 3478.0, 12171.0, 778799.0, 237282.0, 9244.0, 2793.0, 1156.0, 551.0, 234.0, 128.0, 63.0, 59.0, 27.0, 21.0, 13.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9482421875, -1.873046875, -1.7978515625, -1.72265625, -1.6474609375, -1.572265625, -1.4970703125, -1.421875, -1.3466796875, -1.271484375, -1.1962890625, -1.12109375, -1.0458984375, -0.970703125, -0.8955078125, -0.8203125, -0.7451171875, -0.669921875, -0.5947265625, -0.51953125, -0.4443359375, -0.369140625, -0.2939453125, -0.21875, -0.1435546875, -0.068359375, 0.0068359375, 0.08203125, 0.1572265625, 0.232421875, 0.3076171875, 0.3828125, 0.4580078125, 0.533203125, 0.6083984375, 0.68359375, 0.7587890625, 0.833984375, 0.9091796875, 0.984375, 1.0595703125, 1.134765625, 1.2099609375, 1.28515625, 1.3603515625, 1.435546875, 1.5107421875, 1.5859375, 1.6611328125, 1.736328125, 1.8115234375, 1.88671875, 1.9619140625, 2.037109375, 2.1123046875, 2.1875, 2.2626953125, 2.337890625, 2.4130859375, 2.48828125, 2.5634765625, 2.638671875, 2.7138671875, 2.7890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 9.0, 23.0, 92.0, 354.0, 331.0, 94.0, 19.0, 12.0, 9.0, 5.0, 3.0, 2.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.859222412109375, -2.70867919921875, -2.558135986328125, -2.4075927734375, -2.257049560546875, -2.10650634765625, -1.955963134765625, -1.805419921875, -1.654876708984375, -1.50433349609375, -1.353790283203125, -1.2032470703125, -1.052703857421875, -0.90216064453125, -0.751617431640625, -0.60107421875, -0.450531005859375, -0.29998779296875, -0.149444580078125, 0.0010986328125, 0.151641845703125, 0.30218505859375, 0.452728271484375, 0.603271484375, 0.753814697265625, 0.90435791015625, 1.054901123046875, 1.2054443359375, 1.355987548828125, 1.50653076171875, 1.657073974609375, 1.8076171875, 1.958160400390625, 2.10870361328125, 2.259246826171875, 2.4097900390625, 2.560333251953125, 2.71087646484375, 2.861419677734375, 3.011962890625, 3.162506103515625, 3.31304931640625, 3.463592529296875, 3.6141357421875, 3.764678955078125, 3.91522216796875, 4.065765380859375, 4.21630859375, 4.366851806640625, 4.51739501953125, 4.667938232421875, 4.8184814453125, 4.969024658203125, 5.11956787109375, 5.270111083984375, 5.420654296875, 5.571197509765625, 5.72174072265625, 5.872283935546875, 6.0228271484375, 6.173370361328125, 6.32391357421875, 6.474456787109375, 6.625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 12.0, 41.0, 132.0, 289.0, 278.0, 128.0, 70.0, 29.0, 19.0, 9.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.160404205322266, -25.91027069091797, -24.660137176513672, -23.410003662109375, -22.159870147705078, -20.90973663330078, -19.659605026245117, -18.40947151184082, -17.159337997436523, -15.909204483032227, -14.65907096862793, -13.40893840789795, -12.158804893493652, -10.908671379089355, -9.658538818359375, -8.408405303955078, -7.158271789550781, -5.908138275146484, -4.658005237579346, -3.407871961593628, -2.15773868560791, -0.9076051712036133, 0.3425278663635254, 1.592660903930664, 2.842794418334961, 4.092927932739258, 5.3430609703063965, 6.593194007873535, 7.843327522277832, 9.093461036682129, 10.34359359741211, 11.593727111816406, 12.843864440917969, 14.093997955322266, 15.344131469726562, 16.59426498413086, 17.844398498535156, 19.094532012939453, 20.344663619995117, 21.594797134399414, 22.84493064880371, 24.095064163208008, 25.345197677612305, 26.5953311920166, 27.845462799072266, 29.095596313476562, 30.34572982788086, 31.595863342285156, 32.84599685668945, 34.09613037109375, 35.34626388549805, 36.596397399902344, 37.84653091430664, 39.09666442871094, 40.346797943115234, 41.59693145751953, 42.84706115722656, 44.09719467163086, 45.347328186035156, 46.59746170043945, 47.84759521484375, 49.09772872924805, 50.347862243652344, 51.597991943359375, 52.84812927246094]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 7.0, 6.0, 12.0, 10.0, 17.0, 8.0, 17.0, 12.0, 19.0, 18.0, 24.0, 24.0, 21.0, 31.0, 22.0, 50.0, 42.0, 45.0, 40.0, 42.0, 30.0, 44.0, 47.0, 45.0, 40.0, 44.0, 37.0, 31.0, 30.0, 28.0, 31.0, 13.0, 16.0, 21.0, 18.0, 18.0, 10.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.617327690124512, -15.052301406860352, -14.487274169921875, -13.922247886657715, -13.357221603393555, -12.792194366455078, -12.227168083190918, -11.662141799926758, -11.097114562988281, -10.532088279724121, -9.967061042785645, -9.402034759521484, -8.837007522583008, -8.271981239318848, -7.7069549560546875, -7.141928195953369, -6.576901435852051, -6.011874675750732, -5.446847915649414, -4.881821632385254, -4.3167948722839355, -3.751768112182617, -3.186741590499878, -2.6217150688171387, -2.0566883087158203, -1.4916616678237915, -0.9266350269317627, -0.3616083860397339, 0.20341825485229492, 0.7684450149536133, 1.3334715366363525, 1.8984980583190918, 2.4635257720947266, 3.028552532196045, 3.593579053878784, 4.158605575561523, 4.723632335662842, 5.28865909576416, 5.85368537902832, 6.418712139129639, 6.983738899230957, 7.548765659332275, 8.113792419433594, 8.678818702697754, 9.243844985961914, 9.80887222290039, 10.37389850616455, 10.938924789428711, 11.503952026367188, 12.068978309631348, 12.634005546569824, 13.199031829833984, 13.764059066772461, 14.329085350036621, 14.894111633300781, 15.459138870239258, 16.024166107177734, 16.58919334411621, 17.154218673706055, 17.71924591064453, 18.284273147583008, 18.849300384521484, 19.414325714111328, 19.979352951049805, 20.54437828063965]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 9.0, 6.0, 4.0, 9.0, 13.0, 10.0, 18.0, 26.0, 39.0, 54.0, 81.0, 136.0, 233.0, 425.0, 1018.0, 3183.0, 28463.0, 4143983.0, 12394.0, 2365.0, 814.0, 367.0, 212.0, 131.0, 86.0, 55.0, 25.0, 21.0, 18.0, 19.0, 17.0, 6.0, 15.0, 10.0, 3.0, 4.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.88714599609375, -3.7547607421875, -3.62237548828125, -3.489990234375, -3.35760498046875, -3.2252197265625, -3.09283447265625, -2.96044921875, -2.82806396484375, -2.6956787109375, -2.56329345703125, -2.430908203125, -2.29852294921875, -2.1661376953125, -2.03375244140625, -1.9013671875, -1.76898193359375, -1.6365966796875, -1.50421142578125, -1.371826171875, -1.23944091796875, -1.1070556640625, -0.97467041015625, -0.84228515625, -0.70989990234375, -0.5775146484375, -0.44512939453125, -0.312744140625, -0.18035888671875, -0.0479736328125, 0.08441162109375, 0.216796875, 0.34918212890625, 0.4815673828125, 0.61395263671875, 0.746337890625, 0.87872314453125, 1.0111083984375, 1.14349365234375, 1.27587890625, 1.40826416015625, 1.5406494140625, 1.67303466796875, 1.805419921875, 1.93780517578125, 2.0701904296875, 2.20257568359375, 2.3349609375, 2.46734619140625, 2.5997314453125, 2.73211669921875, 2.864501953125, 2.99688720703125, 3.1292724609375, 3.26165771484375, 3.39404296875, 3.52642822265625, 3.6588134765625, 3.79119873046875, 3.923583984375, 4.05596923828125, 4.1883544921875, 4.32073974609375, 4.453125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 8.0, 14.0, 16.0, 27.0, 34.0, 34.0, 51.0, 48.0, 59.0, 78.0, 67.0, 70.0, 81.0, 73.0, 63.0, 54.0, 42.0, 34.0, 30.0, 22.0, 12.0, 16.0, 11.0, 9.0, 7.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8544921875, -0.81842041015625, -0.7823486328125, -0.74627685546875, -0.710205078125, -0.67413330078125, -0.6380615234375, -0.60198974609375, -0.56591796875, -0.52984619140625, -0.4937744140625, -0.45770263671875, -0.421630859375, -0.38555908203125, -0.3494873046875, -0.31341552734375, -0.27734375, -0.24127197265625, -0.2052001953125, -0.16912841796875, -0.133056640625, -0.09698486328125, -0.0609130859375, -0.02484130859375, 0.01123046875, 0.04730224609375, 0.0833740234375, 0.11944580078125, 0.155517578125, 0.19158935546875, 0.2276611328125, 0.26373291015625, 0.2998046875, 0.33587646484375, 0.3719482421875, 0.40802001953125, 0.444091796875, 0.48016357421875, 0.5162353515625, 0.55230712890625, 0.58837890625, 0.62445068359375, 0.6605224609375, 0.69659423828125, 0.732666015625, 0.76873779296875, 0.8048095703125, 0.84088134765625, 0.876953125, 0.91302490234375, 0.9490966796875, 0.98516845703125, 1.021240234375, 1.05731201171875, 1.0933837890625, 1.12945556640625, 1.16552734375, 1.20159912109375, 1.2376708984375, 1.27374267578125, 1.309814453125, 1.34588623046875, 1.3819580078125, 1.41802978515625, 1.4541015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 9.0, 7.0, 15.0, 18.0, 17.0, 37.0, 34.0, 38.0, 60.0, 69.0, 105.0, 117.0, 191.0, 247.0, 299.0, 385.0, 897.0, 10436.0, 4175136.0, 4050.0, 650.0, 328.0, 256.0, 181.0, 184.0, 106.0, 87.0, 80.0, 60.0, 39.0, 28.0, 22.0, 22.0, 18.0, 10.0, 11.0, 11.0, 8.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.63671875, -11.265625, -10.89453125, -10.5234375, -10.15234375, -9.78125, -9.41015625, -9.0390625, -8.66796875, -8.296875, -7.92578125, -7.5546875, -7.18359375, -6.8125, -6.44140625, -6.0703125, -5.69921875, -5.328125, -4.95703125, -4.5859375, -4.21484375, -3.84375, -3.47265625, -3.1015625, -2.73046875, -2.359375, -1.98828125, -1.6171875, -1.24609375, -0.875, -0.50390625, -0.1328125, 0.23828125, 0.609375, 0.98046875, 1.3515625, 1.72265625, 2.09375, 2.46484375, 2.8359375, 3.20703125, 3.578125, 3.94921875, 4.3203125, 4.69140625, 5.0625, 5.43359375, 5.8046875, 6.17578125, 6.546875, 6.91796875, 7.2890625, 7.66015625, 8.03125, 8.40234375, 8.7734375, 9.14453125, 9.515625, 9.88671875, 10.2578125, 10.62890625, 11.0, 11.37109375, 11.7421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 25.0, 4003.0, 40.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.640625, -13.37078857421875, -13.1009521484375, -12.83111572265625, -12.561279296875, -12.29144287109375, -12.0216064453125, -11.75177001953125, -11.48193359375, -11.21209716796875, -10.9422607421875, -10.67242431640625, -10.402587890625, -10.13275146484375, -9.8629150390625, -9.59307861328125, -9.3232421875, -9.05340576171875, -8.7835693359375, -8.51373291015625, -8.243896484375, -7.97406005859375, -7.7042236328125, -7.43438720703125, -7.16455078125, -6.89471435546875, -6.6248779296875, -6.35504150390625, -6.085205078125, -5.81536865234375, -5.5455322265625, -5.27569580078125, -5.005859375, -4.73602294921875, -4.4661865234375, -4.19635009765625, -3.926513671875, -3.65667724609375, -3.3868408203125, -3.11700439453125, -2.84716796875, -2.57733154296875, -2.3074951171875, -2.03765869140625, -1.767822265625, -1.49798583984375, -1.2281494140625, -0.95831298828125, -0.6884765625, -0.41864013671875, -0.1488037109375, 0.12103271484375, 0.390869140625, 0.66070556640625, 0.9305419921875, 1.20037841796875, 1.47021484375, 1.74005126953125, 2.0098876953125, 2.27972412109375, 2.549560546875, 2.81939697265625, 3.0892333984375, 3.35906982421875, 3.62890625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 24.0, 55.0, 184.0, 438.0, 212.0, 62.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.379966735839844, -33.69788360595703, -33.01579666137695, -32.33371353149414, -31.651628494262695, -30.96954345703125, -30.287460327148438, -29.605375289916992, -28.923290252685547, -28.2412052154541, -27.55912208557129, -26.877037048339844, -26.1949520111084, -25.512866973876953, -24.83078384399414, -24.148698806762695, -23.466615676879883, -22.784530639648438, -22.102447509765625, -21.42036247253418, -20.738277435302734, -20.056194305419922, -19.374109268188477, -18.69202423095703, -18.00994110107422, -17.327856063842773, -16.64577293395996, -15.963687896728516, -15.28160285949707, -14.599518775939941, -13.917434692382812, -13.235349655151367, -12.553266525268555, -11.871182441711426, -11.18909740447998, -10.507013320922852, -9.824928283691406, -9.142844200134277, -8.460760116577148, -7.778675556182861, -7.096590995788574, -6.414506435394287, -5.732421875, -5.050337791442871, -4.368253231048584, -3.686168670654297, -3.004084587097168, -2.322000026702881, -1.6399154663085938, -0.9578310251235962, -0.27574658393859863, 0.4063377380371094, 1.0884222984313965, 1.7705068588256836, 2.4525909423828125, 3.1346755027770996, 3.8167600631713867, 4.498844623565674, 5.180929183959961, 5.86301326751709, 6.545097827911377, 7.227182388305664, 7.909266471862793, 8.591350555419922, 9.273435592651367]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 12.0, 17.0, 20.0, 38.0, 64.0, 90.0, 123.0, 163.0, 140.0, 114.0, 69.0, 49.0, 41.0, 20.0, 17.0, 5.0, 9.0, 0.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28121566772461, -20.547666549682617, -19.814117431640625, -19.08056640625, -18.347017288208008, -17.613468170166016, -16.879919052124023, -16.14636993408203, -15.412819862365723, -14.67927074432373, -13.945720672607422, -13.21217155456543, -12.478622436523438, -11.745072364807129, -11.011523246765137, -10.277973175048828, -9.544424057006836, -8.810874938964844, -8.077324867248535, -7.343775749206543, -6.610226154327393, -5.876676559448242, -5.14312744140625, -4.4095778465271, -3.676028251647949, -2.942478656768799, -2.2089293003082275, -1.4753799438476562, -0.7418303489685059, -0.008280754089355469, 0.7252683639526367, 1.458817958831787, 2.1923694610595703, 2.9259190559387207, 3.659468412399292, 4.393017768859863, 5.126567363739014, 5.860116958618164, 6.593666076660156, 7.327215671539307, 8.060765266418457, 8.79431438446045, 9.527864456176758, 10.26141357421875, 10.994962692260742, 11.72851276397705, 12.462061882019043, 13.195611953735352, 13.929161071777344, 14.662710189819336, 15.396260261535645, 16.129810333251953, 16.863359451293945, 17.596908569335938, 18.33045768737793, 19.064006805419922, 19.797557830810547, 20.53110694885254, 21.26465606689453, 21.998207092285156, 22.73175621032715, 23.46530532836914, 24.198854446411133, 24.932403564453125, 25.665952682495117]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 18.0, 19.0, 40.0, 55.0, 107.0, 178.0, 336.0, 652.0, 1696.0, 5319.0, 22103.0, 151814.0, 714412.0, 124756.0, 19520.0, 4613.0, 1502.0, 676.0, 306.0, 157.0, 102.0, 62.0, 32.0, 22.0, 19.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.9449462890625, -2.844970703125, -2.7449951171875, -2.64501953125, -2.5450439453125, -2.445068359375, -2.3450927734375, -2.2451171875, -2.1451416015625, -2.045166015625, -1.9451904296875, -1.84521484375, -1.7452392578125, -1.645263671875, -1.5452880859375, -1.4453125, -1.3453369140625, -1.245361328125, -1.1453857421875, -1.04541015625, -0.9454345703125, -0.845458984375, -0.7454833984375, -0.6455078125, -0.5455322265625, -0.445556640625, -0.3455810546875, -0.24560546875, -0.1456298828125, -0.045654296875, 0.0543212890625, 0.154296875, 0.2542724609375, 0.354248046875, 0.4542236328125, 0.55419921875, 0.6541748046875, 0.754150390625, 0.8541259765625, 0.9541015625, 1.0540771484375, 1.154052734375, 1.2540283203125, 1.35400390625, 1.4539794921875, 1.553955078125, 1.6539306640625, 1.75390625, 1.8538818359375, 1.953857421875, 2.0538330078125, 2.15380859375, 2.2537841796875, 2.353759765625, 2.4537353515625, 2.5537109375, 2.6536865234375, 2.753662109375, 2.8536376953125, 2.95361328125, 3.0535888671875, 3.153564453125, 3.2535400390625, 3.353515625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 8.0, 18.0, 18.0, 21.0, 35.0, 39.0, 55.0, 66.0, 79.0, 100.0, 96.0, 97.0, 90.0, 75.0, 46.0, 45.0, 22.0, 16.0, 20.0, 12.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.876953125, -1.8171234130859375, -1.757293701171875, -1.6974639892578125, -1.63763427734375, -1.5778045654296875, -1.517974853515625, -1.4581451416015625, -1.3983154296875, -1.3384857177734375, -1.278656005859375, -1.2188262939453125, -1.15899658203125, -1.0991668701171875, -1.039337158203125, -0.9795074462890625, -0.919677734375, -0.8598480224609375, -0.800018310546875, -0.7401885986328125, -0.68035888671875, -0.6205291748046875, -0.560699462890625, -0.5008697509765625, -0.4410400390625, -0.3812103271484375, -0.321380615234375, -0.2615509033203125, -0.20172119140625, -0.1418914794921875, -0.082061767578125, -0.0222320556640625, 0.03759765625, 0.0974273681640625, 0.157257080078125, 0.2170867919921875, 0.27691650390625, 0.3367462158203125, 0.396575927734375, 0.4564056396484375, 0.5162353515625, 0.5760650634765625, 0.635894775390625, 0.6957244873046875, 0.75555419921875, 0.8153839111328125, 0.875213623046875, 0.9350433349609375, 0.994873046875, 1.0547027587890625, 1.114532470703125, 1.1743621826171875, 1.23419189453125, 1.2940216064453125, 1.353851318359375, 1.4136810302734375, 1.4735107421875, 1.5333404541015625, 1.593170166015625, 1.6529998779296875, 1.71282958984375, 1.7726593017578125, 1.832489013671875, 1.8923187255859375, 1.9521484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 14.0, 18.0, 20.0, 36.0, 48.0, 90.0, 147.0, 276.0, 717.0, 3284.0, 110577.0, 921293.0, 9946.0, 1177.0, 411.0, 192.0, 118.0, 78.0, 41.0, 23.0, 7.0, 11.0, 10.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.43572998046875, -7.1722412109375, -6.90875244140625, -6.645263671875, -6.38177490234375, -6.1182861328125, -5.85479736328125, -5.59130859375, -5.32781982421875, -5.0643310546875, -4.80084228515625, -4.537353515625, -4.27386474609375, -4.0103759765625, -3.74688720703125, -3.4833984375, -3.21990966796875, -2.9564208984375, -2.69293212890625, -2.429443359375, -2.16595458984375, -1.9024658203125, -1.63897705078125, -1.37548828125, -1.11199951171875, -0.8485107421875, -0.58502197265625, -0.321533203125, -0.05804443359375, 0.2054443359375, 0.46893310546875, 0.732421875, 0.99591064453125, 1.2593994140625, 1.52288818359375, 1.786376953125, 2.04986572265625, 2.3133544921875, 2.57684326171875, 2.84033203125, 3.10382080078125, 3.3673095703125, 3.63079833984375, 3.894287109375, 4.15777587890625, 4.4212646484375, 4.68475341796875, 4.9482421875, 5.21173095703125, 5.4752197265625, 5.73870849609375, 6.002197265625, 6.26568603515625, 6.5291748046875, 6.79266357421875, 7.05615234375, 7.31964111328125, 7.5831298828125, 7.84661865234375, 8.110107421875, 8.37359619140625, 8.6370849609375, 8.90057373046875, 9.1640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 39.0, 68.0, 112.0, 168.0, 184.0, 158.0, 122.0, 92.0, 30.0, 13.0, 10.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.880859375, -21.35546875, -20.830078125, -20.3046875, -19.779296875, -19.25390625, -18.728515625, -18.203125, -17.677734375, -17.15234375, -16.626953125, -16.1015625, -15.576171875, -15.05078125, -14.525390625, -14.0, -13.474609375, -12.94921875, -12.423828125, -11.8984375, -11.373046875, -10.84765625, -10.322265625, -9.796875, -9.271484375, -8.74609375, -8.220703125, -7.6953125, -7.169921875, -6.64453125, -6.119140625, -5.59375, -5.068359375, -4.54296875, -4.017578125, -3.4921875, -2.966796875, -2.44140625, -1.916015625, -1.390625, -0.865234375, -0.33984375, 0.185546875, 0.7109375, 1.236328125, 1.76171875, 2.287109375, 2.8125, 3.337890625, 3.86328125, 4.388671875, 4.9140625, 5.439453125, 5.96484375, 6.490234375, 7.015625, 7.541015625, 8.06640625, 8.591796875, 9.1171875, 9.642578125, 10.16796875, 10.693359375, 11.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 13.0, 16.0, 20.0, 24.0, 45.0, 87.0, 169.0, 515.0, 1960.0, 13064.0, 646920.0, 372543.0, 10619.0, 1718.0, 463.0, 166.0, 68.0, 27.0, 39.0, 12.0, 9.0, 7.0, 12.0, 4.0, 7.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.119415283203125, -2.06500244140625, -2.010589599609375, -1.9561767578125, -1.901763916015625, -1.84735107421875, -1.792938232421875, -1.738525390625, -1.684112548828125, -1.62969970703125, -1.575286865234375, -1.5208740234375, -1.466461181640625, -1.41204833984375, -1.357635498046875, -1.30322265625, -1.248809814453125, -1.19439697265625, -1.139984130859375, -1.0855712890625, -1.031158447265625, -0.97674560546875, -0.922332763671875, -0.867919921875, -0.813507080078125, -0.75909423828125, -0.704681396484375, -0.6502685546875, -0.595855712890625, -0.54144287109375, -0.487030029296875, -0.4326171875, -0.378204345703125, -0.32379150390625, -0.269378662109375, -0.2149658203125, -0.160552978515625, -0.10614013671875, -0.051727294921875, 0.002685546875, 0.057098388671875, 0.11151123046875, 0.165924072265625, 0.2203369140625, 0.274749755859375, 0.32916259765625, 0.383575439453125, 0.43798828125, 0.492401123046875, 0.54681396484375, 0.601226806640625, 0.6556396484375, 0.710052490234375, 0.76446533203125, 0.818878173828125, 0.873291015625, 0.927703857421875, 0.98211669921875, 1.036529541015625, 1.0909423828125, 1.145355224609375, 1.19976806640625, 1.254180908203125, 1.30859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 16.0, 12.0, 25.0, 49.0, 57.0, 72.0, 117.0, 127.0, 124.0, 101.0, 77.0, 46.0, 30.0, 24.0, 18.0, 15.0, 11.0, 10.0, 6.0, 5.0, 7.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011783838272094727, -0.0001134360209107399, -0.00010903365910053253, -0.00010463129729032516, -0.0001002289354801178, -9.582657366991043e-05, -9.142421185970306e-05, -8.70218500494957e-05, -8.261948823928833e-05, -7.821712642908096e-05, -7.38147646188736e-05, -6.941240280866623e-05, -6.501004099845886e-05, -6.0607679188251495e-05, -5.620531737804413e-05, -5.180295556783676e-05, -4.7400593757629395e-05, -4.299823194742203e-05, -3.859587013721466e-05, -3.4193508327007294e-05, -2.9791146516799927e-05, -2.538878470659256e-05, -2.0986422896385193e-05, -1.6584061086177826e-05, -1.2181699275970459e-05, -7.779337465763092e-06, -3.376975655555725e-06, 1.0253861546516418e-06, 5.427747964859009e-06, 9.830109775066376e-06, 1.4232471585273743e-05, 1.863483339548111e-05, 2.3037195205688477e-05, 2.7439557015895844e-05, 3.184191882610321e-05, 3.624428063631058e-05, 4.0646642446517944e-05, 4.504900425672531e-05, 4.945136606693268e-05, 5.3853727877140045e-05, 5.825608968734741e-05, 6.265845149755478e-05, 6.706081330776215e-05, 7.146317511796951e-05, 7.586553692817688e-05, 8.026789873838425e-05, 8.467026054859161e-05, 8.907262235879898e-05, 9.347498416900635e-05, 9.787734597921371e-05, 0.00010227970778942108, 0.00010668206959962845, 0.00011108443140983582, 0.00011548679322004318, 0.00011988915503025055, 0.00012429151684045792, 0.00012869387865066528, 0.00013309624046087265, 0.00013749860227108002, 0.00014190096408128738, 0.00014630332589149475, 0.00015070568770170212, 0.00015510804951190948, 0.00015951041132211685, 0.00016391277313232422]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 9.0, 12.0, 8.0, 32.0, 62.0, 117.0, 240.0, 650.0, 2354.0, 21714.0, 986760.0, 32660.0, 2666.0, 732.0, 275.0, 105.0, 59.0, 36.0, 19.0, 11.0, 8.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.080078125, -2.007232666015625, -1.93438720703125, -1.861541748046875, -1.7886962890625, -1.715850830078125, -1.64300537109375, -1.570159912109375, -1.497314453125, -1.424468994140625, -1.35162353515625, -1.278778076171875, -1.2059326171875, -1.133087158203125, -1.06024169921875, -0.987396240234375, -0.91455078125, -0.841705322265625, -0.76885986328125, -0.696014404296875, -0.6231689453125, -0.550323486328125, -0.47747802734375, -0.404632568359375, -0.331787109375, -0.258941650390625, -0.18609619140625, -0.113250732421875, -0.0404052734375, 0.032440185546875, 0.10528564453125, 0.178131103515625, 0.2509765625, 0.323822021484375, 0.39666748046875, 0.469512939453125, 0.5423583984375, 0.615203857421875, 0.68804931640625, 0.760894775390625, 0.833740234375, 0.906585693359375, 0.97943115234375, 1.052276611328125, 1.1251220703125, 1.197967529296875, 1.27081298828125, 1.343658447265625, 1.41650390625, 1.489349365234375, 1.56219482421875, 1.635040283203125, 1.7078857421875, 1.780731201171875, 1.85357666015625, 1.926422119140625, 1.999267578125, 2.072113037109375, 2.14495849609375, 2.217803955078125, 2.2906494140625, 2.363494873046875, 2.43634033203125, 2.509185791015625, 2.58203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 12.0, 8.0, 14.0, 19.0, 44.0, 88.0, 133.0, 160.0, 184.0, 136.0, 78.0, 44.0, 26.0, 15.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.278717041015625, -1.22540283203125, -1.172088623046875, -1.1187744140625, -1.065460205078125, -1.01214599609375, -0.958831787109375, -0.905517578125, -0.852203369140625, -0.79888916015625, -0.745574951171875, -0.6922607421875, -0.638946533203125, -0.58563232421875, -0.532318115234375, -0.47900390625, -0.425689697265625, -0.37237548828125, -0.319061279296875, -0.2657470703125, -0.212432861328125, -0.15911865234375, -0.105804443359375, -0.052490234375, 0.000823974609375, 0.05413818359375, 0.107452392578125, 0.1607666015625, 0.214080810546875, 0.26739501953125, 0.320709228515625, 0.3740234375, 0.427337646484375, 0.48065185546875, 0.533966064453125, 0.5872802734375, 0.640594482421875, 0.69390869140625, 0.747222900390625, 0.800537109375, 0.853851318359375, 0.90716552734375, 0.960479736328125, 1.0137939453125, 1.067108154296875, 1.12042236328125, 1.173736572265625, 1.22705078125, 1.280364990234375, 1.33367919921875, 1.386993408203125, 1.4403076171875, 1.493621826171875, 1.54693603515625, 1.600250244140625, 1.653564453125, 1.706878662109375, 1.76019287109375, 1.813507080078125, 1.8668212890625, 1.920135498046875, 1.97344970703125, 2.026763916015625, 2.080078125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 17.0, 122.0, 653.0, 203.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.2798309326172, -128.9432373046875, -124.60664367675781, -120.27005004882812, -115.93345642089844, -111.59686279296875, -107.26026916503906, -102.92367553710938, -98.58708190917969, -94.25048828125, -89.91389465332031, -85.57730102539062, -81.24070739746094, -76.90411376953125, -72.56752014160156, -68.23092651367188, -63.89433288574219, -59.5577392578125, -55.22114562988281, -50.884552001953125, -46.54795837402344, -42.21136474609375, -37.87477111816406, -33.538177490234375, -29.201583862304688, -24.864990234375, -20.528396606445312, -16.191802978515625, -11.855209350585938, -7.51861572265625, -3.1820220947265625, 1.154571533203125, 5.49114990234375, 9.827743530273438, 14.164337158203125, 18.500930786132812, 22.8375244140625, 27.174118041992188, 31.510711669921875, 35.84730529785156, 40.18389892578125, 44.52049255371094, 48.857086181640625, 53.19367980957031, 57.5302734375, 61.86686706542969, 66.20346069335938, 70.54005432128906, 74.87664794921875, 79.21324157714844, 83.54983520507812, 87.88642883300781, 92.2230224609375, 96.55961608886719, 100.89620971679688, 105.23280334472656, 109.56939697265625, 113.90599060058594, 118.24258422851562, 122.57917785644531, 126.915771484375, 131.2523651123047, 135.58895874023438, 139.92555236816406, 144.26214599609375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 16.0, 17.0, 21.0, 30.0, 23.0, 43.0, 29.0, 37.0, 58.0, 54.0, 59.0, 60.0, 67.0, 60.0, 55.0, 52.0, 47.0, 38.0, 43.0, 27.0, 32.0, 23.0, 18.0, 7.0, 12.0, 20.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.70851135253906, -40.5550422668457, -39.401573181152344, -38.248104095458984, -37.094635009765625, -35.941165924072266, -34.787696838378906, -33.63422775268555, -32.48075866699219, -31.327289581298828, -30.17382049560547, -29.02035140991211, -27.86688232421875, -26.71341323852539, -25.55994415283203, -24.406475067138672, -23.253005981445312, -22.099536895751953, -20.946067810058594, -19.792598724365234, -18.639129638671875, -17.485660552978516, -16.332191467285156, -15.178722381591797, -14.025253295898438, -12.871784210205078, -11.718315124511719, -10.56484603881836, -9.411376953125, -8.25790786743164, -7.104438781738281, -5.950969696044922, -4.797496795654297, -3.6440277099609375, -2.490558624267578, -1.3370895385742188, -0.18362045288085938, 0.9698486328125, 2.1233177185058594, 3.2767868041992188, 4.430255889892578, 5.5837249755859375, 6.737194061279297, 7.890663146972656, 9.044132232666016, 10.197601318359375, 11.351070404052734, 12.504539489746094, 13.658008575439453, 14.811477661132812, 15.964946746826172, 17.11841583251953, 18.27188491821289, 19.42535400390625, 20.57882308959961, 21.73229217529297, 22.885761260986328, 24.039230346679688, 25.192699432373047, 26.346168518066406, 27.499637603759766, 28.653106689453125, 29.806575775146484, 30.960044860839844, 32.1135139465332]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 12.0, 9.0, 20.0, 26.0, 33.0, 55.0, 58.0, 114.0, 123.0, 205.0, 270.0, 402.0, 620.0, 1033.0, 1720.0, 2806.0, 4930.0, 10407.0, 26163.0, 109223.0, 1439583.0, 2415902.0, 128950.0, 26415.0, 10630.0, 5546.0, 3159.0, 1944.0, 1219.0, 788.0, 575.0, 376.0, 267.0, 202.0, 146.0, 92.0, 62.0, 55.0, 40.0, 28.0, 17.0, 14.0, 11.0, 6.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9634246826171875, -0.927825927734375, -0.8922271728515625, -0.85662841796875, -0.8210296630859375, -0.785430908203125, -0.7498321533203125, -0.7142333984375, -0.6786346435546875, -0.643035888671875, -0.6074371337890625, -0.57183837890625, -0.5362396240234375, -0.500640869140625, -0.4650421142578125, -0.429443359375, -0.3938446044921875, -0.358245849609375, -0.3226470947265625, -0.28704833984375, -0.2514495849609375, -0.215850830078125, -0.1802520751953125, -0.1446533203125, -0.1090545654296875, -0.073455810546875, -0.0378570556640625, -0.00225830078125, 0.0333404541015625, 0.068939208984375, 0.1045379638671875, 0.14013671875, 0.1757354736328125, 0.211334228515625, 0.2469329833984375, 0.28253173828125, 0.3181304931640625, 0.353729248046875, 0.3893280029296875, 0.4249267578125, 0.4605255126953125, 0.496124267578125, 0.5317230224609375, 0.56732177734375, 0.6029205322265625, 0.638519287109375, 0.6741180419921875, 0.709716796875, 0.7453155517578125, 0.780914306640625, 0.8165130615234375, 0.85211181640625, 0.8877105712890625, 0.923309326171875, 0.9589080810546875, 0.9945068359375, 1.0301055908203125, 1.065704345703125, 1.1013031005859375, 1.13690185546875, 1.1725006103515625, 1.208099365234375, 1.2436981201171875, 1.279296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 4.0, 7.0, 16.0, 10.0, 15.0, 26.0, 26.0, 24.0, 27.0, 36.0, 44.0, 58.0, 57.0, 53.0, 56.0, 58.0, 61.0, 56.0, 60.0, 42.0, 37.0, 41.0, 35.0, 26.0, 17.0, 18.0, 23.0, 13.0, 9.0, 5.0, 8.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9189453125, -0.8869171142578125, -0.854888916015625, -0.8228607177734375, -0.79083251953125, -0.7588043212890625, -0.726776123046875, -0.6947479248046875, -0.6627197265625, -0.6306915283203125, -0.598663330078125, -0.5666351318359375, -0.53460693359375, -0.5025787353515625, -0.470550537109375, -0.4385223388671875, -0.406494140625, -0.3744659423828125, -0.342437744140625, -0.3104095458984375, -0.27838134765625, -0.2463531494140625, -0.214324951171875, -0.1822967529296875, -0.1502685546875, -0.1182403564453125, -0.086212158203125, -0.0541839599609375, -0.02215576171875, 0.0098724365234375, 0.041900634765625, 0.0739288330078125, 0.10595703125, 0.1379852294921875, 0.170013427734375, 0.2020416259765625, 0.23406982421875, 0.2660980224609375, 0.298126220703125, 0.3301544189453125, 0.3621826171875, 0.3942108154296875, 0.426239013671875, 0.4582672119140625, 0.49029541015625, 0.5223236083984375, 0.554351806640625, 0.5863800048828125, 0.618408203125, 0.6504364013671875, 0.682464599609375, 0.7144927978515625, 0.74652099609375, 0.7785491943359375, 0.810577392578125, 0.8426055908203125, 0.8746337890625, 0.9066619873046875, 0.938690185546875, 0.9707183837890625, 1.00274658203125, 1.0347747802734375, 1.066802978515625, 1.0988311767578125, 1.130859375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 5.0, 9.0, 19.0, 16.0, 31.0, 50.0, 103.0, 221.0, 395.0, 999.0, 3259.0, 18390.0, 611125.0, 3525401.0, 27485.0, 4352.0, 1245.0, 490.0, 266.0, 141.0, 88.0, 36.0, 28.0, 17.0, 17.0, 13.0, 7.0, 3.0, 6.0, 7.0, 2.0, 4.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.7000732421875, -3.591552734375, -3.4830322265625, -3.37451171875, -3.2659912109375, -3.157470703125, -3.0489501953125, -2.9404296875, -2.8319091796875, -2.723388671875, -2.6148681640625, -2.50634765625, -2.3978271484375, -2.289306640625, -2.1807861328125, -2.072265625, -1.9637451171875, -1.855224609375, -1.7467041015625, -1.63818359375, -1.5296630859375, -1.421142578125, -1.3126220703125, -1.2041015625, -1.0955810546875, -0.987060546875, -0.8785400390625, -0.77001953125, -0.6614990234375, -0.552978515625, -0.4444580078125, -0.3359375, -0.2274169921875, -0.118896484375, -0.0103759765625, 0.09814453125, 0.2066650390625, 0.315185546875, 0.4237060546875, 0.5322265625, 0.6407470703125, 0.749267578125, 0.8577880859375, 0.96630859375, 1.0748291015625, 1.183349609375, 1.2918701171875, 1.400390625, 1.5089111328125, 1.617431640625, 1.7259521484375, 1.83447265625, 1.9429931640625, 2.051513671875, 2.1600341796875, 2.2685546875, 2.3770751953125, 2.485595703125, 2.5941162109375, 2.70263671875, 2.8111572265625, 2.919677734375, 3.0281982421875, 3.13671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 8.0, 10.0, 10.0, 14.0, 24.0, 23.0, 32.0, 58.0, 183.0, 784.0, 1964.0, 623.0, 140.0, 61.0, 35.0, 21.0, 26.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.044921875, -1.949798583984375, -1.85467529296875, -1.759552001953125, -1.6644287109375, -1.569305419921875, -1.47418212890625, -1.379058837890625, -1.283935546875, -1.188812255859375, -1.09368896484375, -0.998565673828125, -0.9034423828125, -0.808319091796875, -0.71319580078125, -0.618072509765625, -0.52294921875, -0.427825927734375, -0.33270263671875, -0.237579345703125, -0.1424560546875, -0.047332763671875, 0.04779052734375, 0.142913818359375, 0.238037109375, 0.333160400390625, 0.42828369140625, 0.523406982421875, 0.6185302734375, 0.713653564453125, 0.80877685546875, 0.903900146484375, 0.9990234375, 1.094146728515625, 1.18927001953125, 1.284393310546875, 1.3795166015625, 1.474639892578125, 1.56976318359375, 1.664886474609375, 1.760009765625, 1.855133056640625, 1.95025634765625, 2.045379638671875, 2.1405029296875, 2.235626220703125, 2.33074951171875, 2.425872802734375, 2.52099609375, 2.616119384765625, 2.71124267578125, 2.806365966796875, 2.9014892578125, 2.996612548828125, 3.09173583984375, 3.186859130859375, 3.281982421875, 3.377105712890625, 3.47222900390625, 3.567352294921875, 3.6624755859375, 3.757598876953125, 3.85272216796875, 3.947845458984375, 4.04296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 4.0, 18.0, 19.0, 26.0, 47.0, 91.0, 129.0, 140.0, 154.0, 119.0, 90.0, 56.0, 31.0, 12.0, 18.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.957306861877441, -12.5669584274292, -12.176609992980957, -11.786261558532715, -11.395913124084473, -11.00556468963623, -10.615216255187988, -10.224867820739746, -9.834519386291504, -9.444170951843262, -9.05382251739502, -8.663474082946777, -8.273125648498535, -7.882777214050293, -7.492428779602051, -7.102080345153809, -6.711731910705566, -6.321383476257324, -5.931035041809082, -5.54068660736084, -5.150338172912598, -4.7599897384643555, -4.369641304016113, -3.979292869567871, -3.588944435119629, -3.1985960006713867, -2.8082475662231445, -2.4178991317749023, -2.02755069732666, -1.637202262878418, -1.2468538284301758, -0.8565053939819336, -0.466156005859375, -0.07580757141113281, 0.3145408630371094, 0.7048892974853516, 1.0952377319335938, 1.485586166381836, 1.8759346008300781, 2.2662830352783203, 2.6566314697265625, 3.0469799041748047, 3.437328338623047, 3.827676773071289, 4.218025207519531, 4.608373641967773, 4.998722076416016, 5.389070510864258, 5.7794189453125, 6.169767379760742, 6.560115814208984, 6.950464248657227, 7.340812683105469, 7.731161117553711, 8.121509552001953, 8.511857986450195, 8.902206420898438, 9.29255485534668, 9.682903289794922, 10.073251724243164, 10.463600158691406, 10.853948593139648, 11.24429702758789, 11.634645462036133, 12.024993896484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 12.0, 9.0, 19.0, 29.0, 20.0, 21.0, 28.0, 33.0, 40.0, 45.0, 41.0, 52.0, 54.0, 82.0, 64.0, 71.0, 52.0, 34.0, 57.0, 39.0, 31.0, 38.0, 26.0, 23.0, 14.0, 17.0, 13.0, 7.0, 4.0, 5.0, 1.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.359330177307129, -9.958972930908203, -9.558615684509277, -9.158258438110352, -8.757902145385742, -8.3575439453125, -7.957187652587891, -7.556830406188965, -7.156473159790039, -6.756115913391113, -6.3557586669921875, -5.95540189743042, -5.555044651031494, -5.154687404632568, -4.754330635070801, -4.353973388671875, -3.953616142272949, -3.5532588958740234, -3.1529018878936768, -2.75254487991333, -2.3521876335144043, -1.9518303871154785, -1.5514733791351318, -1.1511163711547852, -0.7507591247558594, -0.35040199756622314, 0.049955129623413086, 0.4503122568130493, 0.8506693840026855, 1.2510266304016113, 1.651383638381958, 2.0517406463623047, 2.4520978927612305, 2.8524551391601562, 3.252812147140503, 3.6531691551208496, 4.053526401519775, 4.453883647918701, 4.854240417480469, 5.2545976638793945, 5.65495491027832, 6.055312156677246, 6.455669403076172, 6.8560261726379395, 7.256383419036865, 7.656740665435791, 8.057097434997559, 8.457454681396484, 8.85781192779541, 9.258169174194336, 9.658526420593262, 10.058883666992188, 10.459239959716797, 10.859598159790039, 11.259954452514648, 11.660311698913574, 12.0606689453125, 12.461026191711426, 12.861383438110352, 13.261740684509277, 13.662097930908203, 14.062454223632812, 14.462811470031738, 14.863168716430664, 15.26352596282959]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 17.0, 22.0, 24.0, 52.0, 63.0, 91.0, 136.0, 194.0, 291.0, 446.0, 683.0, 1125.0, 1674.0, 2910.0, 4910.0, 8425.0, 15237.0, 28004.0, 54273.0, 111025.0, 217306.0, 271049.0, 162404.0, 79597.0, 39851.0, 20718.0, 11697.0, 6468.0, 3677.0, 2260.0, 1412.0, 881.0, 577.0, 377.0, 232.0, 142.0, 94.0, 64.0, 47.0, 34.0, 20.0, 13.0, 11.0, 11.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6571121215820312, -0.6320953369140625, -0.6070785522460938, -0.582061767578125, -0.5570449829101562, -0.5320281982421875, -0.5070114135742188, -0.48199462890625, -0.45697784423828125, -0.4319610595703125, -0.40694427490234375, -0.381927490234375, -0.35691070556640625, -0.3318939208984375, -0.30687713623046875, -0.2818603515625, -0.25684356689453125, -0.2318267822265625, -0.20680999755859375, -0.181793212890625, -0.15677642822265625, -0.1317596435546875, -0.10674285888671875, -0.08172607421875, -0.05670928955078125, -0.0316925048828125, -0.00667572021484375, 0.018341064453125, 0.04335784912109375, 0.0683746337890625, 0.09339141845703125, 0.118408203125, 0.14342498779296875, 0.1684417724609375, 0.19345855712890625, 0.218475341796875, 0.24349212646484375, 0.2685089111328125, 0.29352569580078125, 0.31854248046875, 0.34355926513671875, 0.3685760498046875, 0.39359283447265625, 0.418609619140625, 0.44362640380859375, 0.4686431884765625, 0.49365997314453125, 0.5186767578125, 0.5436935424804688, 0.5687103271484375, 0.5937271118164062, 0.618743896484375, 0.6437606811523438, 0.6687774658203125, 0.6937942504882812, 0.71881103515625, 0.7438278198242188, 0.7688446044921875, 0.7938613891601562, 0.818878173828125, 0.8438949584960938, 0.8689117431640625, 0.8939285278320312, 0.9189453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 22.0, 18.0, 13.0, 19.0, 20.0, 29.0, 27.0, 42.0, 32.0, 38.0, 51.0, 46.0, 53.0, 47.0, 70.0, 59.0, 54.0, 60.0, 39.0, 36.0, 29.0, 22.0, 33.0, 31.0, 25.0, 15.0, 11.0, 10.0, 10.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.7779388427734375, -0.748260498046875, -0.7185821533203125, -0.68890380859375, -0.6592254638671875, -0.629547119140625, -0.5998687744140625, -0.5701904296875, -0.5405120849609375, -0.510833740234375, -0.4811553955078125, -0.45147705078125, -0.4217987060546875, -0.392120361328125, -0.3624420166015625, -0.332763671875, -0.3030853271484375, -0.273406982421875, -0.2437286376953125, -0.21405029296875, -0.1843719482421875, -0.154693603515625, -0.1250152587890625, -0.0953369140625, -0.0656585693359375, -0.035980224609375, -0.0063018798828125, 0.02337646484375, 0.0530548095703125, 0.082733154296875, 0.1124114990234375, 0.14208984375, 0.1717681884765625, 0.201446533203125, 0.2311248779296875, 0.26080322265625, 0.2904815673828125, 0.320159912109375, 0.3498382568359375, 0.3795166015625, 0.4091949462890625, 0.438873291015625, 0.4685516357421875, 0.49822998046875, 0.5279083251953125, 0.557586669921875, 0.5872650146484375, 0.616943359375, 0.6466217041015625, 0.676300048828125, 0.7059783935546875, 0.73565673828125, 0.7653350830078125, 0.795013427734375, 0.8246917724609375, 0.8543701171875, 0.8840484619140625, 0.913726806640625, 0.9434051513671875, 0.97308349609375, 1.0027618408203125, 1.032440185546875, 1.0621185302734375, 1.091796875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 7.0, 12.0, 16.0, 22.0, 51.0, 71.0, 121.0, 180.0, 301.0, 573.0, 1171.0, 3068.0, 13614.0, 165124.0, 796046.0, 57059.0, 7296.0, 2016.0, 791.0, 419.0, 221.0, 122.0, 86.0, 51.0, 35.0, 24.0, 16.0, 8.0, 4.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.784820556640625, -2.67901611328125, -2.573211669921875, -2.4674072265625, -2.361602783203125, -2.25579833984375, -2.149993896484375, -2.044189453125, -1.938385009765625, -1.83258056640625, -1.726776123046875, -1.6209716796875, -1.515167236328125, -1.40936279296875, -1.303558349609375, -1.19775390625, -1.091949462890625, -0.98614501953125, -0.880340576171875, -0.7745361328125, -0.668731689453125, -0.56292724609375, -0.457122802734375, -0.351318359375, -0.245513916015625, -0.13970947265625, -0.033905029296875, 0.0718994140625, 0.177703857421875, 0.28350830078125, 0.389312744140625, 0.4951171875, 0.600921630859375, 0.70672607421875, 0.812530517578125, 0.9183349609375, 1.024139404296875, 1.12994384765625, 1.235748291015625, 1.341552734375, 1.447357177734375, 1.55316162109375, 1.658966064453125, 1.7647705078125, 1.870574951171875, 1.97637939453125, 2.082183837890625, 2.18798828125, 2.293792724609375, 2.39959716796875, 2.505401611328125, 2.6112060546875, 2.717010498046875, 2.82281494140625, 2.928619384765625, 3.034423828125, 3.140228271484375, 3.24603271484375, 3.351837158203125, 3.4576416015625, 3.563446044921875, 3.66925048828125, 3.775054931640625, 3.880859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 10.0, 7.0, 12.0, 15.0, 27.0, 24.0, 22.0, 32.0, 43.0, 36.0, 45.0, 46.0, 49.0, 57.0, 50.0, 45.0, 40.0, 76.0, 47.0, 39.0, 36.0, 37.0, 33.0, 32.0, 27.0, 15.0, 16.0, 13.0, 9.0, 11.0, 6.0, 6.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.635955810546875, -3.50433349609375, -3.372711181640625, -3.2410888671875, -3.109466552734375, -2.97784423828125, -2.846221923828125, -2.714599609375, -2.582977294921875, -2.45135498046875, -2.319732666015625, -2.1881103515625, -2.056488037109375, -1.92486572265625, -1.793243408203125, -1.66162109375, -1.529998779296875, -1.39837646484375, -1.266754150390625, -1.1351318359375, -1.003509521484375, -0.87188720703125, -0.740264892578125, -0.608642578125, -0.477020263671875, -0.34539794921875, -0.213775634765625, -0.0821533203125, 0.049468994140625, 0.18109130859375, 0.312713623046875, 0.4443359375, 0.575958251953125, 0.70758056640625, 0.839202880859375, 0.9708251953125, 1.102447509765625, 1.23406982421875, 1.365692138671875, 1.497314453125, 1.628936767578125, 1.76055908203125, 1.892181396484375, 2.0238037109375, 2.155426025390625, 2.28704833984375, 2.418670654296875, 2.55029296875, 2.681915283203125, 2.81353759765625, 2.945159912109375, 3.0767822265625, 3.208404541015625, 3.34002685546875, 3.471649169921875, 3.603271484375, 3.734893798828125, 3.86651611328125, 3.998138427734375, 4.1297607421875, 4.261383056640625, 4.39300537109375, 4.524627685546875, 4.65625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 15.0, 19.0, 23.0, 35.0, 55.0, 98.0, 169.0, 299.0, 577.0, 1441.0, 3695.0, 16382.0, 423640.0, 576819.0, 18406.0, 3983.0, 1438.0, 650.0, 297.0, 172.0, 112.0, 56.0, 44.0, 23.0, 14.0, 8.0, 9.0, 12.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.1591796875, -1.120574951171875, -1.08197021484375, -1.043365478515625, -1.0047607421875, -0.966156005859375, -0.92755126953125, -0.888946533203125, -0.850341796875, -0.811737060546875, -0.77313232421875, -0.734527587890625, -0.6959228515625, -0.657318115234375, -0.61871337890625, -0.580108642578125, -0.54150390625, -0.502899169921875, -0.46429443359375, -0.425689697265625, -0.3870849609375, -0.348480224609375, -0.30987548828125, -0.271270751953125, -0.232666015625, -0.194061279296875, -0.15545654296875, -0.116851806640625, -0.0782470703125, -0.039642333984375, -0.00103759765625, 0.037567138671875, 0.076171875, 0.114776611328125, 0.15338134765625, 0.191986083984375, 0.2305908203125, 0.269195556640625, 0.30780029296875, 0.346405029296875, 0.385009765625, 0.423614501953125, 0.46221923828125, 0.500823974609375, 0.5394287109375, 0.578033447265625, 0.61663818359375, 0.655242919921875, 0.69384765625, 0.732452392578125, 0.77105712890625, 0.809661865234375, 0.8482666015625, 0.886871337890625, 0.92547607421875, 0.964080810546875, 1.002685546875, 1.041290283203125, 1.07989501953125, 1.118499755859375, 1.1571044921875, 1.195709228515625, 1.23431396484375, 1.272918701171875, 1.3115234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 9.0, 6.0, 13.0, 14.0, 31.0, 53.0, 88.0, 131.0, 184.0, 183.0, 108.0, 69.0, 37.0, 31.0, 11.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00027108192443847656, -0.00026389583945274353, -0.0002567097544670105, -0.00024952366948127747, -0.00024233758449554443, -0.0002351514995098114, -0.00022796541452407837, -0.00022077932953834534, -0.0002135932445526123, -0.00020640715956687927, -0.00019922107458114624, -0.0001920349895954132, -0.00018484890460968018, -0.00017766281962394714, -0.0001704767346382141, -0.00016329064965248108, -0.00015610456466674805, -0.00014891847968101501, -0.00014173239469528198, -0.00013454630970954895, -0.00012736022472381592, -0.00012017413973808289, -0.00011298805475234985, -0.00010580196976661682, -9.861588478088379e-05, -9.142979979515076e-05, -8.424371480941772e-05, -7.705762982368469e-05, -6.987154483795166e-05, -6.268545985221863e-05, -5.5499374866485596e-05, -4.8313289880752563e-05, -4.112720489501953e-05, -3.39411199092865e-05, -2.6755034923553467e-05, -1.9568949937820435e-05, -1.2382864952087402e-05, -5.19677996635437e-06, 1.989305019378662e-06, 9.175390005111694e-06, 1.6361474990844727e-05, 2.354755997657776e-05, 3.073364496231079e-05, 3.791972994804382e-05, 4.5105814933776855e-05, 5.229189991950989e-05, 5.947798490524292e-05, 6.666406989097595e-05, 7.385015487670898e-05, 8.103623986244202e-05, 8.822232484817505e-05, 9.540840983390808e-05, 0.00010259449481964111, 0.00010978057980537415, 0.00011696666479110718, 0.0001241527497768402, 0.00013133883476257324, 0.00013852491974830627, 0.0001457110047340393, 0.00015289708971977234, 0.00016008317470550537, 0.0001672692596912384, 0.00017445534467697144, 0.00018164142966270447, 0.0001888275146484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 3.0, 5.0, 13.0, 12.0, 13.0, 28.0, 30.0, 48.0, 71.0, 107.0, 194.0, 387.0, 904.0, 2658.0, 11446.0, 250725.0, 754746.0, 21049.0, 3770.0, 1238.0, 476.0, 216.0, 123.0, 87.0, 57.0, 29.0, 26.0, 17.0, 11.0, 7.0, 10.0, 3.0, 7.0, 6.0, 4.0, 1.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3076171875, -1.266937255859375, -1.22625732421875, -1.185577392578125, -1.1448974609375, -1.104217529296875, -1.06353759765625, -1.022857666015625, -0.982177734375, -0.941497802734375, -0.90081787109375, -0.860137939453125, -0.8194580078125, -0.778778076171875, -0.73809814453125, -0.697418212890625, -0.65673828125, -0.616058349609375, -0.57537841796875, -0.534698486328125, -0.4940185546875, -0.453338623046875, -0.41265869140625, -0.371978759765625, -0.331298828125, -0.290618896484375, -0.24993896484375, -0.209259033203125, -0.1685791015625, -0.127899169921875, -0.08721923828125, -0.046539306640625, -0.005859375, 0.034820556640625, 0.07550048828125, 0.116180419921875, 0.1568603515625, 0.197540283203125, 0.23822021484375, 0.278900146484375, 0.319580078125, 0.360260009765625, 0.40093994140625, 0.441619873046875, 0.4822998046875, 0.522979736328125, 0.56365966796875, 0.604339599609375, 0.64501953125, 0.685699462890625, 0.72637939453125, 0.767059326171875, 0.8077392578125, 0.848419189453125, 0.88909912109375, 0.929779052734375, 0.970458984375, 1.011138916015625, 1.05181884765625, 1.092498779296875, 1.1331787109375, 1.173858642578125, 1.21453857421875, 1.255218505859375, 1.2958984375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 38.0, 49.0, 60.0, 88.0, 116.0, 117.0, 107.0, 82.0, 73.0, 64.0, 39.0, 31.0, 26.0, 10.0, 6.0, 4.0, 5.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.173828125, -1.1358489990234375, -1.097869873046875, -1.0598907470703125, -1.02191162109375, -0.9839324951171875, -0.945953369140625, -0.9079742431640625, -0.8699951171875, -0.8320159912109375, -0.794036865234375, -0.7560577392578125, -0.71807861328125, -0.6800994873046875, -0.642120361328125, -0.6041412353515625, -0.566162109375, -0.5281829833984375, -0.490203857421875, -0.4522247314453125, -0.41424560546875, -0.3762664794921875, -0.338287353515625, -0.3003082275390625, -0.2623291015625, -0.2243499755859375, -0.186370849609375, -0.1483917236328125, -0.11041259765625, -0.0724334716796875, -0.034454345703125, 0.0035247802734375, 0.04150390625, 0.0794830322265625, 0.117462158203125, 0.1554412841796875, 0.19342041015625, 0.2313995361328125, 0.269378662109375, 0.3073577880859375, 0.3453369140625, 0.3833160400390625, 0.421295166015625, 0.4592742919921875, 0.49725341796875, 0.5352325439453125, 0.573211669921875, 0.6111907958984375, 0.649169921875, 0.6871490478515625, 0.725128173828125, 0.7631072998046875, 0.80108642578125, 0.8390655517578125, 0.877044677734375, 0.9150238037109375, 0.9530029296875, 0.9909820556640625, 1.028961181640625, 1.0669403076171875, 1.10491943359375, 1.1428985595703125, 1.180877685546875, 1.2188568115234375, 1.2568359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 21.0, 230.0, 561.0, 145.0, 23.0, 8.0, 10.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-101.09318542480469, -99.19454956054688, -97.2959213256836, -95.39728546142578, -93.4986572265625, -91.60002136230469, -89.7013931274414, -87.8027572631836, -85.90412902832031, -84.0054931640625, -82.10686492919922, -80.2082290649414, -78.30960083007812, -76.41096496582031, -74.51233673095703, -72.61370086669922, -70.71507263183594, -68.81643676757812, -66.91780853271484, -65.01917266845703, -63.12054443359375, -61.2219123840332, -59.323280334472656, -57.424644470214844, -55.52600860595703, -53.627376556396484, -51.72874450683594, -49.83011245727539, -47.931480407714844, -46.0328483581543, -44.13421630859375, -42.23558044433594, -40.336952209472656, -38.43832015991211, -36.53968811035156, -34.641056060791016, -32.74242401123047, -30.843791961669922, -28.945158004760742, -27.046525955200195, -25.14789581298828, -23.249263763427734, -21.350631713867188, -19.45199966430664, -17.553367614746094, -15.65473461151123, -13.756101608276367, -11.85746955871582, -9.958837509155273, -8.060205459594727, -6.1615729331970215, -4.262940406799316, -2.3643083572387695, -0.46567630767822266, 1.4329566955566406, 3.3315887451171875, 5.230220794677734, 7.128852844238281, 9.027484893798828, 10.926117897033691, 12.824749946594238, 14.723381996154785, 16.62201499938965, 18.520647048950195, 20.419279098510742]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 3.0, 8.0, 18.0, 22.0, 11.0, 18.0, 17.0, 32.0, 24.0, 34.0, 35.0, 35.0, 40.0, 47.0, 56.0, 54.0, 66.0, 48.0, 51.0, 44.0, 41.0, 28.0, 34.0, 28.0, 32.0, 30.0, 21.0, 21.0, 28.0, 19.0, 11.0, 8.0, 6.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.727006912231445, -15.239923477172852, -14.752840042114258, -14.265755653381348, -13.778672218322754, -13.29158878326416, -12.804505348205566, -12.317420959472656, -11.830337524414062, -11.343254089355469, -10.856170654296875, -10.369086265563965, -9.882002830505371, -9.394919395446777, -8.907835960388184, -8.420751571655273, -7.933668613433838, -7.446585178375244, -6.959501266479492, -6.472417831420898, -5.9853339195251465, -5.498250484466553, -5.011166572570801, -4.524083137512207, -4.036999702453613, -3.5499160289764404, -3.0628323554992676, -2.575748920440674, -2.088665008544922, -1.6015815734863281, -1.1144979000091553, -0.6274142265319824, -0.14033031463623047, 0.34675332903862, 0.8338369727134705, 1.3209205865859985, 1.8080042600631714, 2.2950878143310547, 2.7821714878082275, 3.2692551612854004, 3.7563388347625732, 4.243422508239746, 4.73050594329834, 5.217589855194092, 5.7046732902526855, 6.1917572021484375, 6.678840637207031, 7.165924072265625, 7.653007984161377, 8.140091896057129, 8.627175331115723, 9.114258766174316, 9.60134220123291, 10.08842658996582, 10.575510025024414, 11.062593460083008, 11.549676895141602, 12.036760330200195, 12.523843765258789, 13.0109281539917, 13.498011589050293, 13.985095024108887, 14.47217845916748, 14.95926284790039, 15.446346282958984]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 19.0, 36.0, 51.0, 87.0, 179.0, 413.0, 1385.0, 6620.0, 79166.0, 4022893.0, 75163.0, 5772.0, 1374.0, 500.0, 220.0, 129.0, 72.0, 42.0, 39.0, 20.0, 16.0, 12.0, 12.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.412109375, -3.32989501953125, -3.2476806640625, -3.16546630859375, -3.083251953125, -3.00103759765625, -2.9188232421875, -2.83660888671875, -2.75439453125, -2.67218017578125, -2.5899658203125, -2.50775146484375, -2.425537109375, -2.34332275390625, -2.2611083984375, -2.17889404296875, -2.0966796875, -2.01446533203125, -1.9322509765625, -1.85003662109375, -1.767822265625, -1.68560791015625, -1.6033935546875, -1.52117919921875, -1.43896484375, -1.35675048828125, -1.2745361328125, -1.19232177734375, -1.110107421875, -1.02789306640625, -0.9456787109375, -0.86346435546875, -0.78125, -0.69903564453125, -0.6168212890625, -0.53460693359375, -0.452392578125, -0.37017822265625, -0.2879638671875, -0.20574951171875, -0.12353515625, -0.04132080078125, 0.0408935546875, 0.12310791015625, 0.205322265625, 0.28753662109375, 0.3697509765625, 0.45196533203125, 0.5341796875, 0.61639404296875, 0.6986083984375, 0.78082275390625, 0.863037109375, 0.94525146484375, 1.0274658203125, 1.10968017578125, 1.19189453125, 1.27410888671875, 1.3563232421875, 1.43853759765625, 1.520751953125, 1.60296630859375, 1.6851806640625, 1.76739501953125, 1.849609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 9.0, 15.0, 15.0, 18.0, 33.0, 44.0, 46.0, 60.0, 67.0, 76.0, 70.0, 81.0, 84.0, 88.0, 68.0, 62.0, 35.0, 34.0, 27.0, 21.0, 9.0, 12.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8896484375, -0.847930908203125, -0.80621337890625, -0.764495849609375, -0.7227783203125, -0.681060791015625, -0.63934326171875, -0.597625732421875, -0.555908203125, -0.514190673828125, -0.47247314453125, -0.430755615234375, -0.3890380859375, -0.347320556640625, -0.30560302734375, -0.263885498046875, -0.22216796875, -0.180450439453125, -0.13873291015625, -0.097015380859375, -0.0552978515625, -0.013580322265625, 0.02813720703125, 0.069854736328125, 0.111572265625, 0.153289794921875, 0.19500732421875, 0.236724853515625, 0.2784423828125, 0.320159912109375, 0.36187744140625, 0.403594970703125, 0.4453125, 0.487030029296875, 0.52874755859375, 0.570465087890625, 0.6121826171875, 0.653900146484375, 0.69561767578125, 0.737335205078125, 0.779052734375, 0.820770263671875, 0.86248779296875, 0.904205322265625, 0.9459228515625, 0.987640380859375, 1.02935791015625, 1.071075439453125, 1.11279296875, 1.154510498046875, 1.19622802734375, 1.237945556640625, 1.2796630859375, 1.321380615234375, 1.36309814453125, 1.404815673828125, 1.446533203125, 1.488250732421875, 1.52996826171875, 1.571685791015625, 1.6134033203125, 1.655120849609375, 1.69683837890625, 1.738555908203125, 1.7802734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 13.0, 19.0, 44.0, 102.0, 165.0, 414.0, 1618.0, 12416.0, 1715599.0, 2449847.0, 11654.0, 1506.0, 418.0, 215.0, 112.0, 60.0, 38.0, 18.0, 15.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.29595947265625, -3.1739501953125, -3.05194091796875, -2.929931640625, -2.80792236328125, -2.6859130859375, -2.56390380859375, -2.44189453125, -2.31988525390625, -2.1978759765625, -2.07586669921875, -1.953857421875, -1.83184814453125, -1.7098388671875, -1.58782958984375, -1.4658203125, -1.34381103515625, -1.2218017578125, -1.09979248046875, -0.977783203125, -0.85577392578125, -0.7337646484375, -0.61175537109375, -0.48974609375, -0.36773681640625, -0.2457275390625, -0.12371826171875, -0.001708984375, 0.12030029296875, 0.2423095703125, 0.36431884765625, 0.486328125, 0.60833740234375, 0.7303466796875, 0.85235595703125, 0.974365234375, 1.09637451171875, 1.2183837890625, 1.34039306640625, 1.46240234375, 1.58441162109375, 1.7064208984375, 1.82843017578125, 1.950439453125, 2.07244873046875, 2.1944580078125, 2.31646728515625, 2.4384765625, 2.56048583984375, 2.6824951171875, 2.80450439453125, 2.926513671875, 3.04852294921875, 3.1705322265625, 3.29254150390625, 3.41455078125, 3.53656005859375, 3.6585693359375, 3.78057861328125, 3.902587890625, 4.02459716796875, 4.1466064453125, 4.26861572265625, 4.390625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 4.0, 8.0, 8.0, 10.0, 13.0, 24.0, 45.0, 60.0, 181.0, 851.0, 1971.0, 612.0, 156.0, 59.0, 34.0, 17.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.283203125, -2.19342041015625, -2.1036376953125, -2.01385498046875, -1.924072265625, -1.83428955078125, -1.7445068359375, -1.65472412109375, -1.56494140625, -1.47515869140625, -1.3853759765625, -1.29559326171875, -1.205810546875, -1.11602783203125, -1.0262451171875, -0.93646240234375, -0.8466796875, -0.75689697265625, -0.6671142578125, -0.57733154296875, -0.487548828125, -0.39776611328125, -0.3079833984375, -0.21820068359375, -0.12841796875, -0.03863525390625, 0.0511474609375, 0.14093017578125, 0.230712890625, 0.32049560546875, 0.4102783203125, 0.50006103515625, 0.58984375, 0.67962646484375, 0.7694091796875, 0.85919189453125, 0.948974609375, 1.03875732421875, 1.1285400390625, 1.21832275390625, 1.30810546875, 1.39788818359375, 1.4876708984375, 1.57745361328125, 1.667236328125, 1.75701904296875, 1.8468017578125, 1.93658447265625, 2.0263671875, 2.11614990234375, 2.2059326171875, 2.29571533203125, 2.385498046875, 2.47528076171875, 2.5650634765625, 2.65484619140625, 2.74462890625, 2.83441162109375, 2.9241943359375, 3.01397705078125, 3.103759765625, 3.19354248046875, 3.2833251953125, 3.37310791015625, 3.462890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 10.0, 33.0, 105.0, 238.0, 272.0, 160.0, 85.0, 30.0, 24.0, 9.0, 12.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.11816120147705, -12.63796615600586, -12.157770156860352, -11.67757511138916, -11.197380065917969, -10.717184066772461, -10.23698902130127, -9.756793975830078, -9.27659797668457, -8.796402931213379, -8.316206932067871, -7.83601188659668, -7.35581636428833, -6.8756208419799805, -6.395425796508789, -5.9152302742004395, -5.43503475189209, -4.95483922958374, -4.474643707275391, -3.994448661804199, -3.5142531394958496, -3.0340576171875, -2.5538623332977295, -2.073667049407959, -1.5934715270996094, -1.1132761240005493, -0.6330807209014893, -0.1528853178024292, 0.32731008529663086, 0.8075056076049805, 1.287700891494751, 1.7678961753845215, 2.2480926513671875, 2.728288173675537, 3.2084834575653076, 3.688678741455078, 4.168874263763428, 4.649069786071777, 5.129264831542969, 5.609460353851318, 6.089655876159668, 6.569851398468018, 7.050046920776367, 7.530241966247559, 8.01043701171875, 8.490633010864258, 8.97082805633545, 9.45102310180664, 9.931219100952148, 10.41141414642334, 10.891610145568848, 11.371805191040039, 11.852001190185547, 12.332196235656738, 12.81239128112793, 13.292587280273438, 13.772782325744629, 14.25297737121582, 14.733173370361328, 15.21336841583252, 15.693563461303711, 16.17375946044922, 16.653955459594727, 17.1341495513916, 17.61434555053711]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 5.0, 10.0, 8.0, 14.0, 13.0, 24.0, 17.0, 30.0, 27.0, 26.0, 42.0, 44.0, 50.0, 48.0, 62.0, 59.0, 58.0, 59.0, 53.0, 70.0, 50.0, 47.0, 38.0, 28.0, 24.0, 27.0, 14.0, 16.0, 5.0, 6.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.063533782958984, -7.807955265045166, -7.552376747131348, -7.2967987060546875, -7.041220188140869, -6.785641670227051, -6.530063629150391, -6.274485111236572, -6.018906593322754, -5.7633280754089355, -5.507749557495117, -5.252171516418457, -4.996592998504639, -4.74101448059082, -4.48543643951416, -4.229857921600342, -3.9742794036865234, -3.718700885772705, -3.463122606277466, -3.2075443267822266, -2.951965808868408, -2.69638729095459, -2.4408090114593506, -2.1852307319641113, -1.929652214050293, -1.6740738153457642, -1.4184954166412354, -1.1629170179367065, -0.9073386192321777, -0.6517602205276489, -0.3961818218231201, -0.1406034231185913, 0.1149740219116211, 0.3705524206161499, 0.6261308193206787, 0.8817092180252075, 1.1372876167297363, 1.3928660154342651, 1.648444414138794, 1.9040228128433228, 2.1596012115478516, 2.41517972946167, 2.670758008956909, 2.9263362884521484, 3.181914806365967, 3.437493324279785, 3.6930716037750244, 3.9486498832702637, 4.204228401184082, 4.4598069190979, 4.715385437011719, 4.970963478088379, 5.226541996002197, 5.482120513916016, 5.737698554992676, 5.993277072906494, 6.2488555908203125, 6.504434108734131, 6.760012626647949, 7.015590667724609, 7.271169185638428, 7.526747703552246, 7.782325744628906, 8.037904739379883, 8.293482780456543]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 6.0, 20.0, 29.0, 49.0, 60.0, 98.0, 170.0, 331.0, 548.0, 1008.0, 2010.0, 4301.0, 9109.0, 21604.0, 53445.0, 143826.0, 334642.0, 288602.0, 113434.0, 42865.0, 17406.0, 7700.0, 3463.0, 1763.0, 883.0, 485.0, 254.0, 150.0, 82.0, 71.0, 57.0, 19.0, 17.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96875, -0.9340057373046875, -0.899261474609375, -0.8645172119140625, -0.82977294921875, -0.7950286865234375, -0.760284423828125, -0.7255401611328125, -0.6907958984375, -0.6560516357421875, -0.621307373046875, -0.5865631103515625, -0.55181884765625, -0.5170745849609375, -0.482330322265625, -0.4475860595703125, -0.412841796875, -0.3780975341796875, -0.343353271484375, -0.3086090087890625, -0.27386474609375, -0.2391204833984375, -0.204376220703125, -0.1696319580078125, -0.1348876953125, -0.1001434326171875, -0.065399169921875, -0.0306549072265625, 0.00408935546875, 0.0388336181640625, 0.073577880859375, 0.1083221435546875, 0.14306640625, 0.1778106689453125, 0.212554931640625, 0.2472991943359375, 0.28204345703125, 0.3167877197265625, 0.351531982421875, 0.3862762451171875, 0.4210205078125, 0.4557647705078125, 0.490509033203125, 0.5252532958984375, 0.55999755859375, 0.5947418212890625, 0.629486083984375, 0.6642303466796875, 0.698974609375, 0.7337188720703125, 0.768463134765625, 0.8032073974609375, 0.83795166015625, 0.8726959228515625, 0.907440185546875, 0.9421844482421875, 0.9769287109375, 1.0116729736328125, 1.046417236328125, 1.0811614990234375, 1.11590576171875, 1.1506500244140625, 1.185394287109375, 1.2201385498046875, 1.2548828125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 8.0, 4.0, 15.0, 6.0, 12.0, 13.0, 16.0, 14.0, 15.0, 29.0, 25.0, 36.0, 33.0, 42.0, 48.0, 46.0, 46.0, 40.0, 45.0, 34.0, 48.0, 60.0, 49.0, 56.0, 38.0, 27.0, 33.0, 27.0, 34.0, 17.0, 9.0, 14.0, 17.0, 8.0, 15.0, 2.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66796875, -0.6422576904296875, -0.616546630859375, -0.5908355712890625, -0.56512451171875, -0.5394134521484375, -0.513702392578125, -0.4879913330078125, -0.4622802734375, -0.4365692138671875, -0.410858154296875, -0.3851470947265625, -0.35943603515625, -0.3337249755859375, -0.308013916015625, -0.2823028564453125, -0.256591796875, -0.2308807373046875, -0.205169677734375, -0.1794586181640625, -0.15374755859375, -0.1280364990234375, -0.102325439453125, -0.0766143798828125, -0.0509033203125, -0.0251922607421875, 0.000518798828125, 0.0262298583984375, 0.05194091796875, 0.0776519775390625, 0.103363037109375, 0.1290740966796875, 0.15478515625, 0.1804962158203125, 0.206207275390625, 0.2319183349609375, 0.25762939453125, 0.2833404541015625, 0.309051513671875, 0.3347625732421875, 0.3604736328125, 0.3861846923828125, 0.411895751953125, 0.4376068115234375, 0.46331787109375, 0.4890289306640625, 0.514739990234375, 0.5404510498046875, 0.566162109375, 0.5918731689453125, 0.617584228515625, 0.6432952880859375, 0.66900634765625, 0.6947174072265625, 0.720428466796875, 0.7461395263671875, 0.7718505859375, 0.7975616455078125, 0.823272705078125, 0.8489837646484375, 0.87469482421875, 0.9004058837890625, 0.926116943359375, 0.9518280029296875, 0.9775390625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 16.0, 18.0, 24.0, 39.0, 70.0, 95.0, 131.0, 243.0, 399.0, 853.0, 2248.0, 9028.0, 80321.0, 789538.0, 146809.0, 13571.0, 2859.0, 1005.0, 481.0, 273.0, 161.0, 103.0, 60.0, 50.0, 34.0, 26.0, 22.0, 16.0, 9.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.62109375, -3.524810791015625, -3.42852783203125, -3.332244873046875, -3.2359619140625, -3.139678955078125, -3.04339599609375, -2.947113037109375, -2.850830078125, -2.754547119140625, -2.65826416015625, -2.561981201171875, -2.4656982421875, -2.369415283203125, -2.27313232421875, -2.176849365234375, -2.08056640625, -1.984283447265625, -1.88800048828125, -1.791717529296875, -1.6954345703125, -1.599151611328125, -1.50286865234375, -1.406585693359375, -1.310302734375, -1.214019775390625, -1.11773681640625, -1.021453857421875, -0.9251708984375, -0.828887939453125, -0.73260498046875, -0.636322021484375, -0.5400390625, -0.443756103515625, -0.34747314453125, -0.251190185546875, -0.1549072265625, -0.058624267578125, 0.03765869140625, 0.133941650390625, 0.230224609375, 0.326507568359375, 0.42279052734375, 0.519073486328125, 0.6153564453125, 0.711639404296875, 0.80792236328125, 0.904205322265625, 1.00048828125, 1.096771240234375, 1.19305419921875, 1.289337158203125, 1.3856201171875, 1.481903076171875, 1.57818603515625, 1.674468994140625, 1.770751953125, 1.867034912109375, 1.96331787109375, 2.059600830078125, 2.1558837890625, 2.252166748046875, 2.34844970703125, 2.444732666015625, 2.541015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 13.0, 12.0, 16.0, 26.0, 34.0, 54.0, 40.0, 68.0, 53.0, 76.0, 81.0, 93.0, 79.0, 65.0, 51.0, 55.0, 44.0, 43.0, 23.0, 19.0, 15.0, 6.0, 7.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.5625, -6.40203857421875, -6.2415771484375, -6.08111572265625, -5.920654296875, -5.76019287109375, -5.5997314453125, -5.43927001953125, -5.27880859375, -5.11834716796875, -4.9578857421875, -4.79742431640625, -4.636962890625, -4.47650146484375, -4.3160400390625, -4.15557861328125, -3.9951171875, -3.83465576171875, -3.6741943359375, -3.51373291015625, -3.353271484375, -3.19281005859375, -3.0323486328125, -2.87188720703125, -2.71142578125, -2.55096435546875, -2.3905029296875, -2.23004150390625, -2.069580078125, -1.90911865234375, -1.7486572265625, -1.58819580078125, -1.427734375, -1.26727294921875, -1.1068115234375, -0.94635009765625, -0.785888671875, -0.62542724609375, -0.4649658203125, -0.30450439453125, -0.14404296875, 0.01641845703125, 0.1768798828125, 0.33734130859375, 0.497802734375, 0.65826416015625, 0.8187255859375, 0.97918701171875, 1.1396484375, 1.30010986328125, 1.4605712890625, 1.62103271484375, 1.781494140625, 1.94195556640625, 2.1024169921875, 2.26287841796875, 2.42333984375, 2.58380126953125, 2.7442626953125, 2.90472412109375, 3.065185546875, 3.22564697265625, 3.3861083984375, 3.54656982421875, 3.70703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 1.0, 6.0, 17.0, 19.0, 44.0, 62.0, 104.0, 231.0, 492.0, 1541.0, 8684.0, 251693.0, 766552.0, 15680.0, 2248.0, 617.0, 276.0, 119.0, 70.0, 32.0, 24.0, 14.0, 6.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -2.0039520263671875, -1.943450927734375, -1.8829498291015625, -1.82244873046875, -1.7619476318359375, -1.701446533203125, -1.6409454345703125, -1.5804443359375, -1.5199432373046875, -1.459442138671875, -1.3989410400390625, -1.33843994140625, -1.2779388427734375, -1.217437744140625, -1.1569366455078125, -1.096435546875, -1.0359344482421875, -0.975433349609375, -0.9149322509765625, -0.85443115234375, -0.7939300537109375, -0.733428955078125, -0.6729278564453125, -0.6124267578125, -0.5519256591796875, -0.491424560546875, -0.4309234619140625, -0.37042236328125, -0.3099212646484375, -0.249420166015625, -0.1889190673828125, -0.12841796875, -0.0679168701171875, -0.007415771484375, 0.0530853271484375, 0.11358642578125, 0.1740875244140625, 0.234588623046875, 0.2950897216796875, 0.3555908203125, 0.4160919189453125, 0.476593017578125, 0.5370941162109375, 0.59759521484375, 0.6580963134765625, 0.718597412109375, 0.7790985107421875, 0.839599609375, 0.9001007080078125, 0.960601806640625, 1.0211029052734375, 1.08160400390625, 1.1421051025390625, 1.202606201171875, 1.2631072998046875, 1.3236083984375, 1.3841094970703125, 1.444610595703125, 1.5051116943359375, 1.56561279296875, 1.6261138916015625, 1.686614990234375, 1.7471160888671875, 1.8076171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 9.0, 13.0, 31.0, 70.0, 133.0, 208.0, 244.0, 140.0, 64.0, 47.0, 21.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033402442932128906, -0.00032171234488487244, -0.0003094002604484558, -0.0002970881760120392, -0.00028477609157562256, -0.00027246400713920593, -0.0002601519227027893, -0.0002478398382663727, -0.00023552775382995605, -0.00022321566939353943, -0.0002109035849571228, -0.00019859150052070618, -0.00018627941608428955, -0.00017396733164787292, -0.0001616552472114563, -0.00014934316277503967, -0.00013703107833862305, -0.00012471899390220642, -0.0001124069094657898, -0.00010009482502937317, -8.778274059295654e-05, -7.547065615653992e-05, -6.315857172012329e-05, -5.0846487283706665e-05, -3.853440284729004e-05, -2.6222318410873413e-05, -1.3910233974456787e-05, -1.5981495380401611e-06, 1.0713934898376465e-05, 2.302601933479309e-05, 3.533810377120972e-05, 4.765018820762634e-05, 5.996227264404297e-05, 7.22743570804596e-05, 8.458644151687622e-05, 9.689852595329285e-05, 0.00010921061038970947, 0.0001215226948261261, 0.00013383477926254272, 0.00014614686369895935, 0.00015845894813537598, 0.0001707710325717926, 0.00018308311700820923, 0.00019539520144462585, 0.00020770728588104248, 0.0002200193703174591, 0.00023233145475387573, 0.00024464353919029236, 0.000256955623626709, 0.0002692677080631256, 0.00028157979249954224, 0.00029389187693595886, 0.0003062039613723755, 0.0003185160458087921, 0.00033082813024520874, 0.00034314021468162537, 0.000355452299118042, 0.0003677643835544586, 0.00038007646799087524, 0.00039238855242729187, 0.0004047006368637085, 0.0004170127213001251, 0.00042932480573654175, 0.0004416368901729584, 0.000453948974609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 13.0, 11.0, 17.0, 28.0, 27.0, 42.0, 79.0, 118.0, 161.0, 265.0, 513.0, 1096.0, 2633.0, 9249.0, 52057.0, 595036.0, 341491.0, 34315.0, 6984.0, 2249.0, 931.0, 454.0, 258.0, 148.0, 94.0, 73.0, 40.0, 41.0, 27.0, 15.0, 12.0, 13.0, 9.0, 9.0, 9.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9310302734375, -0.903564453125, -0.8760986328125, -0.8486328125, -0.8211669921875, -0.793701171875, -0.7662353515625, -0.73876953125, -0.7113037109375, -0.683837890625, -0.6563720703125, -0.62890625, -0.6014404296875, -0.573974609375, -0.5465087890625, -0.51904296875, -0.4915771484375, -0.464111328125, -0.4366455078125, -0.4091796875, -0.3817138671875, -0.354248046875, -0.3267822265625, -0.29931640625, -0.2718505859375, -0.244384765625, -0.2169189453125, -0.189453125, -0.1619873046875, -0.134521484375, -0.1070556640625, -0.07958984375, -0.0521240234375, -0.024658203125, 0.0028076171875, 0.0302734375, 0.0577392578125, 0.085205078125, 0.1126708984375, 0.14013671875, 0.1676025390625, 0.195068359375, 0.2225341796875, 0.25, 0.2774658203125, 0.304931640625, 0.3323974609375, 0.35986328125, 0.3873291015625, 0.414794921875, 0.4422607421875, 0.4697265625, 0.4971923828125, 0.524658203125, 0.5521240234375, 0.57958984375, 0.6070556640625, 0.634521484375, 0.6619873046875, 0.689453125, 0.7169189453125, 0.744384765625, 0.7718505859375, 0.79931640625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 4.0, 8.0, 15.0, 12.0, 17.0, 29.0, 41.0, 46.0, 57.0, 64.0, 82.0, 72.0, 87.0, 86.0, 68.0, 56.0, 54.0, 44.0, 38.0, 28.0, 20.0, 8.0, 13.0, 13.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.765625, -0.738555908203125, -0.71148681640625, -0.684417724609375, -0.6573486328125, -0.630279541015625, -0.60321044921875, -0.576141357421875, -0.549072265625, -0.522003173828125, -0.49493408203125, -0.467864990234375, -0.4407958984375, -0.413726806640625, -0.38665771484375, -0.359588623046875, -0.33251953125, -0.305450439453125, -0.27838134765625, -0.251312255859375, -0.2242431640625, -0.197174072265625, -0.17010498046875, -0.143035888671875, -0.115966796875, -0.088897705078125, -0.06182861328125, -0.034759521484375, -0.0076904296875, 0.019378662109375, 0.04644775390625, 0.073516845703125, 0.1005859375, 0.127655029296875, 0.15472412109375, 0.181793212890625, 0.2088623046875, 0.235931396484375, 0.26300048828125, 0.290069580078125, 0.317138671875, 0.344207763671875, 0.37127685546875, 0.398345947265625, 0.4254150390625, 0.452484130859375, 0.47955322265625, 0.506622314453125, 0.53369140625, 0.560760498046875, 0.58782958984375, 0.614898681640625, 0.6419677734375, 0.669036865234375, 0.69610595703125, 0.723175048828125, 0.750244140625, 0.777313232421875, 0.80438232421875, 0.831451416015625, 0.8585205078125, 0.885589599609375, 0.91265869140625, 0.939727783203125, 0.966796875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 25.0, 71.0, 310.0, 467.0, 104.0, 9.0, 11.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.674224853515625, -58.15066909790039, -56.62711715698242, -55.10356140136719, -53.58000946044922, -52.056453704833984, -50.53289794921875, -49.00934600830078, -47.48579025268555, -45.96223449707031, -44.438682556152344, -42.91512680053711, -41.391571044921875, -39.868019104003906, -38.34446334838867, -36.82090759277344, -35.29735565185547, -33.773799896240234, -32.250247955322266, -30.72669219970703, -29.20313835144043, -27.679584503173828, -26.156028747558594, -24.632474899291992, -23.10892105102539, -21.58536720275879, -20.061813354492188, -18.538257598876953, -17.01470375061035, -15.49114990234375, -13.967595100402832, -12.444040298461914, -10.920482635498047, -9.396928787231445, -7.873373985290527, -6.349819660186768, -4.826265335083008, -3.302711009979248, -1.7791566848754883, -0.2556018829345703, 1.2679519653320312, 2.791506290435791, 4.315060615539551, 5.8386149406433105, 7.36216926574707, 8.885723114013672, 10.40927791595459, 11.932832717895508, 13.45638656616211, 14.979940414428711, 16.503494262695312, 18.027050018310547, 19.55060386657715, 21.07415771484375, 22.597713470458984, 24.121267318725586, 25.644821166992188, 27.16837501525879, 28.69192886352539, 30.215484619140625, 31.739038467407227, 33.26259231567383, 34.78614807128906, 36.30970001220703, 37.833255767822266]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 5.0, 12.0, 13.0, 14.0, 20.0, 20.0, 29.0, 29.0, 37.0, 49.0, 65.0, 55.0, 65.0, 66.0, 76.0, 65.0, 60.0, 44.0, 34.0, 46.0, 31.0, 30.0, 29.0, 20.0, 15.0, 10.0, 18.0, 15.0, 4.0, 3.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.69677734375, -13.10966682434082, -12.522557258605957, -11.935446739196777, -11.348337173461914, -10.761226654052734, -10.174116134643555, -9.587005615234375, -8.999896049499512, -8.412785530090332, -7.825675964355469, -7.238565444946289, -6.651455402374268, -6.064345359802246, -5.477234840393066, -4.890124797821045, -4.303014755249023, -3.715904712677002, -3.1287944316864014, -2.541684150695801, -1.9545741081237793, -1.3674640655517578, -0.7803537845611572, -0.19324350357055664, 0.39386653900146484, 0.9809767007827759, 1.568086862564087, 2.1551971435546875, 2.742307186126709, 3.3294172286987305, 3.916527509689331, 4.503637790679932, 5.090749740600586, 5.677859783172607, 6.264969825744629, 6.852080345153809, 7.43919038772583, 8.026300430297852, 8.613410949707031, 9.200521469116211, 9.787631034851074, 10.374741554260254, 10.961851119995117, 11.548961639404297, 12.136072158813477, 12.72318172454834, 13.31029224395752, 13.897401809692383, 14.484512329101562, 15.071622848510742, 15.658732414245605, 16.24584197998047, 16.83295249938965, 17.420063018798828, 18.007173538208008, 18.594284057617188, 19.181392669677734, 19.768503189086914, 20.355613708496094, 20.94272232055664, 21.52983283996582, 22.116943359375, 22.70405387878418, 23.29116439819336, 23.87827491760254]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 7.0, 19.0, 43.0, 74.0, 84.0, 154.0, 288.0, 501.0, 992.0, 2029.0, 4975.0, 14202.0, 50340.0, 423179.0, 2995062.0, 617424.0, 61539.0, 13585.0, 4993.0, 2175.0, 1099.0, 600.0, 366.0, 185.0, 102.0, 87.0, 53.0, 29.0, 20.0, 16.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.747161865234375, -0.71405029296875, -0.680938720703125, -0.6478271484375, -0.614715576171875, -0.58160400390625, -0.548492431640625, -0.515380859375, -0.482269287109375, -0.44915771484375, -0.416046142578125, -0.3829345703125, -0.349822998046875, -0.31671142578125, -0.283599853515625, -0.25048828125, -0.217376708984375, -0.18426513671875, -0.151153564453125, -0.1180419921875, -0.084930419921875, -0.05181884765625, -0.018707275390625, 0.014404296875, 0.047515869140625, 0.08062744140625, 0.113739013671875, 0.1468505859375, 0.179962158203125, 0.21307373046875, 0.246185302734375, 0.279296875, 0.312408447265625, 0.34552001953125, 0.378631591796875, 0.4117431640625, 0.444854736328125, 0.47796630859375, 0.511077880859375, 0.544189453125, 0.577301025390625, 0.61041259765625, 0.643524169921875, 0.6766357421875, 0.709747314453125, 0.74285888671875, 0.775970458984375, 0.80908203125, 0.842193603515625, 0.87530517578125, 0.908416748046875, 0.9415283203125, 0.974639892578125, 1.00775146484375, 1.040863037109375, 1.073974609375, 1.107086181640625, 1.14019775390625, 1.173309326171875, 1.2064208984375, 1.239532470703125, 1.27264404296875, 1.305755615234375, 1.3388671875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 14.0, 15.0, 17.0, 18.0, 30.0, 24.0, 28.0, 41.0, 48.0, 41.0, 49.0, 63.0, 57.0, 68.0, 41.0, 64.0, 54.0, 53.0, 40.0, 39.0, 35.0, 31.0, 18.0, 19.0, 14.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.60888671875, -0.5812759399414062, -0.5536651611328125, -0.5260543823242188, -0.498443603515625, -0.47083282470703125, -0.4432220458984375, -0.41561126708984375, -0.38800048828125, -0.36038970947265625, -0.3327789306640625, -0.30516815185546875, -0.277557373046875, -0.24994659423828125, -0.2223358154296875, -0.19472503662109375, -0.1671142578125, -0.13950347900390625, -0.1118927001953125, -0.08428192138671875, -0.056671142578125, -0.02906036376953125, -0.0014495849609375, 0.02616119384765625, 0.05377197265625, 0.08138275146484375, 0.1089935302734375, 0.13660430908203125, 0.164215087890625, 0.19182586669921875, 0.2194366455078125, 0.24704742431640625, 0.274658203125, 0.30226898193359375, 0.3298797607421875, 0.35749053955078125, 0.385101318359375, 0.41271209716796875, 0.4403228759765625, 0.46793365478515625, 0.49554443359375, 0.5231552124023438, 0.5507659912109375, 0.5783767700195312, 0.605987548828125, 0.6335983276367188, 0.6612091064453125, 0.6888198852539062, 0.7164306640625, 0.7440414428710938, 0.7716522216796875, 0.7992630004882812, 0.826873779296875, 0.8544845581054688, 0.8820953369140625, 0.9097061157226562, 0.93731689453125, 0.9649276733398438, 0.9925384521484375, 1.0201492309570312, 1.047760009765625, 1.0753707885742188, 1.1029815673828125, 1.1305923461914062, 1.158203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 22.0, 35.0, 43.0, 57.0, 124.0, 237.0, 514.0, 1250.0, 5052.0, 31882.0, 948313.0, 3146846.0, 49956.0, 7245.0, 1637.0, 533.0, 212.0, 107.0, 45.0, 35.0, 34.0, 25.0, 16.0, 10.0, 12.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7578125, -2.687286376953125, -2.61676025390625, -2.546234130859375, -2.4757080078125, -2.405181884765625, -2.33465576171875, -2.264129638671875, -2.193603515625, -2.123077392578125, -2.05255126953125, -1.982025146484375, -1.9114990234375, -1.840972900390625, -1.77044677734375, -1.699920654296875, -1.62939453125, -1.558868408203125, -1.48834228515625, -1.417816162109375, -1.3472900390625, -1.276763916015625, -1.20623779296875, -1.135711669921875, -1.065185546875, -0.994659423828125, -0.92413330078125, -0.853607177734375, -0.7830810546875, -0.712554931640625, -0.64202880859375, -0.571502685546875, -0.5009765625, -0.430450439453125, -0.35992431640625, -0.289398193359375, -0.2188720703125, -0.148345947265625, -0.07781982421875, -0.007293701171875, 0.063232421875, 0.133758544921875, 0.20428466796875, 0.274810791015625, 0.3453369140625, 0.415863037109375, 0.48638916015625, 0.556915283203125, 0.62744140625, 0.697967529296875, 0.76849365234375, 0.839019775390625, 0.9095458984375, 0.980072021484375, 1.05059814453125, 1.121124267578125, 1.191650390625, 1.262176513671875, 1.33270263671875, 1.403228759765625, 1.4737548828125, 1.544281005859375, 1.61480712890625, 1.685333251953125, 1.755859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 10.0, 4.0, 8.0, 12.0, 15.0, 27.0, 27.0, 36.0, 59.0, 101.0, 157.0, 317.0, 712.0, 1028.0, 753.0, 350.0, 157.0, 88.0, 44.0, 43.0, 18.0, 18.0, 13.0, 11.0, 15.0, 8.0, 6.0, 5.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.16796875, -2.1130828857421875, -2.058197021484375, -2.0033111572265625, -1.94842529296875, -1.8935394287109375, -1.838653564453125, -1.7837677001953125, -1.7288818359375, -1.6739959716796875, -1.619110107421875, -1.5642242431640625, -1.50933837890625, -1.4544525146484375, -1.399566650390625, -1.3446807861328125, -1.289794921875, -1.2349090576171875, -1.180023193359375, -1.1251373291015625, -1.07025146484375, -1.0153656005859375, -0.960479736328125, -0.9055938720703125, -0.8507080078125, -0.7958221435546875, -0.740936279296875, -0.6860504150390625, -0.63116455078125, -0.5762786865234375, -0.521392822265625, -0.4665069580078125, -0.41162109375, -0.3567352294921875, -0.301849365234375, -0.2469635009765625, -0.19207763671875, -0.1371917724609375, -0.082305908203125, -0.0274200439453125, 0.0274658203125, 0.0823516845703125, 0.137237548828125, 0.1921234130859375, 0.24700927734375, 0.3018951416015625, 0.356781005859375, 0.4116668701171875, 0.466552734375, 0.5214385986328125, 0.576324462890625, 0.6312103271484375, 0.68609619140625, 0.7409820556640625, 0.795867919921875, 0.8507537841796875, 0.9056396484375, 0.9605255126953125, 1.015411376953125, 1.0702972412109375, 1.12518310546875, 1.1800689697265625, 1.234954833984375, 1.2898406982421875, 1.3447265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 16.0, 56.0, 116.0, 241.0, 269.0, 175.0, 63.0, 18.0, 12.0, 7.0, 7.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4849853515625, -19.87091636657715, -19.256847381591797, -18.642778396606445, -18.028709411621094, -17.414640426635742, -16.80057144165039, -16.18650245666504, -15.572433471679688, -14.958364486694336, -14.344295501708984, -13.730226516723633, -13.116157531738281, -12.50208854675293, -11.888019561767578, -11.273950576782227, -10.659881591796875, -10.045812606811523, -9.431743621826172, -8.81767463684082, -8.203605651855469, -7.589536666870117, -6.975467681884766, -6.361398696899414, -5.7473297119140625, -5.133260726928711, -4.519191741943359, -3.905122756958008, -3.2910537719726562, -2.6769847869873047, -2.062915802001953, -1.4488468170166016, -0.8347797393798828, -0.22071075439453125, 0.3933582305908203, 1.0074272155761719, 1.6214962005615234, 2.235565185546875, 2.8496341705322266, 3.463703155517578, 4.07777214050293, 4.691841125488281, 5.305910110473633, 5.919979095458984, 6.534048080444336, 7.1481170654296875, 7.762186050415039, 8.37625503540039, 8.990324020385742, 9.604393005371094, 10.218461990356445, 10.832530975341797, 11.446599960327148, 12.0606689453125, 12.674737930297852, 13.288806915283203, 13.902875900268555, 14.516944885253906, 15.131013870239258, 15.74508285522461, 16.35915184020996, 16.973220825195312, 17.587289810180664, 18.201358795166016, 18.815427780151367]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 19.0, 11.0, 5.0, 19.0, 14.0, 24.0, 23.0, 23.0, 22.0, 31.0, 40.0, 39.0, 37.0, 61.0, 47.0, 59.0, 46.0, 47.0, 58.0, 47.0, 65.0, 40.0, 43.0, 31.0, 28.0, 20.0, 22.0, 14.0, 15.0, 10.0, 6.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.67354965209961, -8.42505931854248, -8.176568031311035, -7.928077220916748, -7.679586410522461, -7.431096076965332, -7.182604789733887, -6.934114456176758, -6.685623645782471, -6.437132835388184, -6.1886420249938965, -5.940151214599609, -5.691660404205322, -5.443169593811035, -5.194679260253906, -4.946188449859619, -4.697697639465332, -4.449206829071045, -4.200716018676758, -3.9522252082824707, -3.7037346363067627, -3.4552438259124756, -3.2067530155181885, -2.9582624435424805, -2.709771156311035, -2.461280345916748, -2.212789535522461, -1.9642988443374634, -1.7158081531524658, -1.4673173427581787, -1.2188265323638916, -0.970335841178894, -0.7218451499938965, -0.47335439920425415, -0.22486361861228943, 0.023627161979675293, 0.2721179127693176, 0.52060866355896, 0.7690994739532471, 1.0175901651382446, 1.2660809755325317, 1.5145717859268188, 1.7630624771118164, 2.0115532875061035, 2.2600440979003906, 2.5085349082946777, 2.757025718688965, 3.005516290664673, 3.25400710105896, 3.502497911453247, 3.750988721847534, 3.999479293823242, 4.247970104217529, 4.496460914611816, 4.7449517250061035, 4.993442535400391, 5.241933345794678, 5.490424156188965, 5.738914966583252, 5.987405776977539, 6.235896587371826, 6.484387397766113, 6.732877731323242, 6.981368541717529, 7.229859352111816]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 20.0, 26.0, 40.0, 62.0, 86.0, 160.0, 266.0, 414.0, 659.0, 1326.0, 2510.0, 5295.0, 11824.0, 29277.0, 75233.0, 192931.0, 340281.0, 231265.0, 93445.0, 36044.0, 14661.0, 6303.0, 2845.0, 1547.0, 811.0, 493.0, 276.0, 169.0, 89.0, 59.0, 44.0, 26.0, 27.0, 8.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89306640625, -0.8629074096679688, -0.8327484130859375, -0.8025894165039062, -0.772430419921875, -0.7422714233398438, -0.7121124267578125, -0.6819534301757812, -0.65179443359375, -0.6216354370117188, -0.5914764404296875, -0.5613174438476562, -0.531158447265625, -0.5009994506835938, -0.4708404541015625, -0.44068145751953125, -0.4105224609375, -0.38036346435546875, -0.3502044677734375, -0.32004547119140625, -0.289886474609375, -0.25972747802734375, -0.2295684814453125, -0.19940948486328125, -0.16925048828125, -0.13909149169921875, -0.1089324951171875, -0.07877349853515625, -0.048614501953125, -0.01845550537109375, 0.0117034912109375, 0.04186248779296875, 0.072021484375, 0.10218048095703125, 0.1323394775390625, 0.16249847412109375, 0.192657470703125, 0.22281646728515625, 0.2529754638671875, 0.28313446044921875, 0.31329345703125, 0.34345245361328125, 0.3736114501953125, 0.40377044677734375, 0.433929443359375, 0.46408843994140625, 0.4942474365234375, 0.5244064331054688, 0.5545654296875, 0.5847244262695312, 0.6148834228515625, 0.6450424194335938, 0.675201416015625, 0.7053604125976562, 0.7355194091796875, 0.7656784057617188, 0.79583740234375, 0.8259963989257812, 0.8561553955078125, 0.8863143920898438, 0.916473388671875, 0.9466323852539062, 0.9767913818359375, 1.0069503784179688, 1.037109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 11.0, 4.0, 9.0, 6.0, 15.0, 17.0, 15.0, 20.0, 31.0, 23.0, 38.0, 27.0, 41.0, 62.0, 58.0, 60.0, 54.0, 51.0, 63.0, 57.0, 66.0, 40.0, 43.0, 41.0, 33.0, 25.0, 26.0, 17.0, 17.0, 10.0, 9.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68359375, -0.65625, -0.62890625, -0.6015625, -0.57421875, -0.546875, -0.51953125, -0.4921875, -0.46484375, -0.4375, -0.41015625, -0.3828125, -0.35546875, -0.328125, -0.30078125, -0.2734375, -0.24609375, -0.21875, -0.19140625, -0.1640625, -0.13671875, -0.109375, -0.08203125, -0.0546875, -0.02734375, 0.0, 0.02734375, 0.0546875, 0.08203125, 0.109375, 0.13671875, 0.1640625, 0.19140625, 0.21875, 0.24609375, 0.2734375, 0.30078125, 0.328125, 0.35546875, 0.3828125, 0.41015625, 0.4375, 0.46484375, 0.4921875, 0.51953125, 0.546875, 0.57421875, 0.6015625, 0.62890625, 0.65625, 0.68359375, 0.7109375, 0.73828125, 0.765625, 0.79296875, 0.8203125, 0.84765625, 0.875, 0.90234375, 0.9296875, 0.95703125, 0.984375, 1.01171875, 1.0390625, 1.06640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 0.0, 4.0, 6.0, 11.0, 7.0, 11.0, 24.0, 17.0, 28.0, 46.0, 40.0, 52.0, 63.0, 87.0, 132.0, 159.0, 183.0, 278.0, 398.0, 608.0, 904.0, 1759.0, 4255.0, 15313.0, 91048.0, 660537.0, 228063.0, 31364.0, 7044.0, 2453.0, 1149.0, 703.0, 454.0, 335.0, 237.0, 179.0, 147.0, 93.0, 85.0, 58.0, 40.0, 39.0, 33.0, 28.0, 22.0, 18.0, 10.0, 12.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-1.978515625, -1.9180450439453125, -1.857574462890625, -1.7971038818359375, -1.73663330078125, -1.6761627197265625, -1.615692138671875, -1.5552215576171875, -1.4947509765625, -1.4342803955078125, -1.373809814453125, -1.3133392333984375, -1.25286865234375, -1.1923980712890625, -1.131927490234375, -1.0714569091796875, -1.010986328125, -0.9505157470703125, -0.890045166015625, -0.8295745849609375, -0.76910400390625, -0.7086334228515625, -0.648162841796875, -0.5876922607421875, -0.5272216796875, -0.4667510986328125, -0.406280517578125, -0.3458099365234375, -0.28533935546875, -0.2248687744140625, -0.164398193359375, -0.1039276123046875, -0.04345703125, 0.0170135498046875, 0.077484130859375, 0.1379547119140625, 0.19842529296875, 0.2588958740234375, 0.319366455078125, 0.3798370361328125, 0.4403076171875, 0.5007781982421875, 0.561248779296875, 0.6217193603515625, 0.68218994140625, 0.7426605224609375, 0.803131103515625, 0.8636016845703125, 0.924072265625, 0.9845428466796875, 1.045013427734375, 1.1054840087890625, 1.16595458984375, 1.2264251708984375, 1.286895751953125, 1.3473663330078125, 1.4078369140625, 1.4683074951171875, 1.528778076171875, 1.5892486572265625, 1.64971923828125, 1.7101898193359375, 1.770660400390625, 1.8311309814453125, 1.8916015625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 9.0, 5.0, 8.0, 4.0, 8.0, 12.0, 11.0, 6.0, 19.0, 15.0, 21.0, 23.0, 27.0, 26.0, 51.0, 44.0, 36.0, 41.0, 47.0, 51.0, 61.0, 46.0, 34.0, 44.0, 49.0, 36.0, 43.0, 33.0, 27.0, 25.0, 26.0, 23.0, 12.0, 15.0, 9.0, 18.0, 4.0, 7.0, 12.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.83203125, -2.734161376953125, -2.63629150390625, -2.538421630859375, -2.4405517578125, -2.342681884765625, -2.24481201171875, -2.146942138671875, -2.049072265625, -1.951202392578125, -1.85333251953125, -1.755462646484375, -1.6575927734375, -1.559722900390625, -1.46185302734375, -1.363983154296875, -1.26611328125, -1.168243408203125, -1.07037353515625, -0.972503662109375, -0.8746337890625, -0.776763916015625, -0.67889404296875, -0.581024169921875, -0.483154296875, -0.385284423828125, -0.28741455078125, -0.189544677734375, -0.0916748046875, 0.006195068359375, 0.10406494140625, 0.201934814453125, 0.2998046875, 0.397674560546875, 0.49554443359375, 0.593414306640625, 0.6912841796875, 0.789154052734375, 0.88702392578125, 0.984893798828125, 1.082763671875, 1.180633544921875, 1.27850341796875, 1.376373291015625, 1.4742431640625, 1.572113037109375, 1.66998291015625, 1.767852783203125, 1.86572265625, 1.963592529296875, 2.06146240234375, 2.159332275390625, 2.2572021484375, 2.355072021484375, 2.45294189453125, 2.550811767578125, 2.648681640625, 2.746551513671875, 2.84442138671875, 2.942291259765625, 3.0401611328125, 3.138031005859375, 3.23590087890625, 3.333770751953125, 3.431640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 17.0, 24.0, 29.0, 53.0, 70.0, 151.0, 365.0, 1019.0, 4580.0, 48778.0, 956226.0, 31871.0, 3793.0, 870.0, 302.0, 155.0, 68.0, 52.0, 36.0, 11.0, 16.0, 14.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46484375, -1.416717529296875, -1.36859130859375, -1.320465087890625, -1.2723388671875, -1.224212646484375, -1.17608642578125, -1.127960205078125, -1.079833984375, -1.031707763671875, -0.98358154296875, -0.935455322265625, -0.8873291015625, -0.839202880859375, -0.79107666015625, -0.742950439453125, -0.69482421875, -0.646697998046875, -0.59857177734375, -0.550445556640625, -0.5023193359375, -0.454193115234375, -0.40606689453125, -0.357940673828125, -0.309814453125, -0.261688232421875, -0.21356201171875, -0.165435791015625, -0.1173095703125, -0.069183349609375, -0.02105712890625, 0.027069091796875, 0.0751953125, 0.123321533203125, 0.17144775390625, 0.219573974609375, 0.2677001953125, 0.315826416015625, 0.36395263671875, 0.412078857421875, 0.460205078125, 0.508331298828125, 0.55645751953125, 0.604583740234375, 0.6527099609375, 0.700836181640625, 0.74896240234375, 0.797088623046875, 0.84521484375, 0.893341064453125, 0.94146728515625, 0.989593505859375, 1.0377197265625, 1.085845947265625, 1.13397216796875, 1.182098388671875, 1.230224609375, 1.278350830078125, 1.32647705078125, 1.374603271484375, 1.4227294921875, 1.470855712890625, 1.51898193359375, 1.567108154296875, 1.615234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 5.0, 7.0, 23.0, 20.0, 36.0, 56.0, 109.0, 158.0, 200.0, 124.0, 88.0, 63.0, 30.0, 22.0, 10.0, 8.0, 9.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024127960205078125, -0.00023337453603744507, -0.0002254694700241089, -0.0002175644040107727, -0.00020965933799743652, -0.00020175427198410034, -0.00019384920597076416, -0.00018594413995742798, -0.0001780390739440918, -0.00017013400793075562, -0.00016222894191741943, -0.00015432387590408325, -0.00014641880989074707, -0.0001385137438774109, -0.0001306086778640747, -0.00012270361185073853, -0.00011479854583740234, -0.00010689347982406616, -9.898841381072998e-05, -9.10833477973938e-05, -8.317828178405762e-05, -7.527321577072144e-05, -6.736814975738525e-05, -5.946308374404907e-05, -5.155801773071289e-05, -4.365295171737671e-05, -3.574788570404053e-05, -2.7842819690704346e-05, -1.9937753677368164e-05, -1.2032687664031982e-05, -4.127621650695801e-06, 3.777444362640381e-06, 1.1682510375976562e-05, 1.9587576389312744e-05, 2.7492642402648926e-05, 3.539770841598511e-05, 4.330277442932129e-05, 5.120784044265747e-05, 5.911290645599365e-05, 6.701797246932983e-05, 7.492303848266602e-05, 8.28281044960022e-05, 9.073317050933838e-05, 9.863823652267456e-05, 0.00010654330253601074, 0.00011444836854934692, 0.0001223534345626831, 0.0001302585005760193, 0.00013816356658935547, 0.00014606863260269165, 0.00015397369861602783, 0.00016187876462936401, 0.0001697838306427002, 0.00017768889665603638, 0.00018559396266937256, 0.00019349902868270874, 0.00020140409469604492, 0.0002093091607093811, 0.00021721422672271729, 0.00022511929273605347, 0.00023302435874938965, 0.00024092942476272583, 0.000248834490776062, 0.0002567395567893982, 0.0002646446228027344]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 7.0, 14.0, 21.0, 23.0, 43.0, 60.0, 83.0, 138.0, 339.0, 906.0, 3032.0, 17444.0, 789835.0, 222703.0, 10377.0, 2173.0, 684.0, 299.0, 121.0, 75.0, 51.0, 24.0, 24.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3837890625, -1.3416900634765625, -1.299591064453125, -1.2574920654296875, -1.21539306640625, -1.1732940673828125, -1.131195068359375, -1.0890960693359375, -1.0469970703125, -1.0048980712890625, -0.962799072265625, -0.9207000732421875, -0.87860107421875, -0.8365020751953125, -0.794403076171875, -0.7523040771484375, -0.710205078125, -0.6681060791015625, -0.626007080078125, -0.5839080810546875, -0.54180908203125, -0.4997100830078125, -0.457611083984375, -0.4155120849609375, -0.3734130859375, -0.3313140869140625, -0.289215087890625, -0.2471160888671875, -0.20501708984375, -0.1629180908203125, -0.120819091796875, -0.0787200927734375, -0.03662109375, 0.0054779052734375, 0.047576904296875, 0.0896759033203125, 0.13177490234375, 0.1738739013671875, 0.215972900390625, 0.2580718994140625, 0.3001708984375, 0.3422698974609375, 0.384368896484375, 0.4264678955078125, 0.46856689453125, 0.5106658935546875, 0.552764892578125, 0.5948638916015625, 0.636962890625, 0.6790618896484375, 0.721160888671875, 0.7632598876953125, 0.80535888671875, 0.8474578857421875, 0.889556884765625, 0.9316558837890625, 0.9737548828125, 1.0158538818359375, 1.057952880859375, 1.1000518798828125, 1.14215087890625, 1.1842498779296875, 1.226348876953125, 1.2684478759765625, 1.310546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 8.0, 8.0, 9.0, 16.0, 19.0, 19.0, 26.0, 40.0, 49.0, 61.0, 76.0, 94.0, 131.0, 90.0, 83.0, 59.0, 53.0, 38.0, 29.0, 15.0, 17.0, 11.0, 11.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7275390625, -0.705535888671875, -0.68353271484375, -0.661529541015625, -0.6395263671875, -0.617523193359375, -0.59552001953125, -0.573516845703125, -0.551513671875, -0.529510498046875, -0.50750732421875, -0.485504150390625, -0.4635009765625, -0.441497802734375, -0.41949462890625, -0.397491455078125, -0.37548828125, -0.353485107421875, -0.33148193359375, -0.309478759765625, -0.2874755859375, -0.265472412109375, -0.24346923828125, -0.221466064453125, -0.199462890625, -0.177459716796875, -0.15545654296875, -0.133453369140625, -0.1114501953125, -0.089447021484375, -0.06744384765625, -0.045440673828125, -0.0234375, -0.001434326171875, 0.02056884765625, 0.042572021484375, 0.0645751953125, 0.086578369140625, 0.10858154296875, 0.130584716796875, 0.152587890625, 0.174591064453125, 0.19659423828125, 0.218597412109375, 0.2406005859375, 0.262603759765625, 0.28460693359375, 0.306610107421875, 0.32861328125, 0.350616455078125, 0.37261962890625, 0.394622802734375, 0.4166259765625, 0.438629150390625, 0.46063232421875, 0.482635498046875, 0.504638671875, 0.526641845703125, 0.54864501953125, 0.570648193359375, 0.5926513671875, 0.614654541015625, 0.63665771484375, 0.658660888671875, 0.6806640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 13.0, 9.0, 40.0, 83.0, 142.0, 272.0, 244.0, 95.0, 55.0, 23.0, 12.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.1849308013916, -23.5288028717041, -22.8726749420166, -22.216548919677734, -21.560420989990234, -20.904293060302734, -20.248165130615234, -19.592037200927734, -18.935909271240234, -18.279781341552734, -17.623653411865234, -16.967527389526367, -16.311399459838867, -15.655271530151367, -14.999143600463867, -14.343015670776367, -13.6868896484375, -13.03076171875, -12.374634742736816, -11.718506813049316, -11.062379837036133, -10.406251907348633, -9.750123977661133, -9.093996047973633, -8.43786907196045, -7.781741619110107, -7.125614166259766, -6.469486236572266, -5.813358783721924, -5.157231330871582, -4.501103401184082, -3.8449759483337402, -3.1888465881347656, -2.532719135284424, -1.876591444015503, -1.2204638719558716, -0.5643362998962402, 0.09179115295410156, 0.7479188442230225, 1.4040465354919434, 2.060173988342285, 2.716301441192627, 3.372429132461548, 4.028556823730469, 4.6846842765808105, 5.340811729431152, 5.996939659118652, 6.653067111968994, 7.309194564819336, 7.965322017669678, 8.62144947052002, 9.27757740020752, 9.933704376220703, 10.589832305908203, 11.245960235595703, 11.902088165283203, 12.558215141296387, 13.214343070983887, 13.87047004699707, 14.52659797668457, 15.18272590637207, 15.838852882385254, 16.494979858398438, 17.151107788085938, 17.807235717773438]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 11.0, 22.0, 13.0, 14.0, 21.0, 22.0, 22.0, 20.0, 28.0, 34.0, 19.0, 35.0, 57.0, 55.0, 57.0, 75.0, 77.0, 51.0, 35.0, 38.0, 43.0, 36.0, 24.0, 32.0, 27.0, 16.0, 14.0, 17.0, 17.0, 13.0, 9.0, 12.0, 4.0, 6.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0], "bins": [-16.52168083190918, -16.101119995117188, -15.680558204650879, -15.259997367858887, -14.839435577392578, -14.418874740600586, -13.998313903808594, -13.577753067016602, -13.157191276550293, -12.7366304397583, -12.316068649291992, -11.8955078125, -11.474946975708008, -11.0543851852417, -10.633824348449707, -10.213262557983398, -9.792701721191406, -9.372140884399414, -8.951579093933105, -8.531018257141113, -8.110456466674805, -7.6898956298828125, -7.26933479309082, -6.84877347946167, -6.4282121658325195, -6.007650852203369, -5.587089538574219, -5.166528701782227, -4.745967388153076, -4.325406074523926, -3.9048449993133545, -3.484283924102783, -3.0637216567993164, -2.643160343170166, -2.2225992679595947, -1.8020380735397339, -1.381476879119873, -0.9609155654907227, -0.5403544902801514, -0.11979341506958008, 0.3007678985595703, 0.7213290929794312, 1.141890287399292, 1.5624514818191528, 1.9830126762390137, 2.403573989868164, 2.8241350650787354, 3.2446961402893066, 3.665257453918457, 4.085818767547607, 4.506380081176758, 4.92694091796875, 5.3475022315979, 5.768063545227051, 6.188624382019043, 6.609185695648193, 7.029747009277344, 7.450308322906494, 7.8708696365356445, 8.291430473327637, 8.711992263793945, 9.132553100585938, 9.55311393737793, 9.973674774169922, 10.39423656463623]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 11.0, 14.0, 10.0, 12.0, 27.0, 37.0, 43.0, 56.0, 70.0, 124.0, 182.0, 340.0, 611.0, 1235.0, 2556.0, 6729.0, 23107.0, 123401.0, 867678.0, 2411322.0, 636301.0, 89584.0, 18707.0, 6430.0, 2833.0, 1294.0, 632.0, 349.0, 184.0, 146.0, 66.0, 45.0, 48.0, 28.0, 23.0, 12.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6026763916015625, -0.579864501953125, -0.5570526123046875, -0.53424072265625, -0.5114288330078125, -0.488616943359375, -0.4658050537109375, -0.4429931640625, -0.4201812744140625, -0.397369384765625, -0.3745574951171875, -0.35174560546875, -0.3289337158203125, -0.306121826171875, -0.2833099365234375, -0.260498046875, -0.2376861572265625, -0.214874267578125, -0.1920623779296875, -0.16925048828125, -0.1464385986328125, -0.123626708984375, -0.1008148193359375, -0.0780029296875, -0.0551910400390625, -0.032379150390625, -0.0095672607421875, 0.01324462890625, 0.0360565185546875, 0.058868408203125, 0.0816802978515625, 0.1044921875, 0.1273040771484375, 0.150115966796875, 0.1729278564453125, 0.19573974609375, 0.2185516357421875, 0.241363525390625, 0.2641754150390625, 0.2869873046875, 0.3097991943359375, 0.332611083984375, 0.3554229736328125, 0.37823486328125, 0.4010467529296875, 0.423858642578125, 0.4466705322265625, 0.469482421875, 0.4922943115234375, 0.515106201171875, 0.5379180908203125, 0.56072998046875, 0.5835418701171875, 0.606353759765625, 0.6291656494140625, 0.6519775390625, 0.6747894287109375, 0.697601318359375, 0.7204132080078125, 0.74322509765625, 0.7660369873046875, 0.788848876953125, 0.8116607666015625, 0.83447265625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 7.0, 12.0, 21.0, 26.0, 24.0, 27.0, 36.0, 60.0, 41.0, 63.0, 62.0, 80.0, 73.0, 66.0, 62.0, 59.0, 56.0, 46.0, 38.0, 34.0, 32.0, 23.0, 12.0, 10.0, 8.0, 6.0, 10.0, 6.0, 2.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3820114135742188, -1.3509368896484375, -1.3198623657226562, -1.288787841796875, -1.2577133178710938, -1.2266387939453125, -1.1955642700195312, -1.16448974609375, -1.1334152221679688, -1.1023406982421875, -1.0712661743164062, -1.040191650390625, -1.0091171264648438, -0.9780426025390625, -0.9469680786132812, -0.9158935546875, -0.8848190307617188, -0.8537445068359375, -0.8226699829101562, -0.791595458984375, -0.7605209350585938, -0.7294464111328125, -0.6983718872070312, -0.66729736328125, -0.6362228393554688, -0.6051483154296875, -0.5740737915039062, -0.542999267578125, -0.5119247436523438, -0.4808502197265625, -0.44977569580078125, -0.418701171875, -0.38762664794921875, -0.3565521240234375, -0.32547760009765625, -0.294403076171875, -0.26332855224609375, -0.2322540283203125, -0.20117950439453125, -0.17010498046875, -0.13903045654296875, -0.1079559326171875, -0.07688140869140625, -0.045806884765625, -0.01473236083984375, 0.0163421630859375, 0.04741668701171875, 0.0784912109375, 0.10956573486328125, 0.1406402587890625, 0.17171478271484375, 0.202789306640625, 0.23386383056640625, 0.2649383544921875, 0.29601287841796875, 0.32708740234375, 0.35816192626953125, 0.3892364501953125, 0.42031097412109375, 0.451385498046875, 0.48246002197265625, 0.5135345458984375, 0.5446090698242188, 0.57568359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 4.0, 15.0, 15.0, 20.0, 42.0, 62.0, 112.0, 213.0, 342.0, 678.0, 1551.0, 4548.0, 18603.0, 148192.0, 3584400.0, 390295.0, 33145.0, 7320.0, 2482.0, 1028.0, 524.0, 263.0, 167.0, 74.0, 70.0, 28.0, 21.0, 12.0, 8.0, 5.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.5927734375, -1.5467987060546875, -1.500823974609375, -1.4548492431640625, -1.40887451171875, -1.3628997802734375, -1.316925048828125, -1.2709503173828125, -1.2249755859375, -1.1790008544921875, -1.133026123046875, -1.0870513916015625, -1.04107666015625, -0.9951019287109375, -0.949127197265625, -0.9031524658203125, -0.857177734375, -0.8112030029296875, -0.765228271484375, -0.7192535400390625, -0.67327880859375, -0.6273040771484375, -0.581329345703125, -0.5353546142578125, -0.4893798828125, -0.4434051513671875, -0.397430419921875, -0.3514556884765625, -0.30548095703125, -0.2595062255859375, -0.213531494140625, -0.1675567626953125, -0.12158203125, -0.0756072998046875, -0.029632568359375, 0.0163421630859375, 0.06231689453125, 0.1082916259765625, 0.154266357421875, 0.2002410888671875, 0.2462158203125, 0.2921905517578125, 0.338165283203125, 0.3841400146484375, 0.43011474609375, 0.4760894775390625, 0.522064208984375, 0.5680389404296875, 0.614013671875, 0.6599884033203125, 0.705963134765625, 0.7519378662109375, 0.79791259765625, 0.8438873291015625, 0.889862060546875, 0.9358367919921875, 0.9818115234375, 1.0277862548828125, 1.073760986328125, 1.1197357177734375, 1.16571044921875, 1.2116851806640625, 1.257659912109375, 1.3036346435546875, 1.349609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 2.0, 18.0, 26.0, 61.0, 69.0, 149.0, 355.0, 709.0, 1054.0, 851.0, 361.0, 160.0, 81.0, 44.0, 32.0, 22.0, 16.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.342803955078125, -1.28326416015625, -1.223724365234375, -1.1641845703125, -1.104644775390625, -1.04510498046875, -0.985565185546875, -0.926025390625, -0.866485595703125, -0.80694580078125, -0.747406005859375, -0.6878662109375, -0.628326416015625, -0.56878662109375, -0.509246826171875, -0.44970703125, -0.390167236328125, -0.33062744140625, -0.271087646484375, -0.2115478515625, -0.152008056640625, -0.09246826171875, -0.032928466796875, 0.026611328125, 0.086151123046875, 0.14569091796875, 0.205230712890625, 0.2647705078125, 0.324310302734375, 0.38385009765625, 0.443389892578125, 0.5029296875, 0.562469482421875, 0.62200927734375, 0.681549072265625, 0.7410888671875, 0.800628662109375, 0.86016845703125, 0.919708251953125, 0.979248046875, 1.038787841796875, 1.09832763671875, 1.157867431640625, 1.2174072265625, 1.276947021484375, 1.33648681640625, 1.396026611328125, 1.45556640625, 1.515106201171875, 1.57464599609375, 1.634185791015625, 1.6937255859375, 1.753265380859375, 1.81280517578125, 1.872344970703125, 1.931884765625, 1.991424560546875, 2.05096435546875, 2.110504150390625, 2.1700439453125, 2.229583740234375, 2.28912353515625, 2.348663330078125, 2.408203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 9.0, 17.0, 59.0, 124.0, 255.0, 280.0, 147.0, 59.0, 17.0, 13.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.396169662475586, -11.836724281311035, -11.277278900146484, -10.71783447265625, -10.1583890914917, -9.598943710327148, -9.039499282836914, -8.480053901672363, -7.9206085205078125, -7.361163139343262, -6.801718235015869, -6.242273330688477, -5.682827949523926, -5.123382568359375, -4.563937664031982, -4.00449275970459, -3.445047378540039, -2.8856022357940674, -2.3261570930480957, -1.766711950302124, -1.2072668075561523, -0.6478216648101807, -0.08837652206420898, 0.4710686206817627, 1.0305137634277344, 1.589958906173706, 2.1494040489196777, 2.7088491916656494, 3.268294334411621, 3.8277394771575928, 4.3871846199035645, 4.946629524230957, 5.506076812744141, 6.065522193908691, 6.624967098236084, 7.184412002563477, 7.743857383728027, 8.303302764892578, 8.862747192382812, 9.422192573547363, 9.981637954711914, 10.541083335876465, 11.100528717041016, 11.65997314453125, 12.2194185256958, 12.778863906860352, 13.338308334350586, 13.897753715515137, 14.457199096679688, 15.016644477844238, 15.576089859008789, 16.135534286499023, 16.69498062133789, 17.254425048828125, 17.81386947631836, 18.373315811157227, 18.93276023864746, 19.492204666137695, 20.051651000976562, 20.611095428466797, 21.17053985595703, 21.7299861907959, 22.289430618286133, 22.848876953125, 23.408321380615234]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 5.0, 2.0, 9.0, 14.0, 20.0, 25.0, 33.0, 38.0, 52.0, 59.0, 70.0, 84.0, 85.0, 79.0, 80.0, 69.0, 58.0, 64.0, 35.0, 33.0, 26.0, 15.0, 16.0, 9.0, 5.0, 9.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.438441753387451, -6.079217433929443, -5.7199931144714355, -5.360769271850586, -5.001544952392578, -4.64232063293457, -4.2830963134765625, -3.9238719940185547, -3.564647674560547, -3.205423355102539, -2.8461990356445312, -2.4869749546051025, -2.1277506351470947, -1.768526315689087, -1.4093022346496582, -1.0500779151916504, -0.6908535957336426, -0.33162933588027954, 0.027594923973083496, 0.38681912422180176, 0.7460434436798096, 1.1052677631378174, 1.464491844177246, 1.823716163635254, 2.1829404830932617, 2.5421648025512695, 2.9013891220092773, 3.260613203048706, 3.619837522506714, 3.9790618419647217, 4.33828592300415, 4.697510242462158, 5.056734085083008, 5.415958404541016, 5.775182723999023, 6.134407043457031, 6.493631362915039, 6.852855682373047, 7.2120795249938965, 7.571303844451904, 7.930528163909912, 8.289752006530762, 8.64897632598877, 9.008200645446777, 9.367424964904785, 9.726649284362793, 10.0858736038208, 10.445097923278809, 10.804322242736816, 11.163546562194824, 11.522770881652832, 11.88199520111084, 12.241219520568848, 12.600443840026855, 12.959667205810547, 13.318891525268555, 13.678115844726562, 14.03734016418457, 14.396564483642578, 14.755788803100586, 15.115013122558594, 15.474237442016602, 15.83346176147461, 16.192686080932617, 16.551910400390625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 1.0, 5.0, 13.0, 20.0, 25.0, 40.0, 73.0, 91.0, 181.0, 366.0, 595.0, 1205.0, 2368.0, 5045.0, 11011.0, 26206.0, 63823.0, 157310.0, 320730.0, 264593.0, 114039.0, 45595.0, 19181.0, 8205.0, 3842.0, 1857.0, 951.0, 491.0, 293.0, 186.0, 80.0, 48.0, 25.0, 17.0, 10.0, 9.0, 11.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98974609375, -0.960479736328125, -0.93121337890625, -0.901947021484375, -0.8726806640625, -0.843414306640625, -0.81414794921875, -0.784881591796875, -0.755615234375, -0.726348876953125, -0.69708251953125, -0.667816162109375, -0.6385498046875, -0.609283447265625, -0.58001708984375, -0.550750732421875, -0.521484375, -0.492218017578125, -0.46295166015625, -0.433685302734375, -0.4044189453125, -0.375152587890625, -0.34588623046875, -0.316619873046875, -0.287353515625, -0.258087158203125, -0.22882080078125, -0.199554443359375, -0.1702880859375, -0.141021728515625, -0.11175537109375, -0.082489013671875, -0.05322265625, -0.023956298828125, 0.00531005859375, 0.034576416015625, 0.0638427734375, 0.093109130859375, 0.12237548828125, 0.151641845703125, 0.180908203125, 0.210174560546875, 0.23944091796875, 0.268707275390625, 0.2979736328125, 0.327239990234375, 0.35650634765625, 0.385772705078125, 0.4150390625, 0.444305419921875, 0.47357177734375, 0.502838134765625, 0.5321044921875, 0.561370849609375, 0.59063720703125, 0.619903564453125, 0.649169921875, 0.678436279296875, 0.70770263671875, 0.736968994140625, 0.7662353515625, 0.795501708984375, 0.82476806640625, 0.854034423828125, 0.88330078125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 8.0, 5.0, 10.0, 17.0, 12.0, 13.0, 11.0, 10.0, 21.0, 27.0, 18.0, 26.0, 35.0, 32.0, 38.0, 56.0, 41.0, 37.0, 33.0, 38.0, 39.0, 43.0, 35.0, 40.0, 36.0, 44.0, 36.0, 29.0, 27.0, 27.0, 17.0, 25.0, 21.0, 19.0, 15.0, 16.0, 4.0, 11.0, 9.0, 5.0, 3.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.630859375, -0.6124343872070312, -0.5940093994140625, -0.5755844116210938, -0.557159423828125, -0.5387344360351562, -0.5203094482421875, -0.5018844604492188, -0.48345947265625, -0.46503448486328125, -0.4466094970703125, -0.42818450927734375, -0.409759521484375, -0.39133453369140625, -0.3729095458984375, -0.35448455810546875, -0.3360595703125, -0.31763458251953125, -0.2992095947265625, -0.28078460693359375, -0.262359619140625, -0.24393463134765625, -0.2255096435546875, -0.20708465576171875, -0.18865966796875, -0.17023468017578125, -0.1518096923828125, -0.13338470458984375, -0.114959716796875, -0.09653472900390625, -0.0781097412109375, -0.05968475341796875, -0.041259765625, -0.02283477783203125, -0.0044097900390625, 0.01401519775390625, 0.032440185546875, 0.05086517333984375, 0.0692901611328125, 0.08771514892578125, 0.10614013671875, 0.12456512451171875, 0.1429901123046875, 0.16141510009765625, 0.179840087890625, 0.19826507568359375, 0.2166900634765625, 0.23511505126953125, 0.2535400390625, 0.27196502685546875, 0.2903900146484375, 0.30881500244140625, 0.327239990234375, 0.34566497802734375, 0.3640899658203125, 0.38251495361328125, 0.40093994140625, 0.41936492919921875, 0.4377899169921875, 0.45621490478515625, 0.474639892578125, 0.49306488037109375, 0.5114898681640625, 0.5299148559570312, 0.54833984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 11.0, 24.0, 27.0, 49.0, 48.0, 47.0, 71.0, 113.0, 169.0, 235.0, 297.0, 473.0, 709.0, 1247.0, 2608.0, 8269.0, 42291.0, 324050.0, 589704.0, 60451.0, 10541.0, 3255.0, 1362.0, 770.0, 510.0, 347.0, 228.0, 178.0, 118.0, 92.0, 60.0, 50.0, 47.0, 23.0, 22.0, 17.0, 5.0, 2.0, 8.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.216796875, -2.15362548828125, -2.0904541015625, -2.02728271484375, -1.964111328125, -1.90093994140625, -1.8377685546875, -1.77459716796875, -1.71142578125, -1.64825439453125, -1.5850830078125, -1.52191162109375, -1.458740234375, -1.39556884765625, -1.3323974609375, -1.26922607421875, -1.2060546875, -1.14288330078125, -1.0797119140625, -1.01654052734375, -0.953369140625, -0.89019775390625, -0.8270263671875, -0.76385498046875, -0.70068359375, -0.63751220703125, -0.5743408203125, -0.51116943359375, -0.447998046875, -0.38482666015625, -0.3216552734375, -0.25848388671875, -0.1953125, -0.13214111328125, -0.0689697265625, -0.00579833984375, 0.057373046875, 0.12054443359375, 0.1837158203125, 0.24688720703125, 0.31005859375, 0.37322998046875, 0.4364013671875, 0.49957275390625, 0.562744140625, 0.62591552734375, 0.6890869140625, 0.75225830078125, 0.8154296875, 0.87860107421875, 0.9417724609375, 1.00494384765625, 1.068115234375, 1.13128662109375, 1.1944580078125, 1.25762939453125, 1.32080078125, 1.38397216796875, 1.4471435546875, 1.51031494140625, 1.573486328125, 1.63665771484375, 1.6998291015625, 1.76300048828125, 1.826171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 9.0, 11.0, 14.0, 20.0, 12.0, 22.0, 28.0, 27.0, 26.0, 35.0, 47.0, 47.0, 54.0, 50.0, 53.0, 51.0, 43.0, 54.0, 47.0, 35.0, 45.0, 34.0, 30.0, 29.0, 22.0, 21.0, 15.0, 18.0, 20.0, 12.0, 6.0, 8.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.572265625, -2.49383544921875, -2.4154052734375, -2.33697509765625, -2.258544921875, -2.18011474609375, -2.1016845703125, -2.02325439453125, -1.94482421875, -1.86639404296875, -1.7879638671875, -1.70953369140625, -1.631103515625, -1.55267333984375, -1.4742431640625, -1.39581298828125, -1.3173828125, -1.23895263671875, -1.1605224609375, -1.08209228515625, -1.003662109375, -0.92523193359375, -0.8468017578125, -0.76837158203125, -0.68994140625, -0.61151123046875, -0.5330810546875, -0.45465087890625, -0.376220703125, -0.29779052734375, -0.2193603515625, -0.14093017578125, -0.0625, 0.01593017578125, 0.0943603515625, 0.17279052734375, 0.251220703125, 0.32965087890625, 0.4080810546875, 0.48651123046875, 0.56494140625, 0.64337158203125, 0.7218017578125, 0.80023193359375, 0.878662109375, 0.95709228515625, 1.0355224609375, 1.11395263671875, 1.1923828125, 1.27081298828125, 1.3492431640625, 1.42767333984375, 1.506103515625, 1.58453369140625, 1.6629638671875, 1.74139404296875, 1.81982421875, 1.89825439453125, 1.9766845703125, 2.05511474609375, 2.133544921875, 2.21197509765625, 2.2904052734375, 2.36883544921875, 2.447265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 8.0, 8.0, 7.0, 11.0, 13.0, 16.0, 33.0, 52.0, 67.0, 114.0, 170.0, 251.0, 474.0, 772.0, 1543.0, 3033.0, 6460.0, 18591.0, 86268.0, 694176.0, 188944.0, 29762.0, 9516.0, 3901.0, 1900.0, 970.0, 557.0, 340.0, 206.0, 124.0, 87.0, 53.0, 42.0, 24.0, 18.0, 14.0, 10.0, 11.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7421875, -0.72015380859375, -0.6981201171875, -0.67608642578125, -0.654052734375, -0.63201904296875, -0.6099853515625, -0.58795166015625, -0.56591796875, -0.54388427734375, -0.5218505859375, -0.49981689453125, -0.477783203125, -0.45574951171875, -0.4337158203125, -0.41168212890625, -0.3896484375, -0.36761474609375, -0.3455810546875, -0.32354736328125, -0.301513671875, -0.27947998046875, -0.2574462890625, -0.23541259765625, -0.21337890625, -0.19134521484375, -0.1693115234375, -0.14727783203125, -0.125244140625, -0.10321044921875, -0.0811767578125, -0.05914306640625, -0.037109375, -0.01507568359375, 0.0069580078125, 0.02899169921875, 0.051025390625, 0.07305908203125, 0.0950927734375, 0.11712646484375, 0.13916015625, 0.16119384765625, 0.1832275390625, 0.20526123046875, 0.227294921875, 0.24932861328125, 0.2713623046875, 0.29339599609375, 0.3154296875, 0.33746337890625, 0.3594970703125, 0.38153076171875, 0.403564453125, 0.42559814453125, 0.4476318359375, 0.46966552734375, 0.49169921875, 0.51373291015625, 0.5357666015625, 0.55780029296875, 0.579833984375, 0.60186767578125, 0.6239013671875, 0.64593505859375, 0.66796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 21.0, 42.0, 164.0, 401.0, 203.0, 64.0, 25.0, 16.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004868507385253906, -0.00046428292989730835, -0.0004417151212692261, -0.0004191473126411438, -0.0003965795040130615, -0.00037401169538497925, -0.00035144388675689697, -0.0003288760781288147, -0.0003063082695007324, -0.00028374046087265015, -0.00026117265224456787, -0.0002386048436164856, -0.00021603703498840332, -0.00019346922636032104, -0.00017090141773223877, -0.0001483336091041565, -0.00012576580047607422, -0.00010319799184799194, -8.063018321990967e-05, -5.806237459182739e-05, -3.549456596374512e-05, -1.2926757335662842e-05, 9.641051292419434e-06, 3.220885992050171e-05, 5.4776668548583984e-05, 7.734447717666626e-05, 9.991228580474854e-05, 0.0001224800944328308, 0.00014504790306091309, 0.00016761571168899536, 0.00019018352031707764, 0.0002127513289451599, 0.0002353191375732422, 0.00025788694620132446, 0.00028045475482940674, 0.000303022563457489, 0.0003255903720855713, 0.00034815818071365356, 0.00037072598934173584, 0.0003932937979698181, 0.0004158616065979004, 0.00043842941522598267, 0.00046099722385406494, 0.0004835650324821472, 0.0005061328411102295, 0.0005287006497383118, 0.000551268458366394, 0.0005738362669944763, 0.0005964040756225586, 0.0006189718842506409, 0.0006415396928787231, 0.0006641075015068054, 0.0006866753101348877, 0.00070924311876297, 0.0007318109273910522, 0.0007543787360191345, 0.0007769465446472168, 0.0007995143532752991, 0.0008220821619033813, 0.0008446499705314636, 0.0008672177791595459, 0.0008897855877876282, 0.0009123533964157104, 0.0009349212050437927, 0.000957489013671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 8.0, 10.0, 26.0, 27.0, 65.0, 105.0, 247.0, 504.0, 1648.0, 8827.0, 237929.0, 779079.0, 16374.0, 2425.0, 699.0, 284.0, 121.0, 74.0, 42.0, 20.0, 8.0, 13.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.7332763671875, -1.685302734375, -1.6373291015625, -1.58935546875, -1.5413818359375, -1.493408203125, -1.4454345703125, -1.3974609375, -1.3494873046875, -1.301513671875, -1.2535400390625, -1.20556640625, -1.1575927734375, -1.109619140625, -1.0616455078125, -1.013671875, -0.9656982421875, -0.917724609375, -0.8697509765625, -0.82177734375, -0.7738037109375, -0.725830078125, -0.6778564453125, -0.6298828125, -0.5819091796875, -0.533935546875, -0.4859619140625, -0.43798828125, -0.3900146484375, -0.342041015625, -0.2940673828125, -0.24609375, -0.1981201171875, -0.150146484375, -0.1021728515625, -0.05419921875, -0.0062255859375, 0.041748046875, 0.0897216796875, 0.1376953125, 0.1856689453125, 0.233642578125, 0.2816162109375, 0.32958984375, 0.3775634765625, 0.425537109375, 0.4735107421875, 0.521484375, 0.5694580078125, 0.617431640625, 0.6654052734375, 0.71337890625, 0.7613525390625, 0.809326171875, 0.8572998046875, 0.9052734375, 0.9532470703125, 1.001220703125, 1.0491943359375, 1.09716796875, 1.1451416015625, 1.193115234375, 1.2410888671875, 1.2890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 5.0, 9.0, 3.0, 6.0, 7.0, 11.0, 13.0, 21.0, 20.0, 22.0, 31.0, 36.0, 47.0, 62.0, 44.0, 60.0, 63.0, 71.0, 75.0, 60.0, 52.0, 45.0, 34.0, 28.0, 21.0, 37.0, 17.0, 11.0, 13.0, 13.0, 11.0, 8.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.494384765625, -0.47887420654296875, -0.4633636474609375, -0.44785308837890625, -0.432342529296875, -0.41683197021484375, -0.4013214111328125, -0.38581085205078125, -0.37030029296875, -0.35478973388671875, -0.3392791748046875, -0.32376861572265625, -0.308258056640625, -0.29274749755859375, -0.2772369384765625, -0.26172637939453125, -0.2462158203125, -0.23070526123046875, -0.2151947021484375, -0.19968414306640625, -0.184173583984375, -0.16866302490234375, -0.1531524658203125, -0.13764190673828125, -0.12213134765625, -0.10662078857421875, -0.0911102294921875, -0.07559967041015625, -0.060089111328125, -0.04457855224609375, -0.0290679931640625, -0.01355743408203125, 0.001953125, 0.01746368408203125, 0.0329742431640625, 0.04848480224609375, 0.063995361328125, 0.07950592041015625, 0.0950164794921875, 0.11052703857421875, 0.12603759765625, 0.14154815673828125, 0.1570587158203125, 0.17256927490234375, 0.188079833984375, 0.20359039306640625, 0.2191009521484375, 0.23461151123046875, 0.2501220703125, 0.26563262939453125, 0.2811431884765625, 0.29665374755859375, 0.312164306640625, 0.32767486572265625, 0.3431854248046875, 0.35869598388671875, 0.37420654296875, 0.38971710205078125, 0.4052276611328125, 0.42073822021484375, 0.436248779296875, 0.45175933837890625, 0.4672698974609375, 0.48278045654296875, 0.498291015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 8.0, 20.0, 51.0, 155.0, 334.0, 275.0, 102.0, 32.0, 8.0, 12.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.361270904541016, -33.52109146118164, -32.680908203125, -31.840726852416992, -31.000545501708984, -30.160364151000977, -29.32018280029297, -28.480003356933594, -27.639820098876953, -26.799638748168945, -25.959457397460938, -25.11927604675293, -24.279094696044922, -23.438913345336914, -22.598731994628906, -21.75855255126953, -20.918371200561523, -20.078189849853516, -19.238008499145508, -18.3978271484375, -17.557645797729492, -16.717464447021484, -15.877284049987793, -15.037102699279785, -14.196921348571777, -13.35673999786377, -12.516558647155762, -11.67637825012207, -10.836196899414062, -9.996015548706055, -9.155834197998047, -8.315652847290039, -7.475473403930664, -6.635292053222656, -5.795110702514648, -4.954929828643799, -4.114748477935791, -3.274567127227783, -2.4343862533569336, -1.5942049026489258, -0.754023551940918, 0.08615767955780029, 0.9263389110565186, 1.7665200233459473, 2.606701374053955, 3.446882724761963, 4.2870635986328125, 5.12724494934082, 5.967426300048828, 6.807607650756836, 7.647789001464844, 8.487970352172852, 9.32815170288086, 10.168333053588867, 11.008513450622559, 11.848694801330566, 12.688876152038574, 13.529057502746582, 14.36923885345459, 15.209419250488281, 16.04960060119629, 16.889781951904297, 17.729963302612305, 18.570144653320312, 19.41032600402832]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 8.0, 9.0, 16.0, 16.0, 12.0, 20.0, 14.0, 34.0, 34.0, 25.0, 31.0, 32.0, 34.0, 40.0, 47.0, 72.0, 82.0, 57.0, 49.0, 58.0, 26.0, 32.0, 28.0, 28.0, 25.0, 18.0, 27.0, 19.0, 21.0, 13.0, 10.0, 15.0, 8.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.247876167297363, -7.950588703155518, -7.65330171585083, -7.356014251708984, -7.058727264404297, -6.761439800262451, -6.4641523361206055, -6.166865348815918, -5.869577884674072, -5.572290420532227, -5.275003433227539, -4.977715969085693, -4.680428504943848, -4.38314151763916, -4.0858540534973145, -3.788566827774048, -3.4912796020507812, -3.1939923763275146, -2.896705150604248, -2.5994176864624023, -2.3021304607391357, -2.004843235015869, -1.707555890083313, -1.4102685451507568, -1.1129813194274902, -0.8156940340995789, -0.5184067487716675, -0.2211194634437561, 0.07616782188415527, 0.3734550476074219, 0.670742392539978, 0.9680297374725342, 1.2653179168701172, 1.5626051425933838, 1.85989248752594, 2.157179832458496, 2.4544670581817627, 2.7517542839050293, 3.049041748046875, 3.3463289737701416, 3.643616199493408, 3.940903425216675, 4.238190650939941, 4.535478115081787, 4.832765579223633, 5.13005256652832, 5.427340030670166, 5.724627494812012, 6.021914482116699, 6.319201946258545, 6.616488933563232, 6.913776397705078, 7.211063385009766, 7.508350849151611, 7.805638313293457, 8.102925300598145, 8.400213241577148, 8.697500228881836, 8.99478816986084, 9.292075157165527, 9.589362144470215, 9.886650085449219, 10.183937072753906, 10.481224060058594, 10.778511047363281]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 14.0, 12.0, 16.0, 24.0, 27.0, 46.0, 48.0, 100.0, 146.0, 217.0, 409.0, 763.0, 1796.0, 5694.0, 27704.0, 366074.0, 2889491.0, 834415.0, 54204.0, 8441.0, 2437.0, 992.0, 457.0, 256.0, 164.0, 105.0, 75.0, 45.0, 33.0, 24.0, 18.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84375, -0.813232421875, -0.78271484375, -0.752197265625, -0.7216796875, -0.691162109375, -0.66064453125, -0.630126953125, -0.599609375, -0.569091796875, -0.53857421875, -0.508056640625, -0.4775390625, -0.447021484375, -0.41650390625, -0.385986328125, -0.35546875, -0.324951171875, -0.29443359375, -0.263916015625, -0.2333984375, -0.202880859375, -0.17236328125, -0.141845703125, -0.111328125, -0.080810546875, -0.05029296875, -0.019775390625, 0.0107421875, 0.041259765625, 0.07177734375, 0.102294921875, 0.1328125, 0.163330078125, 0.19384765625, 0.224365234375, 0.2548828125, 0.285400390625, 0.31591796875, 0.346435546875, 0.376953125, 0.407470703125, 0.43798828125, 0.468505859375, 0.4990234375, 0.529541015625, 0.56005859375, 0.590576171875, 0.62109375, 0.651611328125, 0.68212890625, 0.712646484375, 0.7431640625, 0.773681640625, 0.80419921875, 0.834716796875, 0.865234375, 0.895751953125, 0.92626953125, 0.956787109375, 0.9873046875, 1.017822265625, 1.04833984375, 1.078857421875, 1.109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 7.0, 12.0, 9.0, 15.0, 18.0, 17.0, 11.0, 24.0, 29.0, 27.0, 26.0, 29.0, 46.0, 34.0, 47.0, 37.0, 49.0, 48.0, 46.0, 43.0, 51.0, 30.0, 38.0, 35.0, 38.0, 24.0, 27.0, 22.0, 23.0, 32.0, 20.0, 18.0, 12.0, 8.0, 6.0, 3.0, 9.0, 6.0, 10.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58984375, -0.5720291137695312, -0.5542144775390625, -0.5363998413085938, -0.518585205078125, -0.5007705688476562, -0.4829559326171875, -0.46514129638671875, -0.44732666015625, -0.42951202392578125, -0.4116973876953125, -0.39388275146484375, -0.376068115234375, -0.35825347900390625, -0.3404388427734375, -0.32262420654296875, -0.3048095703125, -0.28699493408203125, -0.2691802978515625, -0.25136566162109375, -0.233551025390625, -0.21573638916015625, -0.1979217529296875, -0.18010711669921875, -0.16229248046875, -0.14447784423828125, -0.1266632080078125, -0.10884857177734375, -0.091033935546875, -0.07321929931640625, -0.0554046630859375, -0.03759002685546875, -0.019775390625, -0.00196075439453125, 0.0158538818359375, 0.03366851806640625, 0.051483154296875, 0.06929779052734375, 0.0871124267578125, 0.10492706298828125, 0.12274169921875, 0.14055633544921875, 0.1583709716796875, 0.17618560791015625, 0.194000244140625, 0.21181488037109375, 0.2296295166015625, 0.24744415283203125, 0.2652587890625, 0.28307342529296875, 0.3008880615234375, 0.31870269775390625, 0.336517333984375, 0.35433197021484375, 0.3721466064453125, 0.38996124267578125, 0.40777587890625, 0.42559051513671875, 0.4434051513671875, 0.46121978759765625, 0.479034423828125, 0.49684906005859375, 0.5146636962890625, 0.5324783325195312, 0.55029296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 17.0, 26.0, 52.0, 85.0, 145.0, 341.0, 941.0, 3757.0, 330410.0, 3849428.0, 7079.0, 1142.0, 441.0, 209.0, 91.0, 44.0, 28.0, 14.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.243072509765625, -4.11505126953125, -3.987030029296875, -3.8590087890625, -3.730987548828125, -3.60296630859375, -3.474945068359375, -3.346923828125, -3.218902587890625, -3.09088134765625, -2.962860107421875, -2.8348388671875, -2.706817626953125, -2.57879638671875, -2.450775146484375, -2.32275390625, -2.194732666015625, -2.06671142578125, -1.938690185546875, -1.8106689453125, -1.682647705078125, -1.55462646484375, -1.426605224609375, -1.298583984375, -1.170562744140625, -1.04254150390625, -0.914520263671875, -0.7864990234375, -0.658477783203125, -0.53045654296875, -0.402435302734375, -0.2744140625, -0.146392822265625, -0.01837158203125, 0.109649658203125, 0.2376708984375, 0.365692138671875, 0.49371337890625, 0.621734619140625, 0.749755859375, 0.877777099609375, 1.00579833984375, 1.133819580078125, 1.2618408203125, 1.389862060546875, 1.51788330078125, 1.645904541015625, 1.77392578125, 1.901947021484375, 2.02996826171875, 2.157989501953125, 2.2860107421875, 2.414031982421875, 2.54205322265625, 2.670074462890625, 2.798095703125, 2.926116943359375, 3.05413818359375, 3.182159423828125, 3.3101806640625, 3.438201904296875, 3.56622314453125, 3.694244384765625, 3.822265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 20.0, 62.0, 179.0, 843.0, 2180.0, 595.0, 120.0, 42.0, 19.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.204864501953125, -3.08355712890625, -2.962249755859375, -2.8409423828125, -2.719635009765625, -2.59832763671875, -2.477020263671875, -2.355712890625, -2.234405517578125, -2.11309814453125, -1.991790771484375, -1.8704833984375, -1.749176025390625, -1.62786865234375, -1.506561279296875, -1.38525390625, -1.263946533203125, -1.14263916015625, -1.021331787109375, -0.9000244140625, -0.778717041015625, -0.65740966796875, -0.536102294921875, -0.414794921875, -0.293487548828125, -0.17218017578125, -0.050872802734375, 0.0704345703125, 0.191741943359375, 0.31304931640625, 0.434356689453125, 0.5556640625, 0.676971435546875, 0.79827880859375, 0.919586181640625, 1.0408935546875, 1.162200927734375, 1.28350830078125, 1.404815673828125, 1.526123046875, 1.647430419921875, 1.76873779296875, 1.890045166015625, 2.0113525390625, 2.132659912109375, 2.25396728515625, 2.375274658203125, 2.49658203125, 2.617889404296875, 2.73919677734375, 2.860504150390625, 2.9818115234375, 3.103118896484375, 3.22442626953125, 3.345733642578125, 3.467041015625, 3.588348388671875, 3.70965576171875, 3.830963134765625, 3.9522705078125, 4.073577880859375, 4.19488525390625, 4.316192626953125, 4.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 19.0, 76.0, 518.0, 316.0, 50.0, 13.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8726806640625, -36.564170837402344, -35.25566482543945, -33.9471549987793, -32.63864517211914, -31.33013916015625, -30.021629333496094, -28.71312141418457, -27.404613494873047, -26.096105575561523, -24.787595748901367, -23.479087829589844, -22.17057991027832, -20.862071990966797, -19.55356216430664, -18.245054244995117, -16.93654441833496, -15.628035545349121, -14.319527626037598, -13.011018753051758, -11.702510833740234, -10.394001960754395, -9.085493087768555, -7.776985168457031, -6.468476295471191, -5.15996789932251, -3.851459264755249, -2.5429506301879883, -1.2344422340393066, 0.074066162109375, 1.3825750350952148, 2.6910829544067383, 3.999591827392578, 5.30810022354126, 6.616608619689941, 7.925117492675781, 9.233625411987305, 10.542134284973145, 11.850643157958984, 13.159151077270508, 14.467659950256348, 15.776168823242188, 17.08467674255371, 18.393184661865234, 19.70169448852539, 21.010202407836914, 22.318710327148438, 23.627220153808594, 24.935728073120117, 26.24423599243164, 27.552745819091797, 28.86125373840332, 30.169761657714844, 31.478271484375, 32.786781311035156, 34.09528732299805, 35.4037971496582, 36.71230697631836, 38.02081298828125, 39.329322814941406, 40.63783264160156, 41.94633865356445, 43.25484848022461, 44.5633544921875, 45.871864318847656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 8.0, 5.0, 10.0, 15.0, 19.0, 15.0, 30.0, 53.0, 58.0, 54.0, 69.0, 71.0, 66.0, 88.0, 82.0, 72.0, 72.0, 40.0, 53.0, 37.0, 24.0, 25.0, 13.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.154629707336426, -11.825424194335938, -11.496219635009766, -11.167014122009277, -10.837809562683105, -10.508604049682617, -10.179399490356445, -9.850193977355957, -9.520989418029785, -9.191783905029297, -8.862579345703125, -8.533373832702637, -8.204169273376465, -7.874964237213135, -7.545759201049805, -7.216553688049316, -6.887348651885986, -6.558143615722656, -6.228938579559326, -5.899733543395996, -5.570528507232666, -5.241323471069336, -4.912117958068848, -4.582913398742676, -4.2537078857421875, -3.9245028495788574, -3.5952978134155273, -3.2660927772521973, -2.936887741088867, -2.607682704925537, -2.278477430343628, -1.9492723941802979, -1.6200675964355469, -1.2908625602722168, -0.9616574645042419, -0.6324523687362671, -0.303247332572937, 0.025957703590393066, 0.3551628589630127, 0.6843678951263428, 1.0135729312896729, 1.342777967453003, 1.671983003616333, 2.001188278198242, 2.3303933143615723, 2.6595983505249023, 2.9888033866882324, 3.3180084228515625, 3.6472134590148926, 3.9764184951782227, 4.305623531341553, 4.634828567504883, 4.964033603668213, 5.293238639831543, 5.622444152832031, 5.951648712158203, 6.280854225158691, 6.6100592613220215, 6.939264297485352, 7.268469333648682, 7.597674369812012, 7.926879405975342, 8.256084442138672, 8.58528995513916, 8.914494514465332]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 14.0, 17.0, 33.0, 47.0, 69.0, 99.0, 133.0, 204.0, 324.0, 540.0, 807.0, 1376.0, 2203.0, 3802.0, 6388.0, 11755.0, 21255.0, 39957.0, 73637.0, 132276.0, 205250.0, 215048.0, 148445.0, 83963.0, 44925.0, 24604.0, 13351.0, 7380.0, 4181.0, 2481.0, 1449.0, 875.0, 561.0, 374.0, 273.0, 148.0, 96.0, 69.0, 45.0, 33.0, 14.0, 9.0, 12.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5776214599609375, -0.559051513671875, -0.5404815673828125, -0.52191162109375, -0.5033416748046875, -0.484771728515625, -0.4662017822265625, -0.4476318359375, -0.4290618896484375, -0.410491943359375, -0.3919219970703125, -0.37335205078125, -0.3547821044921875, -0.336212158203125, -0.3176422119140625, -0.299072265625, -0.2805023193359375, -0.261932373046875, -0.2433624267578125, -0.22479248046875, -0.2062225341796875, -0.187652587890625, -0.1690826416015625, -0.1505126953125, -0.1319427490234375, -0.113372802734375, -0.0948028564453125, -0.07623291015625, -0.0576629638671875, -0.039093017578125, -0.0205230712890625, -0.001953125, 0.0166168212890625, 0.035186767578125, 0.0537567138671875, 0.07232666015625, 0.0908966064453125, 0.109466552734375, 0.1280364990234375, 0.1466064453125, 0.1651763916015625, 0.183746337890625, 0.2023162841796875, 0.22088623046875, 0.2394561767578125, 0.258026123046875, 0.2765960693359375, 0.295166015625, 0.3137359619140625, 0.332305908203125, 0.3508758544921875, 0.36944580078125, 0.3880157470703125, 0.406585693359375, 0.4251556396484375, 0.4437255859375, 0.4622955322265625, 0.480865478515625, 0.4994354248046875, 0.51800537109375, 0.5365753173828125, 0.555145263671875, 0.5737152099609375, 0.59228515625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 10.0, 11.0, 14.0, 14.0, 23.0, 26.0, 25.0, 33.0, 36.0, 39.0, 35.0, 50.0, 49.0, 49.0, 69.0, 33.0, 47.0, 51.0, 38.0, 42.0, 37.0, 37.0, 27.0, 30.0, 35.0, 25.0, 21.0, 14.0, 16.0, 15.0, 9.0, 4.0, 8.0, 4.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5880661010742188, -0.5667572021484375, -0.5454483032226562, -0.524139404296875, -0.5028305053710938, -0.4815216064453125, -0.46021270751953125, -0.43890380859375, -0.41759490966796875, -0.3962860107421875, -0.37497711181640625, -0.353668212890625, -0.33235931396484375, -0.3110504150390625, -0.28974151611328125, -0.2684326171875, -0.24712371826171875, -0.2258148193359375, -0.20450592041015625, -0.183197021484375, -0.16188812255859375, -0.1405792236328125, -0.11927032470703125, -0.09796142578125, -0.07665252685546875, -0.0553436279296875, -0.03403472900390625, -0.012725830078125, 0.00858306884765625, 0.0298919677734375, 0.05120086669921875, 0.072509765625, 0.09381866455078125, 0.1151275634765625, 0.13643646240234375, 0.157745361328125, 0.17905426025390625, 0.2003631591796875, 0.22167205810546875, 0.24298095703125, 0.26428985595703125, 0.2855987548828125, 0.30690765380859375, 0.328216552734375, 0.34952545166015625, 0.3708343505859375, 0.39214324951171875, 0.4134521484375, 0.43476104736328125, 0.4560699462890625, 0.47737884521484375, 0.498687744140625, 0.5199966430664062, 0.5413055419921875, 0.5626144409179688, 0.58392333984375, 0.6052322387695312, 0.6265411376953125, 0.6478500366210938, 0.669158935546875, 0.6904678344726562, 0.7117767333984375, 0.7330856323242188, 0.75439453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 1.0, 13.0, 4.0, 16.0, 15.0, 21.0, 25.0, 19.0, 51.0, 44.0, 76.0, 100.0, 151.0, 210.0, 346.0, 595.0, 1274.0, 3341.0, 10992.0, 44089.0, 203993.0, 601373.0, 138409.0, 30312.0, 7985.0, 2550.0, 1047.0, 490.0, 305.0, 204.0, 123.0, 121.0, 58.0, 40.0, 40.0, 25.0, 28.0, 23.0, 17.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.61328125, -1.56634521484375, -1.5194091796875, -1.47247314453125, -1.425537109375, -1.37860107421875, -1.3316650390625, -1.28472900390625, -1.23779296875, -1.19085693359375, -1.1439208984375, -1.09698486328125, -1.050048828125, -1.00311279296875, -0.9561767578125, -0.90924072265625, -0.8623046875, -0.81536865234375, -0.7684326171875, -0.72149658203125, -0.674560546875, -0.62762451171875, -0.5806884765625, -0.53375244140625, -0.48681640625, -0.43988037109375, -0.3929443359375, -0.34600830078125, -0.299072265625, -0.25213623046875, -0.2052001953125, -0.15826416015625, -0.111328125, -0.06439208984375, -0.0174560546875, 0.02947998046875, 0.076416015625, 0.12335205078125, 0.1702880859375, 0.21722412109375, 0.26416015625, 0.31109619140625, 0.3580322265625, 0.40496826171875, 0.451904296875, 0.49884033203125, 0.5457763671875, 0.59271240234375, 0.6396484375, 0.68658447265625, 0.7335205078125, 0.78045654296875, 0.827392578125, 0.87432861328125, 0.9212646484375, 0.96820068359375, 1.01513671875, 1.06207275390625, 1.1090087890625, 1.15594482421875, 1.202880859375, 1.24981689453125, 1.2967529296875, 1.34368896484375, 1.390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 7.0, 6.0, 4.0, 7.0, 9.0, 17.0, 15.0, 17.0, 22.0, 19.0, 31.0, 27.0, 35.0, 48.0, 44.0, 38.0, 39.0, 44.0, 44.0, 62.0, 50.0, 54.0, 44.0, 49.0, 42.0, 52.0, 31.0, 34.0, 19.0, 25.0, 15.0, 15.0, 12.0, 4.0, 7.0, 5.0, 3.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.338134765625, -2.26025390625, -2.182373046875, -2.1044921875, -2.026611328125, -1.94873046875, -1.870849609375, -1.79296875, -1.715087890625, -1.63720703125, -1.559326171875, -1.4814453125, -1.403564453125, -1.32568359375, -1.247802734375, -1.169921875, -1.092041015625, -1.01416015625, -0.936279296875, -0.8583984375, -0.780517578125, -0.70263671875, -0.624755859375, -0.546875, -0.468994140625, -0.39111328125, -0.313232421875, -0.2353515625, -0.157470703125, -0.07958984375, -0.001708984375, 0.076171875, 0.154052734375, 0.23193359375, 0.309814453125, 0.3876953125, 0.465576171875, 0.54345703125, 0.621337890625, 0.69921875, 0.777099609375, 0.85498046875, 0.932861328125, 1.0107421875, 1.088623046875, 1.16650390625, 1.244384765625, 1.322265625, 1.400146484375, 1.47802734375, 1.555908203125, 1.6337890625, 1.711669921875, 1.78955078125, 1.867431640625, 1.9453125, 2.023193359375, 2.10107421875, 2.178955078125, 2.2568359375, 2.334716796875, 2.41259765625, 2.490478515625, 2.568359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 9.0, 6.0, 13.0, 18.0, 39.0, 77.0, 103.0, 164.0, 349.0, 659.0, 1552.0, 3636.0, 11490.0, 40641.0, 177124.0, 623349.0, 140857.0, 32800.0, 9559.0, 3360.0, 1372.0, 621.0, 343.0, 171.0, 106.0, 46.0, 32.0, 24.0, 8.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52099609375, -0.5054092407226562, -0.4898223876953125, -0.47423553466796875, -0.458648681640625, -0.44306182861328125, -0.4274749755859375, -0.41188812255859375, -0.39630126953125, -0.38071441650390625, -0.3651275634765625, -0.34954071044921875, -0.333953857421875, -0.31836700439453125, -0.3027801513671875, -0.28719329833984375, -0.2716064453125, -0.25601959228515625, -0.2404327392578125, -0.22484588623046875, -0.209259033203125, -0.19367218017578125, -0.1780853271484375, -0.16249847412109375, -0.14691162109375, -0.13132476806640625, -0.1157379150390625, -0.10015106201171875, -0.084564208984375, -0.06897735595703125, -0.0533905029296875, -0.03780364990234375, -0.022216796875, -0.00662994384765625, 0.0089569091796875, 0.02454376220703125, 0.040130615234375, 0.05571746826171875, 0.0713043212890625, 0.08689117431640625, 0.10247802734375, 0.11806488037109375, 0.1336517333984375, 0.14923858642578125, 0.164825439453125, 0.18041229248046875, 0.1959991455078125, 0.21158599853515625, 0.2271728515625, 0.24275970458984375, 0.2583465576171875, 0.27393341064453125, 0.289520263671875, 0.30510711669921875, 0.3206939697265625, 0.33628082275390625, 0.35186767578125, 0.36745452880859375, 0.3830413818359375, 0.39862823486328125, 0.414215087890625, 0.42980194091796875, 0.4453887939453125, 0.46097564697265625, 0.4765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 13.0, 20.0, 35.0, 34.0, 55.0, 77.0, 120.0, 145.0, 131.0, 109.0, 89.0, 38.0, 31.0, 18.0, 19.0, 7.0, 9.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015581771731376648, -0.00014831870794296265, -0.0001408196985721588, -0.00013332068920135498, -0.00012582167983055115, -0.00011832267045974731, -0.00011082366108894348, -0.00010332465171813965, -9.582564234733582e-05, -8.832663297653198e-05, -8.082762360572815e-05, -7.332861423492432e-05, -6.582960486412048e-05, -5.833059549331665e-05, -5.083158612251282e-05, -4.3332576751708984e-05, -3.583356738090515e-05, -2.833455801010132e-05, -2.0835548639297485e-05, -1.3336539268493652e-05, -5.837529897689819e-06, 1.6614794731140137e-06, 9.160488843917847e-06, 1.665949821472168e-05, 2.4158507585525513e-05, 3.1657516956329346e-05, 3.915652632713318e-05, 4.665553569793701e-05, 5.4154545068740845e-05, 6.165355443954468e-05, 6.915256381034851e-05, 7.665157318115234e-05, 8.415058255195618e-05, 9.164959192276001e-05, 9.914860129356384e-05, 0.00010664761066436768, 0.00011414662003517151, 0.00012164562940597534, 0.00012914463877677917, 0.000136643648147583, 0.00014414265751838684, 0.00015164166688919067, 0.0001591406762599945, 0.00016663968563079834, 0.00017413869500160217, 0.000181637704372406, 0.00018913671374320984, 0.00019663572311401367, 0.0002041347324848175, 0.00021163374185562134, 0.00021913275122642517, 0.000226631760597229, 0.00023413076996803284, 0.00024162977933883667, 0.0002491287887096405, 0.00025662779808044434, 0.00026412680745124817, 0.000271625816822052, 0.00027912482619285583, 0.00028662383556365967, 0.0002941228449344635, 0.00030162185430526733, 0.00030912086367607117, 0.000316619873046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 11.0, 14.0, 19.0, 33.0, 46.0, 78.0, 111.0, 223.0, 502.0, 1108.0, 3182.0, 11661.0, 58034.0, 343031.0, 543389.0, 68014.0, 13261.0, 3539.0, 1196.0, 495.0, 238.0, 132.0, 78.0, 52.0, 28.0, 21.0, 22.0, 13.0, 9.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53466796875, -0.5162582397460938, -0.4978485107421875, -0.47943878173828125, -0.461029052734375, -0.44261932373046875, -0.4242095947265625, -0.40579986572265625, -0.38739013671875, -0.36898040771484375, -0.3505706787109375, -0.33216094970703125, -0.313751220703125, -0.29534149169921875, -0.2769317626953125, -0.25852203369140625, -0.2401123046875, -0.22170257568359375, -0.2032928466796875, -0.18488311767578125, -0.166473388671875, -0.14806365966796875, -0.1296539306640625, -0.11124420166015625, -0.09283447265625, -0.07442474365234375, -0.0560150146484375, -0.03760528564453125, -0.019195556640625, -0.00078582763671875, 0.0176239013671875, 0.03603363037109375, 0.054443359375, 0.07285308837890625, 0.0912628173828125, 0.10967254638671875, 0.128082275390625, 0.14649200439453125, 0.1649017333984375, 0.18331146240234375, 0.20172119140625, 0.22013092041015625, 0.2385406494140625, 0.25695037841796875, 0.275360107421875, 0.29376983642578125, 0.3121795654296875, 0.33058929443359375, 0.3489990234375, 0.36740875244140625, 0.3858184814453125, 0.40422821044921875, 0.422637939453125, 0.44104766845703125, 0.4594573974609375, 0.47786712646484375, 0.49627685546875, 0.5146865844726562, 0.5330963134765625, 0.5515060424804688, 0.569915771484375, 0.5883255004882812, 0.6067352294921875, 0.6251449584960938, 0.6435546875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 11.0, 11.0, 15.0, 29.0, 27.0, 29.0, 42.0, 39.0, 73.0, 83.0, 91.0, 91.0, 80.0, 77.0, 53.0, 66.0, 41.0, 29.0, 27.0, 19.0, 18.0, 12.0, 9.0, 4.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6296157836914062, -0.6107940673828125, -0.5919723510742188, -0.573150634765625, -0.5543289184570312, -0.5355072021484375, -0.5166854858398438, -0.49786376953125, -0.47904205322265625, -0.4602203369140625, -0.44139862060546875, -0.422576904296875, -0.40375518798828125, -0.3849334716796875, -0.36611175537109375, -0.3472900390625, -0.32846832275390625, -0.3096466064453125, -0.29082489013671875, -0.272003173828125, -0.25318145751953125, -0.2343597412109375, -0.21553802490234375, -0.19671630859375, -0.17789459228515625, -0.1590728759765625, -0.14025115966796875, -0.121429443359375, -0.10260772705078125, -0.0837860107421875, -0.06496429443359375, -0.046142578125, -0.02732086181640625, -0.0084991455078125, 0.01032257080078125, 0.029144287109375, 0.04796600341796875, 0.0667877197265625, 0.08560943603515625, 0.10443115234375, 0.12325286865234375, 0.1420745849609375, 0.16089630126953125, 0.179718017578125, 0.19853973388671875, 0.2173614501953125, 0.23618316650390625, 0.2550048828125, 0.27382659912109375, 0.2926483154296875, 0.31147003173828125, 0.330291748046875, 0.34911346435546875, 0.3679351806640625, 0.38675689697265625, 0.40557861328125, 0.42440032958984375, 0.4432220458984375, 0.46204376220703125, 0.480865478515625, 0.49968719482421875, 0.5185089111328125, 0.5373306274414062, 0.55615234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 19.0, 33.0, 74.0, 159.0, 325.0, 200.0, 103.0, 39.0, 21.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.74115753173828, -17.211669921875, -16.68218421936035, -16.15269660949707, -15.623208999633789, -15.093722343444824, -14.56423568725586, -14.034748077392578, -13.505261421203613, -12.975774765014648, -12.446287155151367, -11.916800498962402, -11.387313842773438, -10.857826232910156, -10.328339576721191, -9.798852920532227, -9.269365310668945, -8.73987865447998, -8.2103910446167, -7.680904388427734, -7.151417255401611, -6.621930122375488, -6.092443466186523, -5.5629563331604, -5.033469200134277, -4.503982067108154, -3.9744951725006104, -3.4450082778930664, -2.9155211448669434, -2.3860340118408203, -1.8565471172332764, -1.3270602226257324, -0.7975730895996094, -0.2680860757827759, 0.2614009380340576, 0.7908879518508911, 1.3203749656677246, 1.8498620986938477, 2.3793489933013916, 2.9088358879089355, 3.4383230209350586, 3.9678101539611816, 4.497297286987305, 5.0267839431762695, 5.556271076202393, 6.085758209228516, 6.6152448654174805, 7.1447319984436035, 7.674219131469727, 8.203705787658691, 8.733193397521973, 9.262680053710938, 9.792167663574219, 10.321654319763184, 10.851140975952148, 11.38062858581543, 11.910115242004395, 12.43960189819336, 12.96908950805664, 13.498576164245605, 14.02806282043457, 14.557550430297852, 15.087037086486816, 15.616523742675781, 16.146011352539062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 8.0, 17.0, 12.0, 13.0, 16.0, 19.0, 22.0, 28.0, 30.0, 29.0, 30.0, 29.0, 35.0, 50.0, 55.0, 88.0, 76.0, 61.0, 37.0, 31.0, 34.0, 22.0, 33.0, 30.0, 16.0, 18.0, 31.0, 19.0, 15.0, 10.0, 7.0, 8.0, 9.0, 4.0, 7.0, 8.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-8.921832084655762, -8.66435432434082, -8.406875610351562, -8.149396896362305, -7.891919136047363, -7.634440898895264, -7.376962661743164, -7.1194844245910645, -6.862006187438965, -6.604527950286865, -6.347049713134766, -6.089571475982666, -5.832093238830566, -5.574615001678467, -5.317136764526367, -5.059658527374268, -4.802180290222168, -4.544702053070068, -4.287223815917969, -4.029745578765869, -3.7722673416137695, -3.51478910446167, -3.2573108673095703, -2.9998326301574707, -2.742354393005371, -2.4848761558532715, -2.227397918701172, -1.9699196815490723, -1.7124414443969727, -1.454963207244873, -1.1974849700927734, -0.9400067329406738, -0.6825294494628906, -0.425051212310791, -0.1675729751586914, 0.0899052619934082, 0.3473834991455078, 0.6048617362976074, 0.862339973449707, 1.1198182106018066, 1.3772964477539062, 1.6347746849060059, 1.8922529220581055, 2.149731159210205, 2.4072093963623047, 2.6646876335144043, 2.922165870666504, 3.1796441078186035, 3.437122344970703, 3.6946005821228027, 3.9520788192749023, 4.209557056427002, 4.467035293579102, 4.724513530731201, 4.981991767883301, 5.2394700050354, 5.4969482421875, 5.7544264793396, 6.011904716491699, 6.269382953643799, 6.526861190795898, 6.784339427947998, 7.041817665100098, 7.299295902252197, 7.556774139404297]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 12.0, 12.0, 9.0, 18.0, 31.0, 51.0, 46.0, 80.0, 109.0, 163.0, 259.0, 390.0, 568.0, 889.0, 1470.0, 2514.0, 4951.0, 11363.0, 37048.0, 169603.0, 830838.0, 2041584.0, 870289.0, 163108.0, 35892.0, 11395.0, 4943.0, 2540.0, 1415.0, 875.0, 558.0, 388.0, 253.0, 177.0, 130.0, 101.0, 63.0, 45.0, 28.0, 19.0, 14.0, 13.0, 5.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5108871459960938, -0.4929656982421875, -0.47504425048828125, -0.457122802734375, -0.43920135498046875, -0.4212799072265625, -0.40335845947265625, -0.38543701171875, -0.36751556396484375, -0.3495941162109375, -0.33167266845703125, -0.313751220703125, -0.29582977294921875, -0.2779083251953125, -0.25998687744140625, -0.2420654296875, -0.22414398193359375, -0.2062225341796875, -0.18830108642578125, -0.170379638671875, -0.15245819091796875, -0.1345367431640625, -0.11661529541015625, -0.09869384765625, -0.08077239990234375, -0.0628509521484375, -0.04492950439453125, -0.027008056640625, -0.00908660888671875, 0.0088348388671875, 0.02675628662109375, 0.044677734375, 0.06259918212890625, 0.0805206298828125, 0.09844207763671875, 0.116363525390625, 0.13428497314453125, 0.1522064208984375, 0.17012786865234375, 0.18804931640625, 0.20597076416015625, 0.2238922119140625, 0.24181365966796875, 0.259735107421875, 0.27765655517578125, 0.2955780029296875, 0.31349945068359375, 0.3314208984375, 0.34934234619140625, 0.3672637939453125, 0.38518524169921875, 0.403106689453125, 0.42102813720703125, 0.4389495849609375, 0.45687103271484375, 0.47479248046875, 0.49271392822265625, 0.5106353759765625, 0.5285568237304688, 0.546478271484375, 0.5643997192382812, 0.5823211669921875, 0.6002426147460938, 0.6181640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 1.0, 4.0, 8.0, 10.0, 10.0, 7.0, 15.0, 29.0, 23.0, 30.0, 40.0, 31.0, 42.0, 35.0, 47.0, 45.0, 50.0, 58.0, 49.0, 42.0, 47.0, 44.0, 37.0, 42.0, 21.0, 35.0, 32.0, 25.0, 19.0, 20.0, 26.0, 24.0, 15.0, 4.0, 12.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61376953125, -0.5949630737304688, -0.5761566162109375, -0.5573501586914062, -0.538543701171875, -0.5197372436523438, -0.5009307861328125, -0.48212432861328125, -0.46331787109375, -0.44451141357421875, -0.4257049560546875, -0.40689849853515625, -0.388092041015625, -0.36928558349609375, -0.3504791259765625, -0.33167266845703125, -0.3128662109375, -0.29405975341796875, -0.2752532958984375, -0.25644683837890625, -0.237640380859375, -0.21883392333984375, -0.2000274658203125, -0.18122100830078125, -0.16241455078125, -0.14360809326171875, -0.1248016357421875, -0.10599517822265625, -0.087188720703125, -0.06838226318359375, -0.0495758056640625, -0.03076934814453125, -0.011962890625, 0.00684356689453125, 0.0256500244140625, 0.04445648193359375, 0.063262939453125, 0.08206939697265625, 0.1008758544921875, 0.11968231201171875, 0.13848876953125, 0.15729522705078125, 0.1761016845703125, 0.19490814208984375, 0.213714599609375, 0.23252105712890625, 0.2513275146484375, 0.27013397216796875, 0.2889404296875, 0.30774688720703125, 0.3265533447265625, 0.34535980224609375, 0.364166259765625, 0.38297271728515625, 0.4017791748046875, 0.42058563232421875, 0.43939208984375, 0.45819854736328125, 0.4770050048828125, 0.49581146240234375, 0.514617919921875, 0.5334243774414062, 0.5522308349609375, 0.5710372924804688, 0.58984375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 16.0, 25.0, 52.0, 162.0, 404.0, 2203.0, 317807.0, 3867955.0, 4624.0, 654.0, 209.0, 86.0, 41.0, 24.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.658935546875, -4.50927734375, -4.359619140625, -4.2099609375, -4.060302734375, -3.91064453125, -3.760986328125, -3.611328125, -3.461669921875, -3.31201171875, -3.162353515625, -3.0126953125, -2.863037109375, -2.71337890625, -2.563720703125, -2.4140625, -2.264404296875, -2.11474609375, -1.965087890625, -1.8154296875, -1.665771484375, -1.51611328125, -1.366455078125, -1.216796875, -1.067138671875, -0.91748046875, -0.767822265625, -0.6181640625, -0.468505859375, -0.31884765625, -0.169189453125, -0.01953125, 0.130126953125, 0.27978515625, 0.429443359375, 0.5791015625, 0.728759765625, 0.87841796875, 1.028076171875, 1.177734375, 1.327392578125, 1.47705078125, 1.626708984375, 1.7763671875, 1.926025390625, 2.07568359375, 2.225341796875, 2.375, 2.524658203125, 2.67431640625, 2.823974609375, 2.9736328125, 3.123291015625, 3.27294921875, 3.422607421875, 3.572265625, 3.721923828125, 3.87158203125, 4.021240234375, 4.1708984375, 4.320556640625, 4.47021484375, 4.619873046875, 4.76953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 10.0, 24.0, 14.0, 40.0, 84.0, 145.0, 339.0, 804.0, 1085.0, 787.0, 364.0, 182.0, 78.0, 44.0, 31.0, 15.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1865234375, -1.1287078857421875, -1.070892333984375, -1.0130767822265625, -0.95526123046875, -0.8974456787109375, -0.839630126953125, -0.7818145751953125, -0.7239990234375, -0.6661834716796875, -0.608367919921875, -0.5505523681640625, -0.49273681640625, -0.4349212646484375, -0.377105712890625, -0.3192901611328125, -0.261474609375, -0.2036590576171875, -0.145843505859375, -0.0880279541015625, -0.03021240234375, 0.0276031494140625, 0.085418701171875, 0.1432342529296875, 0.2010498046875, 0.2588653564453125, 0.316680908203125, 0.3744964599609375, 0.43231201171875, 0.4901275634765625, 0.547943115234375, 0.6057586669921875, 0.66357421875, 0.7213897705078125, 0.779205322265625, 0.8370208740234375, 0.89483642578125, 0.9526519775390625, 1.010467529296875, 1.0682830810546875, 1.1260986328125, 1.1839141845703125, 1.241729736328125, 1.2995452880859375, 1.35736083984375, 1.4151763916015625, 1.472991943359375, 1.5308074951171875, 1.588623046875, 1.6464385986328125, 1.704254150390625, 1.7620697021484375, 1.81988525390625, 1.8777008056640625, 1.935516357421875, 1.9933319091796875, 2.0511474609375, 2.1089630126953125, 2.166778564453125, 2.2245941162109375, 2.28240966796875, 2.3402252197265625, 2.398040771484375, 2.4558563232421875, 2.513671875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 13.0, 22.0, 55.0, 204.0, 299.0, 256.0, 99.0, 28.0, 16.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.188379287719727, -12.54666519165039, -11.904952049255371, -11.263237953186035, -10.6215238571167, -9.97981071472168, -9.338096618652344, -8.696382522583008, -8.054668426513672, -7.412954807281494, -6.771240711212158, -6.1295270919799805, -5.4878129959106445, -4.846099376678467, -4.204385757446289, -3.562671661376953, -2.9209585189819336, -2.2792446613311768, -1.6375309228897095, -0.9958171844482422, -0.35410332679748535, 0.2876105308532715, 0.9293241500854492, 1.5710382461547852, 2.212751865386963, 2.8544657230377197, 3.4961795806884766, 4.137893199920654, 4.779606819152832, 5.421320915222168, 6.063034534454346, 6.704748630523682, 7.346462249755859, 7.988175868988037, 8.629889488220215, 9.27160358428955, 9.913317680358887, 10.555030822753906, 11.196744918823242, 11.838459014892578, 12.480173110961914, 13.12188720703125, 13.76360034942627, 14.405314445495605, 15.047028541564941, 15.688741683959961, 16.330455780029297, 16.972169876098633, 17.61388397216797, 18.255598068237305, 18.89731216430664, 19.539024353027344, 20.18073844909668, 20.822452545166016, 21.46416664123535, 22.105880737304688, 22.74759292602539, 23.389307022094727, 24.031021118164062, 24.672733306884766, 25.3144474029541, 25.956161499023438, 26.597875595092773, 27.23958969116211, 27.881303787231445]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 12.0, 20.0, 21.0, 20.0, 22.0, 51.0, 38.0, 39.0, 51.0, 56.0, 56.0, 49.0, 50.0, 43.0, 66.0, 53.0, 41.0, 31.0, 55.0, 38.0, 38.0, 21.0, 20.0, 17.0, 12.0, 13.0, 9.0, 7.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.450509548187256, -7.235997200012207, -7.021484851837158, -6.806972503662109, -6.592460632324219, -6.377947807312012, -6.163435935974121, -5.948923587799072, -5.734411239624023, -5.519898891448975, -5.305386543273926, -5.090874195098877, -4.876361846923828, -4.6618499755859375, -4.447337627410889, -4.23282527923584, -4.018312931060791, -3.803800582885742, -3.5892882347106934, -3.3747761249542236, -3.160263776779175, -2.945751428604126, -2.7312393188476562, -2.5167269706726074, -2.3022146224975586, -2.0877022743225098, -1.8731900453567505, -1.6586778163909912, -1.4441654682159424, -1.2296531200408936, -1.0151408910751343, -0.800628662109375, -0.5861167907714844, -0.3716045022010803, -0.15709221363067627, 0.05742007493972778, 0.27193236351013184, 0.48644471168518066, 0.7009569406509399, 0.9154691696166992, 1.129981517791748, 1.3444938659667969, 1.5590060949325562, 1.7735183238983154, 1.9880306720733643, 2.202543020248413, 2.417055130004883, 2.6315674781799316, 2.8460798263549805, 3.0605921745300293, 3.275104522705078, 3.489616632461548, 3.7041289806365967, 3.9186413288116455, 4.133153438568115, 4.347665786743164, 4.562178134918213, 4.776690483093262, 4.9912028312683105, 5.205715179443359, 5.42022705078125, 5.634739875793457, 5.849251747131348, 6.0637640953063965, 6.278276443481445]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [6.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 14.0, 20.0, 35.0, 38.0, 70.0, 72.0, 154.0, 213.0, 291.0, 508.0, 725.0, 1230.0, 2042.0, 3146.0, 5205.0, 9251.0, 15775.0, 27693.0, 49693.0, 89325.0, 156435.0, 223943.0, 193733.0, 117800.0, 65269.0, 36076.0, 20480.0, 11829.0, 6909.0, 4027.0, 2445.0, 1504.0, 929.0, 568.0, 369.0, 233.0, 164.0, 88.0, 79.0, 64.0, 27.0, 31.0, 13.0, 12.0, 4.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4507865905761719, -0.43453216552734375, -0.4182777404785156, -0.4020233154296875, -0.3857688903808594, -0.36951446533203125, -0.3532600402832031, -0.337005615234375, -0.3207511901855469, -0.30449676513671875, -0.2882423400878906, -0.2719879150390625, -0.2557334899902344, -0.23947906494140625, -0.22322463989257812, -0.20697021484375, -0.19071578979492188, -0.17446136474609375, -0.15820693969726562, -0.1419525146484375, -0.12569808959960938, -0.10944366455078125, -0.09318923950195312, -0.076934814453125, -0.060680389404296875, -0.04442596435546875, -0.028171539306640625, -0.0119171142578125, 0.004337310791015625, 0.02059173583984375, 0.036846160888671875, 0.0531005859375, 0.06935501098632812, 0.08560943603515625, 0.10186386108398438, 0.1181182861328125, 0.13437271118164062, 0.15062713623046875, 0.16688156127929688, 0.183135986328125, 0.19939041137695312, 0.21564483642578125, 0.23189926147460938, 0.2481536865234375, 0.2644081115722656, 0.28066253662109375, 0.2969169616699219, 0.31317138671875, 0.3294258117675781, 0.34568023681640625, 0.3619346618652344, 0.3781890869140625, 0.3944435119628906, 0.41069793701171875, 0.4269523620605469, 0.443206787109375, 0.4594612121582031, 0.47571563720703125, 0.4919700622558594, 0.5082244873046875, 0.5244789123535156, 0.5407333374023438, 0.5569877624511719, 0.5732421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 9.0, 10.0, 8.0, 19.0, 25.0, 18.0, 17.0, 26.0, 41.0, 36.0, 47.0, 40.0, 44.0, 52.0, 46.0, 45.0, 37.0, 54.0, 36.0, 48.0, 48.0, 24.0, 26.0, 38.0, 28.0, 29.0, 20.0, 24.0, 15.0, 19.0, 14.0, 6.0, 4.0, 7.0, 6.0, 3.0, 7.0, 0.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52880859375, -0.5100021362304688, -0.4911956787109375, -0.47238922119140625, -0.453582763671875, -0.43477630615234375, -0.4159698486328125, -0.39716339111328125, -0.37835693359375, -0.35955047607421875, -0.3407440185546875, -0.32193756103515625, -0.303131103515625, -0.28432464599609375, -0.2655181884765625, -0.24671173095703125, -0.2279052734375, -0.20909881591796875, -0.1902923583984375, -0.17148590087890625, -0.152679443359375, -0.13387298583984375, -0.1150665283203125, -0.09626007080078125, -0.07745361328125, -0.05864715576171875, -0.0398406982421875, -0.02103424072265625, -0.002227783203125, 0.01657867431640625, 0.0353851318359375, 0.05419158935546875, 0.072998046875, 0.09180450439453125, 0.1106109619140625, 0.12941741943359375, 0.148223876953125, 0.16703033447265625, 0.1858367919921875, 0.20464324951171875, 0.22344970703125, 0.24225616455078125, 0.2610626220703125, 0.27986907958984375, 0.298675537109375, 0.31748199462890625, 0.3362884521484375, 0.35509490966796875, 0.3739013671875, 0.39270782470703125, 0.4115142822265625, 0.43032073974609375, 0.449127197265625, 0.46793365478515625, 0.4867401123046875, 0.5055465698242188, 0.52435302734375, 0.5431594848632812, 0.5619659423828125, 0.5807723999023438, 0.599578857421875, 0.6183853149414062, 0.6371917724609375, 0.6559982299804688, 0.6748046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 9.0, 8.0, 11.0, 18.0, 22.0, 25.0, 69.0, 73.0, 127.0, 205.0, 378.0, 770.0, 2221.0, 11783.0, 132598.0, 821244.0, 68295.0, 7373.0, 1735.0, 688.0, 357.0, 178.0, 129.0, 80.0, 47.0, 32.0, 27.0, 16.0, 14.0, 3.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.589935302734375, -2.50994873046875, -2.429962158203125, -2.3499755859375, -2.269989013671875, -2.19000244140625, -2.110015869140625, -2.030029296875, -1.950042724609375, -1.87005615234375, -1.790069580078125, -1.7100830078125, -1.630096435546875, -1.55010986328125, -1.470123291015625, -1.39013671875, -1.310150146484375, -1.23016357421875, -1.150177001953125, -1.0701904296875, -0.990203857421875, -0.91021728515625, -0.830230712890625, -0.750244140625, -0.670257568359375, -0.59027099609375, -0.510284423828125, -0.4302978515625, -0.350311279296875, -0.27032470703125, -0.190338134765625, -0.1103515625, -0.030364990234375, 0.04962158203125, 0.129608154296875, 0.2095947265625, 0.289581298828125, 0.36956787109375, 0.449554443359375, 0.529541015625, 0.609527587890625, 0.68951416015625, 0.769500732421875, 0.8494873046875, 0.929473876953125, 1.00946044921875, 1.089447021484375, 1.16943359375, 1.249420166015625, 1.32940673828125, 1.409393310546875, 1.4893798828125, 1.569366455078125, 1.64935302734375, 1.729339599609375, 1.809326171875, 1.889312744140625, 1.96929931640625, 2.049285888671875, 2.1292724609375, 2.209259033203125, 2.28924560546875, 2.369232177734375, 2.44921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 5.0, 13.0, 9.0, 11.0, 17.0, 21.0, 18.0, 26.0, 29.0, 31.0, 33.0, 38.0, 45.0, 37.0, 57.0, 50.0, 66.0, 52.0, 57.0, 36.0, 44.0, 36.0, 35.0, 29.0, 26.0, 37.0, 21.0, 20.0, 15.0, 11.0, 4.0, 18.0, 12.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.10394287109375, -2.0360107421875, -1.96807861328125, -1.900146484375, -1.83221435546875, -1.7642822265625, -1.69635009765625, -1.62841796875, -1.56048583984375, -1.4925537109375, -1.42462158203125, -1.356689453125, -1.28875732421875, -1.2208251953125, -1.15289306640625, -1.0849609375, -1.01702880859375, -0.9490966796875, -0.88116455078125, -0.813232421875, -0.74530029296875, -0.6773681640625, -0.60943603515625, -0.54150390625, -0.47357177734375, -0.4056396484375, -0.33770751953125, -0.269775390625, -0.20184326171875, -0.1339111328125, -0.06597900390625, 0.001953125, 0.06988525390625, 0.1378173828125, 0.20574951171875, 0.273681640625, 0.34161376953125, 0.4095458984375, 0.47747802734375, 0.54541015625, 0.61334228515625, 0.6812744140625, 0.74920654296875, 0.817138671875, 0.88507080078125, 0.9530029296875, 1.02093505859375, 1.0888671875, 1.15679931640625, 1.2247314453125, 1.29266357421875, 1.360595703125, 1.42852783203125, 1.4964599609375, 1.56439208984375, 1.63232421875, 1.70025634765625, 1.7681884765625, 1.83612060546875, 1.904052734375, 1.97198486328125, 2.0399169921875, 2.10784912109375, 2.17578125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 14.0, 13.0, 30.0, 45.0, 77.0, 109.0, 245.0, 671.0, 2086.0, 8020.0, 54119.0, 796102.0, 164318.0, 17108.0, 3666.0, 1099.0, 415.0, 149.0, 92.0, 51.0, 31.0, 18.0, 23.0, 8.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.77880859375, -0.7534561157226562, -0.7281036376953125, -0.7027511596679688, -0.677398681640625, -0.6520462036132812, -0.6266937255859375, -0.6013412475585938, -0.57598876953125, -0.5506362915039062, -0.5252838134765625, -0.49993133544921875, -0.474578857421875, -0.44922637939453125, -0.4238739013671875, -0.39852142333984375, -0.3731689453125, -0.34781646728515625, -0.3224639892578125, -0.29711151123046875, -0.271759033203125, -0.24640655517578125, -0.2210540771484375, -0.19570159912109375, -0.17034912109375, -0.14499664306640625, -0.1196441650390625, -0.09429168701171875, -0.068939208984375, -0.04358673095703125, -0.0182342529296875, 0.00711822509765625, 0.032470703125, 0.05782318115234375, 0.0831756591796875, 0.10852813720703125, 0.133880615234375, 0.15923309326171875, 0.1845855712890625, 0.20993804931640625, 0.23529052734375, 0.26064300537109375, 0.2859954833984375, 0.31134796142578125, 0.336700439453125, 0.36205291748046875, 0.3874053955078125, 0.41275787353515625, 0.4381103515625, 0.46346282958984375, 0.4888153076171875, 0.5141677856445312, 0.539520263671875, 0.5648727416992188, 0.5902252197265625, 0.6155776977539062, 0.64093017578125, 0.6662826538085938, 0.6916351318359375, 0.7169876098632812, 0.742340087890625, 0.7676925659179688, 0.7930450439453125, 0.8183975219726562, 0.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 30.0, 37.0, 52.0, 85.0, 148.0, 177.0, 166.0, 118.0, 65.0, 39.0, 23.0, 12.0, 10.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003266334533691406, -0.000317256897687912, -0.00030788034200668335, -0.0002985037863254547, -0.0002891272306442261, -0.00027975067496299744, -0.0002703741192817688, -0.00026099756360054016, -0.0002516210079193115, -0.00024224445223808289, -0.00023286789655685425, -0.0002234913408756256, -0.00021411478519439697, -0.00020473822951316833, -0.0001953616738319397, -0.00018598511815071106, -0.00017660856246948242, -0.00016723200678825378, -0.00015785545110702515, -0.0001484788954257965, -0.00013910233974456787, -0.00012972578406333923, -0.0001203492283821106, -0.00011097267270088196, -0.00010159611701965332, -9.221956133842468e-05, -8.284300565719604e-05, -7.346644997596741e-05, -6.408989429473877e-05, -5.471333861351013e-05, -4.5336782932281494e-05, -3.5960227251052856e-05, -2.658367156982422e-05, -1.720711588859558e-05, -7.830560207366943e-06, 1.5459954738616943e-06, 1.0922551155090332e-05, 2.029910683631897e-05, 2.9675662517547607e-05, 3.9052218198776245e-05, 4.842877388000488e-05, 5.780532956123352e-05, 6.718188524246216e-05, 7.65584409236908e-05, 8.593499660491943e-05, 9.531155228614807e-05, 0.00010468810796737671, 0.00011406466364860535, 0.00012344121932983398, 0.00013281777501106262, 0.00014219433069229126, 0.0001515708863735199, 0.00016094744205474854, 0.00017032399773597717, 0.0001797005534172058, 0.00018907710909843445, 0.00019845366477966309, 0.00020783022046089172, 0.00021720677614212036, 0.000226583331823349, 0.00023595988750457764, 0.0002453364431858063, 0.0002547129988670349, 0.00026408955454826355, 0.0002734661102294922]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 34.0, 44.0, 100.0, 327.0, 1349.0, 26678.0, 1004701.0, 13735.0, 1089.0, 284.0, 93.0, 36.0, 33.0, 8.0, 6.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.247100830078125, -2.17779541015625, -2.108489990234375, -2.0391845703125, -1.969879150390625, -1.90057373046875, -1.831268310546875, -1.761962890625, -1.692657470703125, -1.62335205078125, -1.554046630859375, -1.4847412109375, -1.415435791015625, -1.34613037109375, -1.276824951171875, -1.20751953125, -1.138214111328125, -1.06890869140625, -0.999603271484375, -0.9302978515625, -0.860992431640625, -0.79168701171875, -0.722381591796875, -0.653076171875, -0.583770751953125, -0.51446533203125, -0.445159912109375, -0.3758544921875, -0.306549072265625, -0.23724365234375, -0.167938232421875, -0.0986328125, -0.029327392578125, 0.03997802734375, 0.109283447265625, 0.1785888671875, 0.247894287109375, 0.31719970703125, 0.386505126953125, 0.455810546875, 0.525115966796875, 0.59442138671875, 0.663726806640625, 0.7330322265625, 0.802337646484375, 0.87164306640625, 0.940948486328125, 1.01025390625, 1.079559326171875, 1.14886474609375, 1.218170166015625, 1.2874755859375, 1.356781005859375, 1.42608642578125, 1.495391845703125, 1.564697265625, 1.634002685546875, 1.70330810546875, 1.772613525390625, 1.8419189453125, 1.911224365234375, 1.98052978515625, 2.049835205078125, 2.119140625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 6.0, 13.0, 27.0, 90.0, 186.0, 266.0, 195.0, 119.0, 50.0, 17.0, 13.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6279296875, -1.579620361328125, -1.53131103515625, -1.483001708984375, -1.4346923828125, -1.386383056640625, -1.33807373046875, -1.289764404296875, -1.241455078125, -1.193145751953125, -1.14483642578125, -1.096527099609375, -1.0482177734375, -0.999908447265625, -0.95159912109375, -0.903289794921875, -0.85498046875, -0.806671142578125, -0.75836181640625, -0.710052490234375, -0.6617431640625, -0.613433837890625, -0.56512451171875, -0.516815185546875, -0.468505859375, -0.420196533203125, -0.37188720703125, -0.323577880859375, -0.2752685546875, -0.226959228515625, -0.17864990234375, -0.130340576171875, -0.08203125, -0.033721923828125, 0.01458740234375, 0.062896728515625, 0.1112060546875, 0.159515380859375, 0.20782470703125, 0.256134033203125, 0.304443359375, 0.352752685546875, 0.40106201171875, 0.449371337890625, 0.4976806640625, 0.545989990234375, 0.59429931640625, 0.642608642578125, 0.69091796875, 0.739227294921875, 0.78753662109375, 0.835845947265625, 0.8841552734375, 0.932464599609375, 0.98077392578125, 1.029083251953125, 1.077392578125, 1.125701904296875, 1.17401123046875, 1.222320556640625, 1.2706298828125, 1.318939208984375, 1.36724853515625, 1.415557861328125, 1.4638671875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 6.0, 12.0, 27.0, 72.0, 119.0, 317.0, 283.0, 101.0, 43.0, 15.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.00189971923828, -29.363317489624023, -28.724735260009766, -28.086153030395508, -27.44757080078125, -26.80898666381836, -26.1704044342041, -25.531822204589844, -24.893239974975586, -24.254657745361328, -23.61607551574707, -22.977493286132812, -22.338909149169922, -21.700326919555664, -21.061744689941406, -20.42316246032715, -19.78458023071289, -19.145998001098633, -18.507415771484375, -17.868833541870117, -17.23025131225586, -16.59166717529297, -15.953084945678711, -15.314502716064453, -14.675920486450195, -14.037338256835938, -13.39875602722168, -12.760172843933105, -12.121590614318848, -11.48300838470459, -10.844425201416016, -10.205842971801758, -9.5672607421875, -8.928678512573242, -8.290096282958984, -7.65151309967041, -7.012930870056152, -6.3743486404418945, -5.7357659339904785, -5.0971832275390625, -4.458600997924805, -3.8200185298919678, -3.181436061859131, -2.542853593826294, -1.904271125793457, -1.2656886577606201, -0.6271061897277832, 0.011476516723632812, 0.6500587463378906, 1.2886412143707275, 1.9272236824035645, 2.5658061504364014, 3.2043886184692383, 3.842971086502075, 4.481553554534912, 5.120136260986328, 5.758718490600586, 6.397300720214844, 7.03588342666626, 7.674466133117676, 8.313048362731934, 8.951630592346191, 9.590213775634766, 10.228796005249023, 10.867378234863281]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 4.0, 13.0, 11.0, 7.0, 16.0, 17.0, 16.0, 17.0, 18.0, 18.0, 28.0, 37.0, 23.0, 26.0, 32.0, 42.0, 48.0, 103.0, 102.0, 66.0, 32.0, 27.0, 26.0, 32.0, 30.0, 33.0, 25.0, 14.0, 18.0, 7.0, 5.0, 10.0, 8.0, 12.0, 9.0, 6.0, 12.0, 2.0, 1.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.52434778213501, -7.28047513961792, -7.03660249710083, -6.79272985458374, -6.54885721206665, -6.3049845695495605, -6.0611114501953125, -5.817238807678223, -5.573366165161133, -5.329493522644043, -5.085620880126953, -4.841748237609863, -4.597875595092773, -4.354002952575684, -4.110130310058594, -3.866257429122925, -3.622385025024414, -3.378512382507324, -3.1346397399902344, -2.8907670974731445, -2.6468944549560547, -2.403021812438965, -2.159148931503296, -1.915276288986206, -1.6714036464691162, -1.4275310039520264, -1.1836583614349365, -0.9397855997085571, -0.6959129571914673, -0.45204031467437744, -0.20816755294799805, 0.0357050895690918, 0.27957820892333984, 0.5234508514404297, 0.7673235535621643, 1.011196255683899, 1.2550688982009888, 1.4989415407180786, 1.742814302444458, 1.9866869449615479, 2.2305595874786377, 2.4744322299957275, 2.7183048725128174, 2.9621777534484863, 3.206050395965576, 3.449923038482666, 3.693795680999756, 3.9376683235168457, 4.1815409660339355, 4.425413608551025, 4.669286251068115, 4.913158893585205, 5.157031536102295, 5.400904178619385, 5.644777297973633, 5.888649940490723, 6.1325225830078125, 6.376395225524902, 6.620267868041992, 6.864140510559082, 7.108013153076172, 7.351885795593262, 7.595758438110352, 7.839631080627441, 8.083503723144531]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 12.0, 14.0, 27.0, 30.0, 62.0, 68.0, 113.0, 152.0, 253.0, 453.0, 821.0, 1372.0, 2826.0, 6271.0, 17395.0, 64374.0, 282624.0, 1158681.0, 1865685.0, 612018.0, 130787.0, 31826.0, 9844.0, 4040.0, 1927.0, 1059.0, 554.0, 357.0, 215.0, 129.0, 93.0, 54.0, 40.0, 25.0, 20.0, 17.0, 7.0, 10.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.60693359375, -0.58868408203125, -0.5704345703125, -0.55218505859375, -0.533935546875, -0.51568603515625, -0.4974365234375, -0.47918701171875, -0.4609375, -0.44268798828125, -0.4244384765625, -0.40618896484375, -0.387939453125, -0.36968994140625, -0.3514404296875, -0.33319091796875, -0.31494140625, -0.29669189453125, -0.2784423828125, -0.26019287109375, -0.241943359375, -0.22369384765625, -0.2054443359375, -0.18719482421875, -0.1689453125, -0.15069580078125, -0.1324462890625, -0.11419677734375, -0.095947265625, -0.07769775390625, -0.0594482421875, -0.04119873046875, -0.02294921875, -0.00469970703125, 0.0135498046875, 0.03179931640625, 0.050048828125, 0.06829833984375, 0.0865478515625, 0.10479736328125, 0.123046875, 0.14129638671875, 0.1595458984375, 0.17779541015625, 0.196044921875, 0.21429443359375, 0.2325439453125, 0.25079345703125, 0.26904296875, 0.28729248046875, 0.3055419921875, 0.32379150390625, 0.342041015625, 0.36029052734375, 0.3785400390625, 0.39678955078125, 0.4150390625, 0.43328857421875, 0.4515380859375, 0.46978759765625, 0.488037109375, 0.50628662109375, 0.5245361328125, 0.54278564453125, 0.56103515625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 0.0, 9.0, 6.0, 10.0, 10.0, 9.0, 15.0, 12.0, 21.0, 22.0, 21.0, 25.0, 37.0, 33.0, 35.0, 31.0, 42.0, 34.0, 43.0, 41.0, 45.0, 34.0, 34.0, 58.0, 34.0, 34.0, 35.0, 22.0, 37.0, 30.0, 33.0, 21.0, 14.0, 13.0, 21.0, 15.0, 13.0, 10.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.52099609375, -0.504150390625, -0.4873046875, -0.470458984375, -0.45361328125, -0.436767578125, -0.419921875, -0.403076171875, -0.38623046875, -0.369384765625, -0.3525390625, -0.335693359375, -0.31884765625, -0.302001953125, -0.28515625, -0.268310546875, -0.25146484375, -0.234619140625, -0.2177734375, -0.200927734375, -0.18408203125, -0.167236328125, -0.150390625, -0.133544921875, -0.11669921875, -0.099853515625, -0.0830078125, -0.066162109375, -0.04931640625, -0.032470703125, -0.015625, 0.001220703125, 0.01806640625, 0.034912109375, 0.0517578125, 0.068603515625, 0.08544921875, 0.102294921875, 0.119140625, 0.135986328125, 0.15283203125, 0.169677734375, 0.1865234375, 0.203369140625, 0.22021484375, 0.237060546875, 0.25390625, 0.270751953125, 0.28759765625, 0.304443359375, 0.3212890625, 0.338134765625, 0.35498046875, 0.371826171875, 0.388671875, 0.405517578125, 0.42236328125, 0.439208984375, 0.4560546875, 0.472900390625, 0.48974609375, 0.506591796875, 0.5234375, 0.540283203125, 0.55712890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 17.0, 41.0, 117.0, 290.0, 1041.0, 19763.0, 4152367.0, 19013.0, 1106.0, 295.0, 116.0, 52.0, 27.0, 10.0, 10.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.21209716796875, -4.0531005859375, -3.89410400390625, -3.735107421875, -3.57611083984375, -3.4171142578125, -3.25811767578125, -3.09912109375, -2.94012451171875, -2.7811279296875, -2.62213134765625, -2.463134765625, -2.30413818359375, -2.1451416015625, -1.98614501953125, -1.8271484375, -1.66815185546875, -1.5091552734375, -1.35015869140625, -1.191162109375, -1.03216552734375, -0.8731689453125, -0.71417236328125, -0.55517578125, -0.39617919921875, -0.2371826171875, -0.07818603515625, 0.080810546875, 0.23980712890625, 0.3988037109375, 0.55780029296875, 0.716796875, 0.87579345703125, 1.0347900390625, 1.19378662109375, 1.352783203125, 1.51177978515625, 1.6707763671875, 1.82977294921875, 1.98876953125, 2.14776611328125, 2.3067626953125, 2.46575927734375, 2.624755859375, 2.78375244140625, 2.9427490234375, 3.10174560546875, 3.2607421875, 3.41973876953125, 3.5787353515625, 3.73773193359375, 3.896728515625, 4.05572509765625, 4.2147216796875, 4.37371826171875, 4.53271484375, 4.69171142578125, 4.8507080078125, 5.00970458984375, 5.168701171875, 5.32769775390625, 5.4866943359375, 5.64569091796875, 5.8046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 5.0, 6.0, 3.0, 7.0, 14.0, 41.0, 88.0, 178.0, 383.0, 880.0, 1175.0, 710.0, 292.0, 142.0, 57.0, 44.0, 22.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.678985595703125, -1.60992431640625, -1.540863037109375, -1.4718017578125, -1.402740478515625, -1.33367919921875, -1.264617919921875, -1.195556640625, -1.126495361328125, -1.05743408203125, -0.988372802734375, -0.9193115234375, -0.850250244140625, -0.78118896484375, -0.712127685546875, -0.64306640625, -0.574005126953125, -0.50494384765625, -0.435882568359375, -0.3668212890625, -0.297760009765625, -0.22869873046875, -0.159637451171875, -0.090576171875, -0.021514892578125, 0.04754638671875, 0.116607666015625, 0.1856689453125, 0.254730224609375, 0.32379150390625, 0.392852783203125, 0.4619140625, 0.530975341796875, 0.60003662109375, 0.669097900390625, 0.7381591796875, 0.807220458984375, 0.87628173828125, 0.945343017578125, 1.014404296875, 1.083465576171875, 1.15252685546875, 1.221588134765625, 1.2906494140625, 1.359710693359375, 1.42877197265625, 1.497833251953125, 1.56689453125, 1.635955810546875, 1.70501708984375, 1.774078369140625, 1.8431396484375, 1.912200927734375, 1.98126220703125, 2.050323486328125, 2.119384765625, 2.188446044921875, 2.25750732421875, 2.326568603515625, 2.3956298828125, 2.464691162109375, 2.53375244140625, 2.602813720703125, 2.671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 19.0, 45.0, 172.0, 361.0, 255.0, 85.0, 32.0, 20.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.079544067382812, -11.24988079071045, -10.420218467712402, -9.590555191040039, -8.760892868041992, -7.931229591369629, -7.101566314697266, -6.2719035148620605, -5.4422407150268555, -4.61257791519165, -3.782914876937866, -2.953251838684082, -2.123589038848877, -1.2939262390136719, -0.4642629623413086, 0.3653998374938965, 1.1950626373291016, 2.0247254371643066, 2.854388475418091, 3.684051513671875, 4.51371431350708, 5.343377113342285, 6.173040390014648, 7.0027031898498535, 7.832365989685059, 8.662029266357422, 9.491691589355469, 10.321354866027832, 11.151018142700195, 11.980680465698242, 12.810343742370605, 13.640007019042969, 14.469669342041016, 15.299332618713379, 16.128995895385742, 16.95865821838379, 17.788320541381836, 18.617984771728516, 19.447647094726562, 20.27730941772461, 21.106971740722656, 21.936634063720703, 22.766298294067383, 23.59596061706543, 24.425622940063477, 25.255287170410156, 26.084949493408203, 26.91461181640625, 27.74427604675293, 28.573938369750977, 29.403602600097656, 30.233264923095703, 31.06292724609375, 31.892589569091797, 32.722251892089844, 33.551918029785156, 34.3815803527832, 35.21124267578125, 36.0409049987793, 36.870567321777344, 37.700233459472656, 38.5298957824707, 39.35955810546875, 40.1892204284668, 41.018882751464844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 23.0, 35.0, 37.0, 35.0, 39.0, 43.0, 65.0, 43.0, 46.0, 40.0, 47.0, 44.0, 50.0, 55.0, 38.0, 36.0, 30.0, 35.0, 31.0, 31.0, 29.0, 18.0, 18.0, 15.0, 8.0, 7.0, 13.0, 7.0, 4.0, 8.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.137204170227051, -6.908017635345459, -6.678831100463867, -6.449645042419434, -6.220458507537842, -5.99127197265625, -5.762085437774658, -5.532898902893066, -5.303712368011475, -5.074525833129883, -4.845339298248291, -4.616152763366699, -4.386966705322266, -4.157780170440674, -3.928593635559082, -3.6994071006774902, -3.4702208042144775, -3.2410342693328857, -3.011847972869873, -2.7826614379882812, -2.5534749031066895, -2.3242883682250977, -2.095102071762085, -1.8659155368804932, -1.636729121208191, -1.4075427055358887, -1.1783561706542969, -0.9491697549819946, -0.7199832797050476, -0.4907968044281006, -0.26161038875579834, -0.03242385387420654, 0.1967625617980957, 0.4259490370750427, 0.6551355123519897, 0.884321928024292, 1.1135084629058838, 1.342694878578186, 1.5718812942504883, 1.80106782913208, 2.030254364013672, 2.2594408988952637, 2.4886271953582764, 2.717813730239868, 2.94700026512146, 3.1761865615844727, 3.4053730964660645, 3.6345596313476562, 3.863745927810669, 4.092932224273682, 4.322118759155273, 4.551305294036865, 4.780491828918457, 5.009678363800049, 5.238864898681641, 5.468050956726074, 5.697237491607666, 5.926424026489258, 6.15561056137085, 6.384797096252441, 6.613983154296875, 6.843169689178467, 7.072356224060059, 7.30154275894165, 7.530729293823242]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 9.0, 9.0, 7.0, 19.0, 34.0, 39.0, 44.0, 78.0, 128.0, 184.0, 286.0, 431.0, 670.0, 1104.0, 1641.0, 2820.0, 4775.0, 8109.0, 14518.0, 27257.0, 53189.0, 107500.0, 212368.0, 271908.0, 167528.0, 82562.0, 41531.0, 21577.0, 11780.0, 6430.0, 3757.0, 2294.0, 1444.0, 882.0, 521.0, 367.0, 258.0, 177.0, 111.0, 55.0, 51.0, 34.0, 30.0, 13.0, 16.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61474609375, -0.5922393798828125, -0.569732666015625, -0.5472259521484375, -0.52471923828125, -0.5022125244140625, -0.479705810546875, -0.4571990966796875, -0.4346923828125, -0.4121856689453125, -0.389678955078125, -0.3671722412109375, -0.34466552734375, -0.3221588134765625, -0.299652099609375, -0.2771453857421875, -0.254638671875, -0.2321319580078125, -0.209625244140625, -0.1871185302734375, -0.16461181640625, -0.1421051025390625, -0.119598388671875, -0.0970916748046875, -0.0745849609375, -0.0520782470703125, -0.029571533203125, -0.0070648193359375, 0.01544189453125, 0.0379486083984375, 0.060455322265625, 0.0829620361328125, 0.10546875, 0.1279754638671875, 0.150482177734375, 0.1729888916015625, 0.19549560546875, 0.2180023193359375, 0.240509033203125, 0.2630157470703125, 0.2855224609375, 0.3080291748046875, 0.330535888671875, 0.3530426025390625, 0.37554931640625, 0.3980560302734375, 0.420562744140625, 0.4430694580078125, 0.465576171875, 0.4880828857421875, 0.510589599609375, 0.5330963134765625, 0.55560302734375, 0.5781097412109375, 0.600616455078125, 0.6231231689453125, 0.6456298828125, 0.6681365966796875, 0.690643310546875, 0.7131500244140625, 0.73565673828125, 0.7581634521484375, 0.780670166015625, 0.8031768798828125, 0.82568359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 10.0, 5.0, 5.0, 4.0, 15.0, 14.0, 14.0, 15.0, 20.0, 23.0, 29.0, 32.0, 35.0, 32.0, 34.0, 56.0, 37.0, 41.0, 41.0, 44.0, 54.0, 51.0, 49.0, 31.0, 48.0, 37.0, 23.0, 26.0, 28.0, 24.0, 15.0, 16.0, 19.0, 13.0, 13.0, 5.0, 6.0, 7.0, 7.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.572265625, -0.5529861450195312, -0.5337066650390625, -0.5144271850585938, -0.495147705078125, -0.47586822509765625, -0.4565887451171875, -0.43730926513671875, -0.41802978515625, -0.39875030517578125, -0.3794708251953125, -0.36019134521484375, -0.340911865234375, -0.32163238525390625, -0.3023529052734375, -0.28307342529296875, -0.2637939453125, -0.24451446533203125, -0.2252349853515625, -0.20595550537109375, -0.186676025390625, -0.16739654541015625, -0.1481170654296875, -0.12883758544921875, -0.10955810546875, -0.09027862548828125, -0.0709991455078125, -0.05171966552734375, -0.032440185546875, -0.01316070556640625, 0.0061187744140625, 0.02539825439453125, 0.044677734375, 0.06395721435546875, 0.0832366943359375, 0.10251617431640625, 0.121795654296875, 0.14107513427734375, 0.1603546142578125, 0.17963409423828125, 0.19891357421875, 0.21819305419921875, 0.2374725341796875, 0.25675201416015625, 0.276031494140625, 0.29531097412109375, 0.3145904541015625, 0.33386993408203125, 0.3531494140625, 0.37242889404296875, 0.3917083740234375, 0.41098785400390625, 0.430267333984375, 0.44954681396484375, 0.4688262939453125, 0.48810577392578125, 0.50738525390625, 0.5266647338867188, 0.5459442138671875, 0.5652236938476562, 0.584503173828125, 0.6037826538085938, 0.6230621337890625, 0.6423416137695312, 0.66162109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 7.0, 8.0, 17.0, 16.0, 28.0, 32.0, 64.0, 98.0, 149.0, 243.0, 416.0, 883.0, 2438.0, 15990.0, 772546.0, 242044.0, 9895.0, 1924.0, 791.0, 396.0, 221.0, 123.0, 81.0, 38.0, 32.0, 23.0, 21.0, 5.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.39453125, -4.275421142578125, -4.15631103515625, -4.037200927734375, -3.9180908203125, -3.798980712890625, -3.67987060546875, -3.560760498046875, -3.441650390625, -3.322540283203125, -3.20343017578125, -3.084320068359375, -2.9652099609375, -2.846099853515625, -2.72698974609375, -2.607879638671875, -2.48876953125, -2.369659423828125, -2.25054931640625, -2.131439208984375, -2.0123291015625, -1.893218994140625, -1.77410888671875, -1.654998779296875, -1.535888671875, -1.416778564453125, -1.29766845703125, -1.178558349609375, -1.0594482421875, -0.940338134765625, -0.82122802734375, -0.702117919921875, -0.5830078125, -0.463897705078125, -0.34478759765625, -0.225677490234375, -0.1065673828125, 0.012542724609375, 0.13165283203125, 0.250762939453125, 0.369873046875, 0.488983154296875, 0.60809326171875, 0.727203369140625, 0.8463134765625, 0.965423583984375, 1.08453369140625, 1.203643798828125, 1.32275390625, 1.441864013671875, 1.56097412109375, 1.680084228515625, 1.7991943359375, 1.918304443359375, 2.03741455078125, 2.156524658203125, 2.275634765625, 2.394744873046875, 2.51385498046875, 2.632965087890625, 2.7520751953125, 2.871185302734375, 2.99029541015625, 3.109405517578125, 3.228515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 7.0, 4.0, 2.0, 7.0, 9.0, 12.0, 8.0, 15.0, 18.0, 22.0, 19.0, 29.0, 29.0, 26.0, 44.0, 44.0, 42.0, 52.0, 57.0, 60.0, 57.0, 51.0, 54.0, 43.0, 53.0, 30.0, 32.0, 27.0, 29.0, 19.0, 16.0, 11.0, 19.0, 5.0, 7.0, 5.0, 8.0, 3.0, 1.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.322509765625, -2.24658203125, -2.170654296875, -2.0947265625, -2.018798828125, -1.94287109375, -1.866943359375, -1.791015625, -1.715087890625, -1.63916015625, -1.563232421875, -1.4873046875, -1.411376953125, -1.33544921875, -1.259521484375, -1.18359375, -1.107666015625, -1.03173828125, -0.955810546875, -0.8798828125, -0.803955078125, -0.72802734375, -0.652099609375, -0.576171875, -0.500244140625, -0.42431640625, -0.348388671875, -0.2724609375, -0.196533203125, -0.12060546875, -0.044677734375, 0.03125, 0.107177734375, 0.18310546875, 0.259033203125, 0.3349609375, 0.410888671875, 0.48681640625, 0.562744140625, 0.638671875, 0.714599609375, 0.79052734375, 0.866455078125, 0.9423828125, 1.018310546875, 1.09423828125, 1.170166015625, 1.24609375, 1.322021484375, 1.39794921875, 1.473876953125, 1.5498046875, 1.625732421875, 1.70166015625, 1.777587890625, 1.853515625, 1.929443359375, 2.00537109375, 2.081298828125, 2.1572265625, 2.233154296875, 2.30908203125, 2.385009765625, 2.4609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 1.0, 14.0, 9.0, 8.0, 5.0, 14.0, 27.0, 34.0, 52.0, 80.0, 117.0, 206.0, 437.0, 897.0, 2509.0, 9615.0, 55684.0, 760473.0, 188027.0, 22418.0, 4888.0, 1597.0, 635.0, 314.0, 189.0, 95.0, 60.0, 36.0, 29.0, 19.0, 9.0, 8.0, 6.0, 9.0, 2.0, 5.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6845703125, -0.6648788452148438, -0.6451873779296875, -0.6254959106445312, -0.605804443359375, -0.5861129760742188, -0.5664215087890625, -0.5467300415039062, -0.52703857421875, -0.5073471069335938, -0.4876556396484375, -0.46796417236328125, -0.448272705078125, -0.42858123779296875, -0.4088897705078125, -0.38919830322265625, -0.3695068359375, -0.34981536865234375, -0.3301239013671875, -0.31043243408203125, -0.290740966796875, -0.27104949951171875, -0.2513580322265625, -0.23166656494140625, -0.21197509765625, -0.19228363037109375, -0.1725921630859375, -0.15290069580078125, -0.133209228515625, -0.11351776123046875, -0.0938262939453125, -0.07413482666015625, -0.054443359375, -0.03475189208984375, -0.0150604248046875, 0.00463104248046875, 0.024322509765625, 0.04401397705078125, 0.0637054443359375, 0.08339691162109375, 0.10308837890625, 0.12277984619140625, 0.1424713134765625, 0.16216278076171875, 0.181854248046875, 0.20154571533203125, 0.2212371826171875, 0.24092864990234375, 0.2606201171875, 0.28031158447265625, 0.3000030517578125, 0.31969451904296875, 0.339385986328125, 0.35907745361328125, 0.3787689208984375, 0.39846038818359375, 0.41815185546875, 0.43784332275390625, 0.4575347900390625, 0.47722625732421875, 0.496917724609375, 0.5166091918945312, 0.5363006591796875, 0.5559921264648438, 0.57568359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 13.0, 19.0, 22.0, 45.0, 83.0, 120.0, 190.0, 184.0, 98.0, 83.0, 38.0, 24.0, 22.0, 13.0, 10.0, 12.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003020763397216797, -0.0002916567027568817, -0.00028123706579208374, -0.00027081742882728577, -0.0002603977918624878, -0.0002499781548976898, -0.00023955851793289185, -0.00022913888096809387, -0.0002187192440032959, -0.00020829960703849792, -0.00019787997007369995, -0.00018746033310890198, -0.000177040696144104, -0.00016662105917930603, -0.00015620142221450806, -0.00014578178524971008, -0.0001353621482849121, -0.00012494251132011414, -0.00011452287435531616, -0.00010410323739051819, -9.368360042572021e-05, -8.326396346092224e-05, -7.284432649612427e-05, -6.24246895313263e-05, -5.200505256652832e-05, -4.158541560173035e-05, -3.116577863693237e-05, -2.07461416721344e-05, -1.0326504707336426e-05, 9.313225746154785e-08, 1.0512769222259521e-05, 2.0932406187057495e-05, 3.135204315185547e-05, 4.177168011665344e-05, 5.2191317081451416e-05, 6.261095404624939e-05, 7.303059101104736e-05, 8.345022797584534e-05, 9.386986494064331e-05, 0.00010428950190544128, 0.00011470913887023926, 0.00012512877583503723, 0.0001355484127998352, 0.00014596804976463318, 0.00015638768672943115, 0.00016680732369422913, 0.0001772269606590271, 0.00018764659762382507, 0.00019806623458862305, 0.00020848587155342102, 0.000218905508518219, 0.00022932514548301697, 0.00023974478244781494, 0.0002501644194126129, 0.0002605840563774109, 0.00027100369334220886, 0.00028142333030700684, 0.0002918429672718048, 0.0003022626042366028, 0.00031268224120140076, 0.00032310187816619873, 0.0003335215151309967, 0.0003439411520957947, 0.00035436078906059265, 0.0003647804260253906]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 1.0, 5.0, 8.0, 17.0, 23.0, 38.0, 46.0, 76.0, 107.0, 220.0, 445.0, 968.0, 3615.0, 22006.0, 671845.0, 325755.0, 18197.0, 3147.0, 1018.0, 442.0, 213.0, 115.0, 87.0, 44.0, 29.0, 17.0, 14.0, 10.0, 5.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.927734375, -0.9026336669921875, -0.877532958984375, -0.8524322509765625, -0.82733154296875, -0.8022308349609375, -0.777130126953125, -0.7520294189453125, -0.7269287109375, -0.7018280029296875, -0.676727294921875, -0.6516265869140625, -0.62652587890625, -0.6014251708984375, -0.576324462890625, -0.5512237548828125, -0.526123046875, -0.5010223388671875, -0.475921630859375, -0.4508209228515625, -0.42572021484375, -0.4006195068359375, -0.375518798828125, -0.3504180908203125, -0.3253173828125, -0.3002166748046875, -0.275115966796875, -0.2500152587890625, -0.22491455078125, -0.1998138427734375, -0.174713134765625, -0.1496124267578125, -0.12451171875, -0.0994110107421875, -0.074310302734375, -0.0492095947265625, -0.02410888671875, 0.0009918212890625, 0.026092529296875, 0.0511932373046875, 0.0762939453125, 0.1013946533203125, 0.126495361328125, 0.1515960693359375, 0.17669677734375, 0.2017974853515625, 0.226898193359375, 0.2519989013671875, 0.277099609375, 0.3022003173828125, 0.327301025390625, 0.3524017333984375, 0.37750244140625, 0.4026031494140625, 0.427703857421875, 0.4528045654296875, 0.4779052734375, 0.5030059814453125, 0.528106689453125, 0.5532073974609375, 0.57830810546875, 0.6034088134765625, 0.628509521484375, 0.6536102294921875, 0.6787109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 10.0, 15.0, 14.0, 21.0, 42.0, 35.0, 61.0, 84.0, 105.0, 103.0, 121.0, 93.0, 86.0, 54.0, 39.0, 30.0, 16.0, 12.0, 12.0, 9.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6493377685546875, -0.631195068359375, -0.6130523681640625, -0.59490966796875, -0.5767669677734375, -0.558624267578125, -0.5404815673828125, -0.5223388671875, -0.5041961669921875, -0.486053466796875, -0.4679107666015625, -0.44976806640625, -0.4316253662109375, -0.413482666015625, -0.3953399658203125, -0.377197265625, -0.3590545654296875, -0.340911865234375, -0.3227691650390625, -0.30462646484375, -0.2864837646484375, -0.268341064453125, -0.2501983642578125, -0.2320556640625, -0.2139129638671875, -0.195770263671875, -0.1776275634765625, -0.15948486328125, -0.1413421630859375, -0.123199462890625, -0.1050567626953125, -0.0869140625, -0.0687713623046875, -0.050628662109375, -0.0324859619140625, -0.01434326171875, 0.0037994384765625, 0.021942138671875, 0.0400848388671875, 0.0582275390625, 0.0763702392578125, 0.094512939453125, 0.1126556396484375, 0.13079833984375, 0.1489410400390625, 0.167083740234375, 0.1852264404296875, 0.203369140625, 0.2215118408203125, 0.239654541015625, 0.2577972412109375, 0.27593994140625, 0.2940826416015625, 0.312225341796875, 0.3303680419921875, 0.3485107421875, 0.3666534423828125, 0.384796142578125, 0.4029388427734375, 0.42108154296875, 0.4392242431640625, 0.457366943359375, 0.4755096435546875, 0.49365234375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 14.0, 62.0, 433.0, 398.0, 74.0, 16.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.4105110168457, -45.120765686035156, -43.83102035522461, -42.54127502441406, -41.251529693603516, -39.96178436279297, -38.67203903198242, -37.382293701171875, -36.09254455566406, -34.802799224853516, -33.51305389404297, -32.22330856323242, -30.933563232421875, -29.643817901611328, -28.35407066345215, -27.0643253326416, -25.774581909179688, -24.48483657836914, -23.195091247558594, -21.905345916748047, -20.6156005859375, -19.325855255126953, -18.036108016967773, -16.746362686157227, -15.45661735534668, -14.166872024536133, -12.877126693725586, -11.587380409240723, -10.297635078430176, -9.007889747619629, -7.718143939971924, -6.428398132324219, -5.1386566162109375, -3.8489110469818115, -2.5591654777526855, -1.2694199085235596, 0.020325660705566406, 1.3100709915161133, 2.5998167991638184, 3.8895626068115234, 5.17930793762207, 6.469053268432617, 7.758799076080322, 9.048544883728027, 10.338290214538574, 11.628035545349121, 12.917781829833984, 14.207527160644531, 15.497272491455078, 16.787017822265625, 18.076763153076172, 19.36650848388672, 20.656253814697266, 21.945999145507812, 23.235746383666992, 24.52549171447754, 25.815237045288086, 27.104982376098633, 28.39472770690918, 29.684473037719727, 30.974220275878906, 32.26396560668945, 33.5537109375, 34.84345626831055, 36.133201599121094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 7.0, 10.0, 10.0, 17.0, 18.0, 22.0, 18.0, 25.0, 44.0, 30.0, 20.0, 38.0, 53.0, 168.0, 168.0, 54.0, 44.0, 34.0, 24.0, 27.0, 18.0, 33.0, 17.0, 13.0, 11.0, 12.0, 15.0, 9.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53750991821289, -11.177508354187012, -10.81750774383545, -10.45750617980957, -10.097505569458008, -9.737504005432129, -9.37750244140625, -9.017501831054688, -8.657500267028809, -8.29749870300293, -7.937498092651367, -7.577496528625488, -7.217495441436768, -6.857494354248047, -6.497493267059326, -6.1374921798706055, -5.777491092681885, -5.417490005493164, -5.057488918304443, -4.697487831115723, -4.337486267089844, -3.977485179901123, -3.6174840927124023, -3.2574827671051025, -2.897481679916382, -2.537480592727661, -2.1774792671203613, -1.8174781799316406, -1.4574769735336304, -1.0974757671356201, -0.7374746799468994, -0.3774733543395996, -0.017472267150878906, 0.34252890944480896, 0.7025300860404968, 1.0625312328338623, 1.4225324392318726, 1.7825336456298828, 2.1425347328186035, 2.5025360584259033, 2.862537145614624, 3.2225382328033447, 3.5825395584106445, 3.9425406455993652, 4.302541732788086, 4.662543296813965, 5.022543907165527, 5.382545471191406, 5.742546558380127, 6.102547645568848, 6.462548732757568, 6.822549819946289, 7.182551383972168, 7.542552471160889, 7.902553558349609, 8.262555122375488, 8.62255573272705, 8.98255729675293, 9.342557907104492, 9.702559471130371, 10.062560081481934, 10.422561645507812, 10.782562255859375, 11.142563819885254, 11.502565383911133]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 12.0, 14.0, 29.0, 46.0, 101.0, 148.0, 320.0, 637.0, 1469.0, 3992.0, 13599.0, 77161.0, 894439.0, 2717211.0, 432710.0, 38969.0, 8289.0, 2832.0, 1146.0, 552.0, 260.0, 146.0, 79.0, 58.0, 31.0, 16.0, 11.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.85986328125, -0.8154296875, -0.77099609375, -0.7265625, -0.68212890625, -0.6376953125, -0.59326171875, -0.548828125, -0.50439453125, -0.4599609375, -0.41552734375, -0.37109375, -0.32666015625, -0.2822265625, -0.23779296875, -0.193359375, -0.14892578125, -0.1044921875, -0.06005859375, -0.015625, 0.02880859375, 0.0732421875, 0.11767578125, 0.162109375, 0.20654296875, 0.2509765625, 0.29541015625, 0.33984375, 0.38427734375, 0.4287109375, 0.47314453125, 0.517578125, 0.56201171875, 0.6064453125, 0.65087890625, 0.6953125, 0.73974609375, 0.7841796875, 0.82861328125, 0.873046875, 0.91748046875, 0.9619140625, 1.00634765625, 1.05078125, 1.09521484375, 1.1396484375, 1.18408203125, 1.228515625, 1.27294921875, 1.3173828125, 1.36181640625, 1.40625, 1.45068359375, 1.4951171875, 1.53955078125, 1.583984375, 1.62841796875, 1.6728515625, 1.71728515625, 1.76171875, 1.80615234375, 1.8505859375, 1.89501953125, 1.939453125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 7.0, 8.0, 12.0, 11.0, 22.0, 20.0, 32.0, 35.0, 41.0, 57.0, 55.0, 57.0, 53.0, 61.0, 62.0, 50.0, 76.0, 52.0, 44.0, 46.0, 47.0, 30.0, 21.0, 18.0, 21.0, 17.0, 13.0, 6.0, 6.0, 11.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.495880126953125, -0.47027587890625, -0.444671630859375, -0.4190673828125, -0.393463134765625, -0.36785888671875, -0.342254638671875, -0.316650390625, -0.291046142578125, -0.26544189453125, -0.239837646484375, -0.2142333984375, -0.188629150390625, -0.16302490234375, -0.137420654296875, -0.11181640625, -0.086212158203125, -0.06060791015625, -0.035003662109375, -0.0093994140625, 0.016204833984375, 0.04180908203125, 0.067413330078125, 0.093017578125, 0.118621826171875, 0.14422607421875, 0.169830322265625, 0.1954345703125, 0.221038818359375, 0.24664306640625, 0.272247314453125, 0.2978515625, 0.323455810546875, 0.34906005859375, 0.374664306640625, 0.4002685546875, 0.425872802734375, 0.45147705078125, 0.477081298828125, 0.502685546875, 0.528289794921875, 0.55389404296875, 0.579498291015625, 0.6051025390625, 0.630706787109375, 0.65631103515625, 0.681915283203125, 0.70751953125, 0.733123779296875, 0.75872802734375, 0.784332275390625, 0.8099365234375, 0.835540771484375, 0.86114501953125, 0.886749267578125, 0.912353515625, 0.937957763671875, 0.96356201171875, 0.989166259765625, 1.0147705078125, 1.040374755859375, 1.06597900390625, 1.091583251953125, 1.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 2.0, 2.0, 15.0, 45.0, 66.0, 127.0, 352.0, 868.0, 4737.0, 4020751.0, 163389.0, 2654.0, 691.0, 290.0, 143.0, 58.0, 34.0, 18.0, 12.0, 10.0, 4.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.07421875, -6.80047607421875, -6.5267333984375, -6.25299072265625, -5.979248046875, -5.70550537109375, -5.4317626953125, -5.15802001953125, -4.88427734375, -4.61053466796875, -4.3367919921875, -4.06304931640625, -3.789306640625, -3.51556396484375, -3.2418212890625, -2.96807861328125, -2.6943359375, -2.42059326171875, -2.1468505859375, -1.87310791015625, -1.599365234375, -1.32562255859375, -1.0518798828125, -0.77813720703125, -0.50439453125, -0.23065185546875, 0.0430908203125, 0.31683349609375, 0.590576171875, 0.86431884765625, 1.1380615234375, 1.41180419921875, 1.685546875, 1.95928955078125, 2.2330322265625, 2.50677490234375, 2.780517578125, 3.05426025390625, 3.3280029296875, 3.60174560546875, 3.87548828125, 4.14923095703125, 4.4229736328125, 4.69671630859375, 4.970458984375, 5.24420166015625, 5.5179443359375, 5.79168701171875, 6.0654296875, 6.33917236328125, 6.6129150390625, 6.88665771484375, 7.160400390625, 7.43414306640625, 7.7078857421875, 7.98162841796875, 8.25537109375, 8.52911376953125, 8.8028564453125, 9.07659912109375, 9.350341796875, 9.62408447265625, 9.8978271484375, 10.17156982421875, 10.4453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 21.0, 22.0, 49.0, 102.0, 199.0, 490.0, 1291.0, 1087.0, 430.0, 179.0, 99.0, 48.0, 25.0, 19.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.90557861328125, -1.7681884765625, -1.63079833984375, -1.493408203125, -1.35601806640625, -1.2186279296875, -1.08123779296875, -0.94384765625, -0.80645751953125, -0.6690673828125, -0.53167724609375, -0.394287109375, -0.25689697265625, -0.1195068359375, 0.01788330078125, 0.1552734375, 0.29266357421875, 0.4300537109375, 0.56744384765625, 0.704833984375, 0.84222412109375, 0.9796142578125, 1.11700439453125, 1.25439453125, 1.39178466796875, 1.5291748046875, 1.66656494140625, 1.803955078125, 1.94134521484375, 2.0787353515625, 2.21612548828125, 2.353515625, 2.49090576171875, 2.6282958984375, 2.76568603515625, 2.903076171875, 3.04046630859375, 3.1778564453125, 3.31524658203125, 3.45263671875, 3.59002685546875, 3.7274169921875, 3.86480712890625, 4.002197265625, 4.13958740234375, 4.2769775390625, 4.41436767578125, 4.5517578125, 4.68914794921875, 4.8265380859375, 4.96392822265625, 5.101318359375, 5.23870849609375, 5.3760986328125, 5.51348876953125, 5.65087890625, 5.78826904296875, 5.9256591796875, 6.06304931640625, 6.200439453125, 6.33782958984375, 6.4752197265625, 6.61260986328125, 6.75]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 10.0, 10.0, 22.0, 54.0, 119.0, 240.0, 236.0, 150.0, 66.0, 34.0, 15.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.86121940612793, -14.803691864013672, -13.746164321899414, -12.68863582611084, -11.631108283996582, -10.573580741882324, -9.51605224609375, -8.458524703979492, -7.400997161865234, -6.343469619750977, -5.2859416007995605, -4.2284135818481445, -3.1708860397338867, -2.113358497619629, -1.055830478668213, 0.001697540283203125, 1.059225082397461, 2.116752862930298, 3.1742806434631348, 4.231808662414551, 5.289336204528809, 6.346863746643066, 7.404391765594482, 8.461919784545898, 9.519447326660156, 10.576974868774414, 11.634502410888672, 12.692030906677246, 13.749558448791504, 14.807085990905762, 15.864614486694336, 16.922142028808594, 17.97966766357422, 19.037195205688477, 20.094722747802734, 21.152250289916992, 22.20977783203125, 23.26730728149414, 24.3248348236084, 25.382362365722656, 26.439889907836914, 27.497417449951172, 28.55494499206543, 29.612472534179688, 30.670001983642578, 31.727527618408203, 32.785057067871094, 33.84258270263672, 34.90011215209961, 35.9576416015625, 37.015167236328125, 38.072696685791016, 39.13022232055664, 40.18775177001953, 41.245277404785156, 42.30280685424805, 43.36033630371094, 44.41786575317383, 45.47539138793945, 46.532920837402344, 47.59044647216797, 48.64797592163086, 49.705501556396484, 50.763031005859375, 51.820556640625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 8.0, 12.0, 9.0, 11.0, 18.0, 24.0, 25.0, 39.0, 27.0, 26.0, 28.0, 38.0, 38.0, 44.0, 55.0, 43.0, 59.0, 59.0, 68.0, 39.0, 54.0, 44.0, 32.0, 25.0, 31.0, 26.0, 22.0, 15.0, 12.0, 9.0, 7.0, 8.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.595611572265625, -12.182685852050781, -11.769760131835938, -11.356834411621094, -10.94390869140625, -10.530982971191406, -10.118057250976562, -9.705131530761719, -9.292205810546875, -8.879280090332031, -8.466354370117188, -8.053428649902344, -7.6405029296875, -7.227577209472656, -6.814651966094971, -6.401726245880127, -5.988801002502441, -5.575875282287598, -5.162949562072754, -4.75002384185791, -4.337098121643066, -3.9241726398468018, -3.511247158050537, -3.0983214378356934, -2.6853957176208496, -2.272469997406006, -1.8595443964004517, -1.4466187953948975, -1.0336930751800537, -0.62076735496521, -0.2078418731689453, 0.20508384704589844, 0.6180095672607422, 1.030935287475586, 1.4438608884811401, 1.8567864894866943, 2.269712209701538, 2.682637929916382, 3.0955634117126465, 3.5084891319274902, 3.921414852142334, 4.334340572357178, 4.7472662925720215, 5.160191535949707, 5.573117256164551, 5.9860429763793945, 6.398968696594238, 6.811894416809082, 7.224820137023926, 7.6377458572387695, 8.050671577453613, 8.463597297668457, 8.8765230178833, 9.289448738098145, 9.702373504638672, 10.115299224853516, 10.52822494506836, 10.941150665283203, 11.354076385498047, 11.76700210571289, 12.179927825927734, 12.592853546142578, 13.005779266357422, 13.418704986572266, 13.83163070678711]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 1.0, 5.0, 6.0, 15.0, 23.0, 27.0, 38.0, 64.0, 87.0, 155.0, 235.0, 459.0, 945.0, 1814.0, 4016.0, 9942.0, 29436.0, 120252.0, 633944.0, 185110.0, 39750.0, 12679.0, 4992.0, 2167.0, 1037.0, 572.0, 300.0, 187.0, 96.0, 60.0, 38.0, 33.0, 23.0, 15.0, 10.0, 8.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.57421875, -1.5228118896484375, -1.471405029296875, -1.4199981689453125, -1.36859130859375, -1.3171844482421875, -1.265777587890625, -1.2143707275390625, -1.1629638671875, -1.1115570068359375, -1.060150146484375, -1.0087432861328125, -0.95733642578125, -0.9059295654296875, -0.854522705078125, -0.8031158447265625, -0.751708984375, -0.7003021240234375, -0.648895263671875, -0.5974884033203125, -0.54608154296875, -0.4946746826171875, -0.443267822265625, -0.3918609619140625, -0.3404541015625, -0.2890472412109375, -0.237640380859375, -0.1862335205078125, -0.13482666015625, -0.0834197998046875, -0.032012939453125, 0.0193939208984375, 0.07080078125, 0.1222076416015625, 0.173614501953125, 0.2250213623046875, 0.27642822265625, 0.3278350830078125, 0.379241943359375, 0.4306488037109375, 0.4820556640625, 0.5334625244140625, 0.584869384765625, 0.6362762451171875, 0.68768310546875, 0.7390899658203125, 0.790496826171875, 0.8419036865234375, 0.893310546875, 0.9447174072265625, 0.996124267578125, 1.0475311279296875, 1.09893798828125, 1.1503448486328125, 1.201751708984375, 1.2531585693359375, 1.3045654296875, 1.3559722900390625, 1.407379150390625, 1.4587860107421875, 1.51019287109375, 1.5615997314453125, 1.613006591796875, 1.6644134521484375, 1.7158203125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 19.0, 21.0, 17.0, 21.0, 18.0, 37.0, 27.0, 43.0, 53.0, 55.0, 70.0, 59.0, 69.0, 60.0, 60.0, 34.0, 50.0, 46.0, 49.0, 27.0, 23.0, 26.0, 19.0, 18.0, 12.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.86669921875, -0.8351211547851562, -0.8035430908203125, -0.7719650268554688, -0.740386962890625, -0.7088088989257812, -0.6772308349609375, -0.6456527709960938, -0.61407470703125, -0.5824966430664062, -0.5509185791015625, -0.5193405151367188, -0.487762451171875, -0.45618438720703125, -0.4246063232421875, -0.39302825927734375, -0.3614501953125, -0.32987213134765625, -0.2982940673828125, -0.26671600341796875, -0.235137939453125, -0.20355987548828125, -0.1719818115234375, -0.14040374755859375, -0.10882568359375, -0.07724761962890625, -0.0456695556640625, -0.01409149169921875, 0.017486572265625, 0.04906463623046875, 0.0806427001953125, 0.11222076416015625, 0.143798828125, 0.17537689208984375, 0.2069549560546875, 0.23853302001953125, 0.270111083984375, 0.30168914794921875, 0.3332672119140625, 0.36484527587890625, 0.39642333984375, 0.42800140380859375, 0.4595794677734375, 0.49115753173828125, 0.522735595703125, 0.5543136596679688, 0.5858917236328125, 0.6174697875976562, 0.6490478515625, 0.6806259155273438, 0.7122039794921875, 0.7437820434570312, 0.775360107421875, 0.8069381713867188, 0.8385162353515625, 0.8700942993164062, 0.90167236328125, 0.9332504272460938, 0.9648284912109375, 0.9964065551757812, 1.027984619140625, 1.0595626831054688, 1.0911407470703125, 1.1227188110351562, 1.154296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 8.0, 7.0, 18.0, 27.0, 40.0, 55.0, 83.0, 134.0, 255.0, 495.0, 1294.0, 5068.0, 61670.0, 949746.0, 24940.0, 3000.0, 870.0, 351.0, 173.0, 93.0, 55.0, 38.0, 22.0, 20.0, 17.0, 12.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.45001220703125, -3.3433837890625, -3.23675537109375, -3.130126953125, -3.02349853515625, -2.9168701171875, -2.81024169921875, -2.70361328125, -2.59698486328125, -2.4903564453125, -2.38372802734375, -2.277099609375, -2.17047119140625, -2.0638427734375, -1.95721435546875, -1.8505859375, -1.74395751953125, -1.6373291015625, -1.53070068359375, -1.424072265625, -1.31744384765625, -1.2108154296875, -1.10418701171875, -0.99755859375, -0.89093017578125, -0.7843017578125, -0.67767333984375, -0.571044921875, -0.46441650390625, -0.3577880859375, -0.25115966796875, -0.14453125, -0.03790283203125, 0.0687255859375, 0.17535400390625, 0.281982421875, 0.38861083984375, 0.4952392578125, 0.60186767578125, 0.70849609375, 0.81512451171875, 0.9217529296875, 1.02838134765625, 1.135009765625, 1.24163818359375, 1.3482666015625, 1.45489501953125, 1.5615234375, 1.66815185546875, 1.7747802734375, 1.88140869140625, 1.988037109375, 2.09466552734375, 2.2012939453125, 2.30792236328125, 2.41455078125, 2.52117919921875, 2.6278076171875, 2.73443603515625, 2.841064453125, 2.94769287109375, 3.0543212890625, 3.16094970703125, 3.267578125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 1.0, 8.0, 6.0, 12.0, 5.0, 10.0, 15.0, 12.0, 12.0, 16.0, 24.0, 30.0, 33.0, 33.0, 32.0, 51.0, 46.0, 65.0, 63.0, 71.0, 76.0, 61.0, 50.0, 45.0, 36.0, 29.0, 24.0, 24.0, 14.0, 12.0, 15.0, 17.0, 8.0, 11.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.326171875, -3.213348388671875, -3.10052490234375, -2.987701416015625, -2.8748779296875, -2.762054443359375, -2.64923095703125, -2.536407470703125, -2.423583984375, -2.310760498046875, -2.19793701171875, -2.085113525390625, -1.9722900390625, -1.859466552734375, -1.74664306640625, -1.633819580078125, -1.52099609375, -1.408172607421875, -1.29534912109375, -1.182525634765625, -1.0697021484375, -0.956878662109375, -0.84405517578125, -0.731231689453125, -0.618408203125, -0.505584716796875, -0.39276123046875, -0.279937744140625, -0.1671142578125, -0.054290771484375, 0.05853271484375, 0.171356201171875, 0.2841796875, 0.397003173828125, 0.50982666015625, 0.622650146484375, 0.7354736328125, 0.848297119140625, 0.96112060546875, 1.073944091796875, 1.186767578125, 1.299591064453125, 1.41241455078125, 1.525238037109375, 1.6380615234375, 1.750885009765625, 1.86370849609375, 1.976531982421875, 2.08935546875, 2.202178955078125, 2.31500244140625, 2.427825927734375, 2.5406494140625, 2.653472900390625, 2.76629638671875, 2.879119873046875, 2.991943359375, 3.104766845703125, 3.21759033203125, 3.330413818359375, 3.4432373046875, 3.556060791015625, 3.66888427734375, 3.781707763671875, 3.89453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 13.0, 14.0, 21.0, 24.0, 37.0, 49.0, 96.0, 274.0, 692.0, 3021.0, 46940.0, 983604.0, 11363.0, 1563.0, 389.0, 189.0, 91.0, 61.0, 19.0, 19.0, 12.0, 11.0, 12.0, 3.0, 6.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.125, -1.085235595703125, -1.04547119140625, -1.005706787109375, -0.9659423828125, -0.926177978515625, -0.88641357421875, -0.846649169921875, -0.806884765625, -0.767120361328125, -0.72735595703125, -0.687591552734375, -0.6478271484375, -0.608062744140625, -0.56829833984375, -0.528533935546875, -0.48876953125, -0.449005126953125, -0.40924072265625, -0.369476318359375, -0.3297119140625, -0.289947509765625, -0.25018310546875, -0.210418701171875, -0.170654296875, -0.130889892578125, -0.09112548828125, -0.051361083984375, -0.0115966796875, 0.028167724609375, 0.06793212890625, 0.107696533203125, 0.1474609375, 0.187225341796875, 0.22698974609375, 0.266754150390625, 0.3065185546875, 0.346282958984375, 0.38604736328125, 0.425811767578125, 0.465576171875, 0.505340576171875, 0.54510498046875, 0.584869384765625, 0.6246337890625, 0.664398193359375, 0.70416259765625, 0.743927001953125, 0.78369140625, 0.823455810546875, 0.86322021484375, 0.902984619140625, 0.9427490234375, 0.982513427734375, 1.02227783203125, 1.062042236328125, 1.101806640625, 1.141571044921875, 1.18133544921875, 1.221099853515625, 1.2608642578125, 1.300628662109375, 1.34039306640625, 1.380157470703125, 1.419921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 14.0, 27.0, 24.0, 39.0, 74.0, 132.0, 185.0, 166.0, 105.0, 69.0, 41.0, 15.0, 21.0, 16.0, 14.0, 13.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.00024062395095825195, -0.0002332925796508789, -0.00022596120834350586, -0.0002186298370361328, -0.00021129846572875977, -0.00020396709442138672, -0.00019663572311401367, -0.00018930435180664062, -0.00018197298049926758, -0.00017464160919189453, -0.00016731023788452148, -0.00015997886657714844, -0.0001526474952697754, -0.00014531612396240234, -0.0001379847526550293, -0.00013065338134765625, -0.0001233220100402832, -0.00011599063873291016, -0.00010865926742553711, -0.00010132789611816406, -9.399652481079102e-05, -8.666515350341797e-05, -7.933378219604492e-05, -7.200241088867188e-05, -6.467103958129883e-05, -5.733966827392578e-05, -5.0008296966552734e-05, -4.267692565917969e-05, -3.534555435180664e-05, -2.8014183044433594e-05, -2.0682811737060547e-05, -1.33514404296875e-05, -6.020069122314453e-06, 1.3113021850585938e-06, 8.64267349243164e-06, 1.5974044799804688e-05, 2.3305416107177734e-05, 3.063678741455078e-05, 3.796815872192383e-05, 4.5299530029296875e-05, 5.263090133666992e-05, 5.996227264404297e-05, 6.729364395141602e-05, 7.462501525878906e-05, 8.195638656616211e-05, 8.928775787353516e-05, 9.66191291809082e-05, 0.00010395050048828125, 0.0001112818717956543, 0.00011861324310302734, 0.0001259446144104004, 0.00013327598571777344, 0.00014060735702514648, 0.00014793872833251953, 0.00015527009963989258, 0.00016260147094726562, 0.00016993284225463867, 0.00017726421356201172, 0.00018459558486938477, 0.0001919269561767578, 0.00019925832748413086, 0.0002065896987915039, 0.00021392107009887695, 0.00022125244140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 9.0, 15.0, 34.0, 54.0, 81.0, 159.0, 427.0, 1240.0, 5265.0, 59267.0, 952863.0, 24311.0, 3284.0, 919.0, 297.0, 144.0, 64.0, 36.0, 25.0, 14.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.6846847534179688, -0.6613616943359375, -0.6380386352539062, -0.614715576171875, -0.5913925170898438, -0.5680694580078125, -0.5447463989257812, -0.52142333984375, -0.49810028076171875, -0.4747772216796875, -0.45145416259765625, -0.428131103515625, -0.40480804443359375, -0.3814849853515625, -0.35816192626953125, -0.3348388671875, -0.31151580810546875, -0.2881927490234375, -0.26486968994140625, -0.241546630859375, -0.21822357177734375, -0.1949005126953125, -0.17157745361328125, -0.14825439453125, -0.12493133544921875, -0.1016082763671875, -0.07828521728515625, -0.054962158203125, -0.03163909912109375, -0.0083160400390625, 0.01500701904296875, 0.038330078125, 0.06165313720703125, 0.0849761962890625, 0.10829925537109375, 0.131622314453125, 0.15494537353515625, 0.1782684326171875, 0.20159149169921875, 0.22491455078125, 0.24823760986328125, 0.2715606689453125, 0.29488372802734375, 0.318206787109375, 0.34152984619140625, 0.3648529052734375, 0.38817596435546875, 0.4114990234375, 0.43482208251953125, 0.4581451416015625, 0.48146820068359375, 0.504791259765625, 0.5281143188476562, 0.5514373779296875, 0.5747604370117188, 0.59808349609375, 0.6214065551757812, 0.6447296142578125, 0.6680526733398438, 0.691375732421875, 0.7146987915039062, 0.7380218505859375, 0.7613449096679688, 0.78466796875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 10.0, 7.0, 13.0, 16.0, 17.0, 35.0, 47.0, 67.0, 88.0, 110.0, 125.0, 131.0, 75.0, 74.0, 44.0, 27.0, 25.0, 19.0, 12.0, 9.0, 14.0, 8.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.6201171875, -0.603668212890625, -0.58721923828125, -0.570770263671875, -0.5543212890625, -0.537872314453125, -0.52142333984375, -0.504974365234375, -0.488525390625, -0.472076416015625, -0.45562744140625, -0.439178466796875, -0.4227294921875, -0.406280517578125, -0.38983154296875, -0.373382568359375, -0.35693359375, -0.340484619140625, -0.32403564453125, -0.307586669921875, -0.2911376953125, -0.274688720703125, -0.25823974609375, -0.241790771484375, -0.225341796875, -0.208892822265625, -0.19244384765625, -0.175994873046875, -0.1595458984375, -0.143096923828125, -0.12664794921875, -0.110198974609375, -0.09375, -0.077301025390625, -0.06085205078125, -0.044403076171875, -0.0279541015625, -0.011505126953125, 0.00494384765625, 0.021392822265625, 0.037841796875, 0.054290771484375, 0.07073974609375, 0.087188720703125, 0.1036376953125, 0.120086669921875, 0.13653564453125, 0.152984619140625, 0.16943359375, 0.185882568359375, 0.20233154296875, 0.218780517578125, 0.2352294921875, 0.251678466796875, 0.26812744140625, 0.284576416015625, 0.301025390625, 0.317474365234375, 0.33392333984375, 0.350372314453125, 0.3668212890625, 0.383270263671875, 0.39971923828125, 0.416168212890625, 0.4326171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 12.0, 58.0, 683.0, 209.0, 31.0, 13.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.34331130981445, -45.75852584838867, -44.173736572265625, -42.588951110839844, -41.00416564941406, -39.41938018798828, -37.834590911865234, -36.24980545043945, -34.665016174316406, -33.080230712890625, -31.49544334411621, -29.910655975341797, -28.325870513916016, -26.7410831451416, -25.156295776367188, -23.571510314941406, -21.986724853515625, -20.40193748474121, -18.81715202331543, -17.232364654541016, -15.647578239440918, -14.06279182434082, -12.478004455566406, -10.893218040466309, -9.308431625366211, -7.723645210266113, -6.138858318328857, -4.554071426391602, -2.969285011291504, -1.3844985961914062, 0.2002887725830078, 1.7850751876831055, 3.369861602783203, 4.954648017883301, 6.539434909820557, 8.124221801757812, 9.70900821685791, 11.293794631958008, 12.878582000732422, 14.46336841583252, 16.048154830932617, 17.63294219970703, 19.217727661132812, 20.802515029907227, 22.38730239868164, 23.972087860107422, 25.556875228881836, 27.14166259765625, 28.72644805908203, 30.311235427856445, 31.896020889282227, 33.48080825805664, 35.06559371948242, 36.65038299560547, 38.23516845703125, 39.81995391845703, 41.40473937988281, 42.989524841308594, 44.57431411743164, 46.15909957885742, 47.7438850402832, 49.32867431640625, 50.91345977783203, 52.49824523925781, 54.08303451538086]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 17.0, 20.0, 23.0, 38.0, 57.0, 65.0, 378.0, 166.0, 66.0, 43.0, 37.0, 27.0, 15.0, 12.0, 10.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.040874481201172, -9.316638946533203, -8.59240436553955, -7.868168830871582, -7.143933296203613, -6.419698238372803, -5.695463180541992, -4.971227645874023, -4.246992588043213, -3.5227572917938232, -2.7985219955444336, -2.074286937713623, -1.3500516414642334, -0.6258163452148438, 0.0984187126159668, 0.8226542472839355, 1.546889305114746, 2.2711246013641357, 2.9953598976135254, 3.719594955444336, 4.443830490112305, 5.168065547943115, 5.892300605773926, 6.6165361404418945, 7.340771198272705, 8.065006256103516, 8.789241790771484, 9.513477325439453, 10.237711906433105, 10.961947441101074, 11.686182022094727, 12.410417556762695, 13.134653091430664, 13.858888626098633, 14.583123207092285, 15.307358741760254, 16.031593322753906, 16.755828857421875, 17.480064392089844, 18.204299926757812, 18.92853546142578, 19.65277099609375, 20.37700653076172, 21.101242065429688, 21.825475692749023, 22.549711227416992, 23.27394676208496, 23.99818229675293, 24.722415924072266, 25.446651458740234, 26.170886993408203, 26.895122528076172, 27.619356155395508, 28.343591690063477, 29.067827224731445, 29.792062759399414, 30.516298294067383, 31.24053382873535, 31.96476936340332, 32.689002990722656, 33.413238525390625, 34.137474060058594, 34.86170959472656, 35.58594512939453, 36.3101806640625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 9.0, 14.0, 21.0, 32.0, 30.0, 44.0, 54.0, 47.0, 100.0, 342.0, 99.0, 40.0, 43.0, 37.0, 19.0, 18.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8437728881835938, -0.7983856201171875, -0.7529983520507812, -0.707611083984375, -0.6622238159179688, -0.6168365478515625, -0.5714492797851562, -0.52606201171875, -0.48067474365234375, -0.4352874755859375, -0.38990020751953125, -0.344512939453125, -0.29912567138671875, -0.2537384033203125, -0.20835113525390625, -0.1629638671875, -0.11757659912109375, -0.0721893310546875, -0.02680206298828125, 0.018585205078125, 0.06397247314453125, 0.1093597412109375, 0.15474700927734375, 0.20013427734375, 0.24552154541015625, 0.2909088134765625, 0.33629608154296875, 0.381683349609375, 0.42707061767578125, 0.4724578857421875, 0.5178451538085938, 0.563232421875, 0.6086196899414062, 0.6540069580078125, 0.6993942260742188, 0.744781494140625, 0.7901687622070312, 0.8355560302734375, 0.8809432983398438, 0.92633056640625, 0.9717178344726562, 1.0171051025390625, 1.0624923706054688, 1.107879638671875, 1.1532669067382812, 1.1986541748046875, 1.2440414428710938, 1.2894287109375, 1.3348159790039062, 1.3802032470703125, 1.4255905151367188, 1.470977783203125, 1.5163650512695312, 1.5617523193359375, 1.6071395874023438, 1.65252685546875, 1.6979141235351562, 1.7433013916015625, 1.7886886596679688, 1.834075927734375, 1.8794631958007812, 1.9248504638671875, 1.9702377319335938, 2.015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 7.0, 7.0, 0.0, 5.0, 16.0, 10.0, 27.0, 28.0, 65.0, 159.0, 823.0, 46812.0, 8339089.0, 1119.0, 205.0, 84.0, 50.0, 28.0, 11.0, 8.0, 8.0, 3.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.296606063842773, -26.54012680053711, -25.783649444580078, -25.027170181274414, -24.270692825317383, -23.51421356201172, -22.757736206054688, -22.001256942749023, -21.24477767944336, -20.488298416137695, -19.731821060180664, -18.975341796875, -18.21886444091797, -17.462385177612305, -16.70590591430664, -15.94942855834961, -15.192951202392578, -14.43647289276123, -13.679994583129883, -12.923515319824219, -12.167037963867188, -11.410558700561523, -10.654080390930176, -9.897602081298828, -9.14112377166748, -8.384645462036133, -7.628167152404785, -6.871688365936279, -6.115210056304932, -5.358731746673584, -4.602252960205078, -3.8457746505737305, -3.08929443359375, -2.3328161239624023, -1.5763375759124756, -0.8198590278625488, -0.06338071823120117, 0.6930975914001465, 1.4495763778686523, 2.2060546875, 2.9625329971313477, 3.7190113067626953, 4.475489616394043, 5.231968402862549, 5.9884467124938965, 6.744925022125244, 7.50140380859375, 8.257882118225098, 9.014360427856445, 9.770838737487793, 10.52731704711914, 11.283796310424805, 12.040273666381836, 12.7967529296875, 13.553231239318848, 14.309709548950195, 15.066187858581543, 15.82266616821289, 16.579145431518555, 17.335622787475586, 18.09210205078125, 18.84857940673828, 19.605058670043945, 20.36153793334961, 21.11801528930664]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 7.0, 9.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 6.0, 6.0, 8.0, 8.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.687347412109375, -26.179248809814453, -25.671152114868164, -25.163053512573242, -24.65495491027832, -24.14685821533203, -23.63875961303711, -23.130661010742188, -22.622562408447266, -22.114463806152344, -21.606367111206055, -21.098268508911133, -20.59016990661621, -20.082073211669922, -19.573974609375, -19.065876007080078, -18.55777931213379, -18.049680709838867, -17.541584014892578, -17.033485412597656, -16.525386810302734, -16.017288208007812, -15.509191513061523, -15.001092910766602, -14.492995262145996, -13.98489761352539, -13.476799011230469, -12.968701362609863, -12.460603713989258, -11.952505111694336, -11.44440746307373, -10.936309814453125, -10.428211212158203, -9.920113563537598, -9.412014961242676, -8.90391731262207, -8.395818710327148, -7.887721061706543, -7.3796234130859375, -6.871525287628174, -6.363426685333252, -5.855328559875488, -5.347230911254883, -4.839132785797119, -4.3310346603393555, -3.822936534881592, -3.3148386478424072, -2.8067407608032227, -2.298642635345459, -1.7905446290969849, -1.2824466228485107, -0.7743486166000366, -0.2662506103515625, 0.24184751510620117, 0.7499454021453857, 1.2580432891845703, 1.766141414642334, 2.2742395401000977, 2.7823374271392822, 3.290435314178467, 3.7985334396362305, 4.306631565093994, 4.814729690551758, 5.322827339172363, 5.830925464630127]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 9.0, 22.0, 27.0, 30.0, 46.0, 79.0, 91.0, 166.0, 255.0, 445.0, 891.0, 1928.0, 4929.0, 15850.0, 62754.0, 236602.0, 146543.0, 35313.0, 10472.0, 4020.0, 1760.0, 887.0, 430.0, 266.0, 156.0, 83.0, 64.0, 46.0, 28.0, 20.0, 11.0, 8.0, 6.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.3984375, -9.15606689453125, -8.9136962890625, -8.67132568359375, -8.428955078125, -8.18658447265625, -7.9442138671875, -7.70184326171875, -7.45947265625, -7.21710205078125, -6.9747314453125, -6.73236083984375, -6.489990234375, -6.24761962890625, -6.0052490234375, -5.76287841796875, -5.5205078125, -5.27813720703125, -5.0357666015625, -4.79339599609375, -4.551025390625, -4.30865478515625, -4.0662841796875, -3.82391357421875, -3.58154296875, -3.33917236328125, -3.0968017578125, -2.85443115234375, -2.612060546875, -2.36968994140625, -2.1273193359375, -1.88494873046875, -1.642578125, -1.40020751953125, -1.1578369140625, -0.91546630859375, -0.673095703125, -0.43072509765625, -0.1883544921875, 0.05401611328125, 0.29638671875, 0.53875732421875, 0.7811279296875, 1.02349853515625, 1.265869140625, 1.50823974609375, 1.7506103515625, 1.99298095703125, 2.2353515625, 2.47772216796875, 2.7200927734375, 2.96246337890625, 3.204833984375, 3.44720458984375, 3.6895751953125, 3.93194580078125, 4.17431640625, 4.41668701171875, 4.6590576171875, 4.90142822265625, 5.143798828125, 5.38616943359375, 5.6285400390625, 5.87091064453125, 6.11328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 5.0, 11.0, 29.0, 26.0, 49.0, 72.0, 97.0, 93.0, 139.0, 121.0, 109.0, 61.0, 44.0, 34.0, 27.0, 15.0, 15.0, 12.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5390625, -1.480316162109375, -1.42156982421875, -1.362823486328125, -1.3040771484375, -1.245330810546875, -1.18658447265625, -1.127838134765625, -1.069091796875, -1.010345458984375, -0.95159912109375, -0.892852783203125, -0.8341064453125, -0.775360107421875, -0.71661376953125, -0.657867431640625, -0.59912109375, -0.540374755859375, -0.48162841796875, -0.422882080078125, -0.3641357421875, -0.305389404296875, -0.24664306640625, -0.187896728515625, -0.129150390625, -0.070404052734375, -0.01165771484375, 0.047088623046875, 0.1058349609375, 0.164581298828125, 0.22332763671875, 0.282073974609375, 0.3408203125, 0.399566650390625, 0.45831298828125, 0.517059326171875, 0.5758056640625, 0.634552001953125, 0.69329833984375, 0.752044677734375, 0.810791015625, 0.869537353515625, 0.92828369140625, 0.987030029296875, 1.0457763671875, 1.104522705078125, 1.16326904296875, 1.222015380859375, 1.28076171875, 1.339508056640625, 1.39825439453125, 1.457000732421875, 1.5157470703125, 1.574493408203125, 1.63323974609375, 1.691986083984375, 1.750732421875, 1.809478759765625, 1.86822509765625, 1.926971435546875, 1.9857177734375, 2.044464111328125, 2.10321044921875, 2.161956787109375, 2.220703125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 15.0, 26.0, 65.0, 115.0, 104.0, 55.0, 28.0, 12.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.74677848815918, -11.425983428955078, -11.105188369750977, -10.784393310546875, -10.463598251342773, -10.142803192138672, -9.82200813293457, -9.501213073730469, -9.180418014526367, -8.859622955322266, -8.538827896118164, -8.218032836914062, -7.897237777709961, -7.576442718505859, -7.255647659301758, -6.934852600097656, -6.614058017730713, -6.293262958526611, -5.97246789932251, -5.651672840118408, -5.330877780914307, -5.010082721710205, -4.689288139343262, -4.36849308013916, -4.047698020935059, -3.726902961730957, -3.4061079025268555, -3.085312843322754, -2.7645177841186523, -2.443722724914551, -2.1229279041290283, -1.8021328449249268, -1.481337547302246, -1.1605424880981445, -0.8397474884986877, -0.518952488899231, -0.1981574296951294, 0.12263762950897217, 0.4434325695037842, 0.7642276287078857, 1.0850226879119873, 1.4058177471160889, 1.7266128063201904, 2.047407627105713, 2.3682026863098145, 2.688997745513916, 3.0097928047180176, 3.330587863922119, 3.6513829231262207, 3.9721779823303223, 4.292973041534424, 4.613768100738525, 4.934563159942627, 5.2553582191467285, 5.576152801513672, 5.896947860717773, 6.217742919921875, 6.538537979125977, 6.859333038330078, 7.18012809753418, 7.500923156738281, 7.821718215942383, 8.142513275146484, 8.463308334350586, 8.784103393554688]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 4.0, 3.0, 11.0, 6.0, 6.0, 9.0, 14.0, 28.0, 63.0, 85.0, 102.0, 69.0, 34.0, 17.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.045466423034668, -6.832422256469727, -6.619378089904785, -6.406333923339844, -6.193289279937744, -5.980245113372803, -5.767200946807861, -5.55415678024292, -5.3411126136779785, -5.128068447113037, -4.915024280548096, -4.701979637145996, -4.488935470581055, -4.275891304016113, -4.062847137451172, -3.8498029708862305, -3.63675856590271, -3.4237143993377686, -3.210669994354248, -2.9976258277893066, -2.7845816612243652, -2.571537494659424, -2.3584930896759033, -2.145448923110962, -1.932404637336731, -1.7193603515625, -1.5063161849975586, -1.2932718992233276, -1.0802276134490967, -0.8671834468841553, -0.6541391611099243, -0.4410949945449829, -0.22805070877075195, -0.015006467700004578, 0.1980377733707428, 0.41108202934265137, 0.6241262555122375, 0.8371704816818237, 1.0502147674560547, 1.263258934020996, 1.476303219795227, 1.689347505569458, 1.9023916721343994, 2.11543607711792, 2.3284802436828613, 2.5415244102478027, 2.754568576812744, 2.9676127433776855, 3.180657148361206, 3.3937013149261475, 3.606745719909668, 3.8197898864746094, 4.032834053039551, 4.245878219604492, 4.458922386169434, 4.671966552734375, 4.885011196136475, 5.098055362701416, 5.311099529266357, 5.524144172668457, 5.737188339233398, 5.95023250579834, 6.163276672363281, 6.376320838928223, 6.589365005493164]}, "eval/loss": 4.16819953918457, "eval/wer": 1.9665807219357399, "eval/runtime": 794.4467, "eval/samples_per_second": 3.326, "eval/steps_per_second": 0.278, "train/train_runtime": 6757.0177, "train/train_samples_per_second": 4.223, "train/train_steps_per_second": 0.176, "train/total_flos": 0.0, "train/train_loss": 4.268135019066556} \ No newline at end of file