diff --git "a/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" "b/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" --- "a/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" +++ "b/wandb/run-20220301_171456-1jxdkzs7/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.2575, "train/learning_rate": 2.2429906542056075e-05, "train/epoch": 0.84, "train/global_step": 1500, "_runtime": 7538, "_timestamp": 1646162434, "_step": 1502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 357.0, 657.0, 1.0, 1.0], "bins": [-1045.7138671875, -1028.594970703125, -1011.4760131835938, -994.3571166992188, -977.2382202148438, -960.1193237304688, -943.0003662109375, -925.8814697265625, -908.7625732421875, -891.6436767578125, -874.5247192382812, -857.4058227539062, -840.2869262695312, -823.1680297851562, -806.049072265625, -788.93017578125, -771.811279296875, -754.6923828125, -737.5734252929688, -720.4545288085938, -703.3356323242188, -686.2167358398438, -669.0977783203125, -651.9788818359375, -634.8599243164062, -617.7410278320312, -600.6220703125, -583.503173828125, -566.38427734375, -549.265380859375, -532.1464233398438, -515.0275268554688, -497.9085693359375, -480.7896423339844, -463.6707458496094, -446.55181884765625, -429.43292236328125, -412.3139953613281, -395.195068359375, -378.076171875, -360.957275390625, -343.8383483886719, -326.7194519042969, -309.60052490234375, -292.48162841796875, -275.3627014160156, -258.2437744140625, -241.1248779296875, -224.00596618652344, -206.88705444335938, -189.7681427001953, -172.64923095703125, -155.53030395507812, -138.41140747070312, -121.29248046875, -104.17356872558594, -87.05465698242188, -69.93574523925781, -52.816829681396484, -35.697914123535156, -18.579002380371094, -1.4600906372070312, 15.658828735351562, 32.777740478515625, 49.89665603637695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 8.0, 7.0, 11.0, 27.0, 20.0, 27.0, 45.0, 40.0, 47.0, 42.0, 48.0, 58.0, 58.0, 66.0, 73.0, 71.0, 68.0, 50.0, 67.0, 34.0, 28.0, 17.0, 16.0, 23.0, 16.0, 10.0, 10.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.2100830078125, -94.38960266113281, -91.56912231445312, -88.74864959716797, -85.92816925048828, -83.1076889038086, -80.28721618652344, -77.46673583984375, -74.64625549316406, -71.82577514648438, -69.00529479980469, -66.18482208251953, -63.364341735839844, -60.543861389160156, -57.723384857177734, -54.90290832519531, -52.082427978515625, -49.26194763183594, -46.441471099853516, -43.620994567871094, -40.800514221191406, -37.98003387451172, -35.1595573425293, -32.339080810546875, -29.518600463867188, -26.698122024536133, -23.877643585205078, -21.057165145874023, -18.23668670654297, -15.416208267211914, -12.59572982788086, -9.775251388549805, -6.95477294921875, -4.134294509887695, -1.3138160705566406, 1.506662368774414, 4.327140808105469, 7.147619247436523, 9.968097686767578, 12.788576126098633, 15.609054565429688, 18.429533004760742, 21.250011444091797, 24.07048988342285, 26.890968322753906, 29.71144676208496, 32.531925201416016, 35.35240173339844, 38.172882080078125, 40.99336242675781, 43.813838958740234, 46.634315490722656, 49.454795837402344, 52.27527618408203, 55.09575271606445, 57.916229248046875, 60.73670959472656, 63.55718994140625, 66.37767028808594, 69.1981430053711, 72.01862335205078, 74.83910369873047, 77.65957641601562, 80.48005676269531, 83.300537109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 8.0, 5.0, 7.0, 11.0, 9.0, 24.0, 7.0, 25.0, 23.0, 19.0, 27.0, 41.0, 38.0, 35.0, 31.0, 40.0, 25.0, 32.0, 52.0, 37.0, 61.0, 48.0, 48.0, 38.0, 47.0, 33.0, 43.0, 38.0, 25.0, 22.0, 10.0, 20.0, 16.0, 11.0, 9.0, 11.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.78997802734375, -1.7225341796875, -1.65509033203125, -1.587646484375, -1.52020263671875, -1.4527587890625, -1.38531494140625, -1.31787109375, -1.25042724609375, -1.1829833984375, -1.11553955078125, -1.048095703125, -0.98065185546875, -0.9132080078125, -0.84576416015625, -0.7783203125, -0.71087646484375, -0.6434326171875, -0.57598876953125, -0.508544921875, -0.44110107421875, -0.3736572265625, -0.30621337890625, -0.23876953125, -0.17132568359375, -0.1038818359375, -0.03643798828125, 0.031005859375, 0.09844970703125, 0.1658935546875, 0.23333740234375, 0.30078125, 0.36822509765625, 0.4356689453125, 0.50311279296875, 0.570556640625, 0.63800048828125, 0.7054443359375, 0.77288818359375, 0.84033203125, 0.90777587890625, 0.9752197265625, 1.04266357421875, 1.110107421875, 1.17755126953125, 1.2449951171875, 1.31243896484375, 1.3798828125, 1.44732666015625, 1.5147705078125, 1.58221435546875, 1.649658203125, 1.71710205078125, 1.7845458984375, 1.85198974609375, 1.91943359375, 1.98687744140625, 2.0543212890625, 2.12176513671875, 2.189208984375, 2.25665283203125, 2.3240966796875, 2.39154052734375, 2.458984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 7.0, 10.0, 13.0, 17.0, 22.0, 33.0, 35.0, 59.0, 72.0, 112.0, 129.0, 174.0, 243.0, 370.0, 493.0, 830.0, 1313.0, 2607.0, 5995.0, 17727.0, 71801.0, 630607.0, 3074446.0, 315999.0, 47383.0, 13007.0, 4845.0, 2288.0, 1200.0, 739.0, 468.0, 331.0, 210.0, 161.0, 146.0, 93.0, 60.0, 60.0, 44.0, 30.0, 27.0, 18.0, 14.0, 9.0, 5.0, 8.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.8203125, -10.486083984375, -10.15185546875, -9.817626953125, -9.4833984375, -9.149169921875, -8.81494140625, -8.480712890625, -8.146484375, -7.812255859375, -7.47802734375, -7.143798828125, -6.8095703125, -6.475341796875, -6.14111328125, -5.806884765625, -5.47265625, -5.138427734375, -4.80419921875, -4.469970703125, -4.1357421875, -3.801513671875, -3.46728515625, -3.133056640625, -2.798828125, -2.464599609375, -2.13037109375, -1.796142578125, -1.4619140625, -1.127685546875, -0.79345703125, -0.459228515625, -0.125, 0.209228515625, 0.54345703125, 0.877685546875, 1.2119140625, 1.546142578125, 1.88037109375, 2.214599609375, 2.548828125, 2.883056640625, 3.21728515625, 3.551513671875, 3.8857421875, 4.219970703125, 4.55419921875, 4.888427734375, 5.22265625, 5.556884765625, 5.89111328125, 6.225341796875, 6.5595703125, 6.893798828125, 7.22802734375, 7.562255859375, 7.896484375, 8.230712890625, 8.56494140625, 8.899169921875, 9.2333984375, 9.567626953125, 9.90185546875, 10.236083984375, 10.5703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 15.0, 30.0, 46.0, 99.0, 166.0, 329.0, 565.0, 928.0, 835.0, 481.0, 246.0, 148.0, 86.0, 39.0, 23.0, 15.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-22.546875, -22.0086669921875, -21.470458984375, -20.9322509765625, -20.39404296875, -19.8558349609375, -19.317626953125, -18.7794189453125, -18.2412109375, -17.7030029296875, -17.164794921875, -16.6265869140625, -16.08837890625, -15.5501708984375, -15.011962890625, -14.4737548828125, -13.935546875, -13.3973388671875, -12.859130859375, -12.3209228515625, -11.78271484375, -11.2445068359375, -10.706298828125, -10.1680908203125, -9.6298828125, -9.0916748046875, -8.553466796875, -8.0152587890625, -7.47705078125, -6.9388427734375, -6.400634765625, -5.8624267578125, -5.32421875, -4.7860107421875, -4.247802734375, -3.7095947265625, -3.17138671875, -2.6331787109375, -2.094970703125, -1.5567626953125, -1.0185546875, -0.4803466796875, 0.057861328125, 0.5960693359375, 1.13427734375, 1.6724853515625, 2.210693359375, 2.7489013671875, 3.287109375, 3.8253173828125, 4.363525390625, 4.9017333984375, 5.43994140625, 5.9781494140625, 6.516357421875, 7.0545654296875, 7.5927734375, 8.1309814453125, 8.669189453125, 9.2073974609375, 9.74560546875, 10.2838134765625, 10.822021484375, 11.3602294921875, 11.8984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 14.0, 18.0, 42.0, 101.0, 224.0, 549.0, 1678.0, 12711.0, 4092925.0, 82140.0, 2519.0, 781.0, 312.0, 125.0, 61.0, 35.0, 16.0, 15.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.25, -56.2861328125, -54.322265625, -52.3583984375, -50.39453125, -48.4306640625, -46.466796875, -44.5029296875, -42.5390625, -40.5751953125, -38.611328125, -36.6474609375, -34.68359375, -32.7197265625, -30.755859375, -28.7919921875, -26.828125, -24.8642578125, -22.900390625, -20.9365234375, -18.97265625, -17.0087890625, -15.044921875, -13.0810546875, -11.1171875, -9.1533203125, -7.189453125, -5.2255859375, -3.26171875, -1.2978515625, 0.666015625, 2.6298828125, 4.59375, 6.5576171875, 8.521484375, 10.4853515625, 12.44921875, 14.4130859375, 16.376953125, 18.3408203125, 20.3046875, 22.2685546875, 24.232421875, 26.1962890625, 28.16015625, 30.1240234375, 32.087890625, 34.0517578125, 36.015625, 37.9794921875, 39.943359375, 41.9072265625, 43.87109375, 45.8349609375, 47.798828125, 49.7626953125, 51.7265625, 53.6904296875, 55.654296875, 57.6181640625, 59.58203125, 61.5458984375, 63.509765625, 65.4736328125, 67.4375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 55.0, 664.0, 270.0, 19.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.6010856628418, -53.47708511352539, -47.35308074951172, -41.22908020019531, -35.105079650878906, -28.9810791015625, -22.857074737548828, -16.733074188232422, -10.609073638916016, -4.485072135925293, 1.6389293670654297, 7.762931823730469, 13.886932373046875, 20.01093292236328, 26.134937286376953, 32.25893783569336, 38.382938385009766, 44.50693893432617, 50.630943298339844, 56.75494384765625, 62.878944396972656, 69.00294494628906, 75.126953125, 81.25094604492188, 87.37495422363281, 93.49895477294922, 99.62295532226562, 105.74696350097656, 111.87095642089844, 117.99496459960938, 124.11896514892578, 130.2429656982422, 136.36697387695312, 142.49098205566406, 148.61497497558594, 154.73898315429688, 160.86297607421875, 166.9869842529297, 173.11099243164062, 179.2349853515625, 185.35897827148438, 191.4829864501953, 197.6069793701172, 203.73098754882812, 209.85498046875, 215.97898864746094, 222.10299682617188, 228.22698974609375, 234.3509979248047, 240.47500610351562, 246.5989990234375, 252.72300720214844, 258.8470153808594, 264.97100830078125, 271.0950012207031, 277.218994140625, 283.343017578125, 289.4670104980469, 295.5910339355469, 301.71502685546875, 307.8390197753906, 313.9630126953125, 320.0870361328125, 326.2110290527344, 332.33502197265625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 6.0, 10.0, 17.0, 12.0, 17.0, 16.0, 26.0, 33.0, 31.0, 38.0, 36.0, 26.0, 51.0, 43.0, 54.0, 55.0, 67.0, 45.0, 48.0, 50.0, 40.0, 42.0, 46.0, 41.0, 20.0, 30.0, 17.0, 25.0, 18.0, 4.0, 11.0, 5.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.842864990234375, -34.5989990234375, -33.35512924194336, -32.111263275146484, -30.867395401000977, -29.62352752685547, -28.379661560058594, -27.135793685913086, -25.891925811767578, -24.64805793762207, -23.404190063476562, -22.160324096679688, -20.91645622253418, -19.672588348388672, -18.428722381591797, -17.18485450744629, -15.940986633300781, -14.697118759155273, -13.453251838684082, -12.20938491821289, -10.965517044067383, -9.721649169921875, -8.477782249450684, -7.233915328979492, -5.990047454833984, -4.746180057525635, -3.502312660217285, -2.2584452629089355, -1.014577865600586, 0.22928953170776367, 1.4731569290161133, 2.7170238494873047, 3.9608917236328125, 5.204759120941162, 6.448626518249512, 7.692493915557861, 8.936361312866211, 10.180229187011719, 11.42409610748291, 12.667963027954102, 13.91183090209961, 15.155698776245117, 16.399566650390625, 17.6434326171875, 18.887300491333008, 20.131168365478516, 21.37503433227539, 22.6189022064209, 23.862770080566406, 25.106637954711914, 26.350505828857422, 27.594371795654297, 28.838239669799805, 30.082107543945312, 31.325973510742188, 32.56983947753906, 33.8137092590332, 35.05757522583008, 36.30144500732422, 37.545310974121094, 38.78917694091797, 40.03304672241211, 41.276912689208984, 42.520782470703125, 43.7646484375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 3.0, 8.0, 10.0, 12.0, 21.0, 19.0, 25.0, 16.0, 20.0, 17.0, 24.0, 19.0, 30.0, 28.0, 35.0, 32.0, 22.0, 41.0, 39.0, 32.0, 36.0, 29.0, 29.0, 29.0, 42.0, 46.0, 39.0, 26.0, 26.0, 34.0, 29.0, 20.0, 22.0, 21.0, 15.0, 10.0, 10.0, 12.0, 8.0, 4.0, 11.0, 4.0, 7.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.8408203125, -1.7857208251953125, -1.730621337890625, -1.6755218505859375, -1.62042236328125, -1.5653228759765625, -1.510223388671875, -1.4551239013671875, -1.4000244140625, -1.3449249267578125, -1.289825439453125, -1.2347259521484375, -1.17962646484375, -1.1245269775390625, -1.069427490234375, -1.0143280029296875, -0.959228515625, -0.9041290283203125, -0.849029541015625, -0.7939300537109375, -0.73883056640625, -0.6837310791015625, -0.628631591796875, -0.5735321044921875, -0.5184326171875, -0.4633331298828125, -0.408233642578125, -0.3531341552734375, -0.29803466796875, -0.2429351806640625, -0.187835693359375, -0.1327362060546875, -0.07763671875, -0.0225372314453125, 0.032562255859375, 0.0876617431640625, 0.14276123046875, 0.1978607177734375, 0.252960205078125, 0.3080596923828125, 0.3631591796875, 0.4182586669921875, 0.473358154296875, 0.5284576416015625, 0.58355712890625, 0.6386566162109375, 0.693756103515625, 0.7488555908203125, 0.803955078125, 0.8590545654296875, 0.914154052734375, 0.9692535400390625, 1.02435302734375, 1.0794525146484375, 1.134552001953125, 1.1896514892578125, 1.2447509765625, 1.2998504638671875, 1.354949951171875, 1.4100494384765625, 1.46514892578125, 1.5202484130859375, 1.575347900390625, 1.6304473876953125, 1.685546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 21.0, 24.0, 24.0, 45.0, 67.0, 103.0, 140.0, 196.0, 314.0, 451.0, 711.0, 1131.0, 1677.0, 2619.0, 4098.0, 6088.0, 9755.0, 14773.0, 22697.0, 34826.0, 54211.0, 81112.0, 119975.0, 159646.0, 162951.0, 124768.0, 85333.0, 56065.0, 36598.0, 23912.0, 15465.0, 10055.0, 6583.0, 4189.0, 2714.0, 1731.0, 1202.0, 802.0, 486.0, 325.0, 207.0, 159.0, 89.0, 71.0, 42.0, 34.0, 26.0, 13.0, 13.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2347412109375, -0.2269306182861328, -0.21912002563476562, -0.21130943298339844, -0.20349884033203125, -0.19568824768066406, -0.18787765502929688, -0.1800670623779297, -0.1722564697265625, -0.1644458770751953, -0.15663528442382812, -0.14882469177246094, -0.14101409912109375, -0.13320350646972656, -0.12539291381835938, -0.11758232116699219, -0.109771728515625, -0.10196113586425781, -0.09415054321289062, -0.08633995056152344, -0.07852935791015625, -0.07071876525878906, -0.06290817260742188, -0.05509757995605469, -0.0472869873046875, -0.03947639465332031, -0.031665802001953125, -0.023855209350585938, -0.01604461669921875, -0.008234024047851562, -0.000423431396484375, 0.0073871612548828125, 0.01519775390625, 0.023008346557617188, 0.030818939208984375, 0.03862953186035156, 0.04644012451171875, 0.05425071716308594, 0.062061309814453125, 0.06987190246582031, 0.0776824951171875, 0.08549308776855469, 0.09330368041992188, 0.10111427307128906, 0.10892486572265625, 0.11673545837402344, 0.12454605102539062, 0.1323566436767578, 0.140167236328125, 0.1479778289794922, 0.15578842163085938, 0.16359901428222656, 0.17140960693359375, 0.17922019958496094, 0.18703079223632812, 0.1948413848876953, 0.2026519775390625, 0.2104625701904297, 0.21827316284179688, 0.22608375549316406, 0.23389434814453125, 0.24170494079589844, 0.24951553344726562, 0.2573261260986328, 0.26513671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 9.0, 10.0, 8.0, 13.0, 14.0, 16.0, 21.0, 19.0, 24.0, 26.0, 46.0, 38.0, 51.0, 37.0, 51.0, 48.0, 47.0, 1076.0, 44.0, 47.0, 51.0, 44.0, 41.0, 45.0, 31.0, 23.0, 20.0, 28.0, 23.0, 12.0, 11.0, 13.0, 4.0, 6.0, 7.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4851226806640625, -1.438018798828125, -1.3909149169921875, -1.34381103515625, -1.2967071533203125, -1.249603271484375, -1.2024993896484375, -1.1553955078125, -1.1082916259765625, -1.061187744140625, -1.0140838623046875, -0.96697998046875, -0.9198760986328125, -0.872772216796875, -0.8256683349609375, -0.778564453125, -0.7314605712890625, -0.684356689453125, -0.6372528076171875, -0.59014892578125, -0.5430450439453125, -0.495941162109375, -0.4488372802734375, -0.4017333984375, -0.3546295166015625, -0.307525634765625, -0.2604217529296875, -0.21331787109375, -0.1662139892578125, -0.119110107421875, -0.0720062255859375, -0.02490234375, 0.0222015380859375, 0.069305419921875, 0.1164093017578125, 0.16351318359375, 0.2106170654296875, 0.257720947265625, 0.3048248291015625, 0.3519287109375, 0.3990325927734375, 0.446136474609375, 0.4932403564453125, 0.54034423828125, 0.5874481201171875, 0.634552001953125, 0.6816558837890625, 0.728759765625, 0.7758636474609375, 0.822967529296875, 0.8700714111328125, 0.91717529296875, 0.9642791748046875, 1.011383056640625, 1.0584869384765625, 1.1055908203125, 1.1526947021484375, 1.199798583984375, 1.2469024658203125, 1.29400634765625, 1.3411102294921875, 1.388214111328125, 1.4353179931640625, 1.482421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 13.0, 24.0, 23.0, 55.0, 54.0, 96.0, 187.0, 272.0, 375.0, 623.0, 967.0, 1645.0, 2560.0, 4212.0, 7247.0, 12484.0, 21618.0, 37476.0, 64920.0, 108724.0, 167261.0, 1250176.0, 163120.0, 104504.0, 62400.0, 35958.0, 20657.0, 11784.0, 6993.0, 4177.0, 2411.0, 1497.0, 952.0, 591.0, 359.0, 235.0, 153.0, 108.0, 78.0, 48.0, 24.0, 22.0, 18.0, 13.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.2053852081298828, -0.19885635375976562, -0.19232749938964844, -0.18579864501953125, -0.17926979064941406, -0.17274093627929688, -0.1662120819091797, -0.1596832275390625, -0.1531543731689453, -0.14662551879882812, -0.14009666442871094, -0.13356781005859375, -0.12703895568847656, -0.12051010131835938, -0.11398124694824219, -0.107452392578125, -0.10092353820800781, -0.09439468383789062, -0.08786582946777344, -0.08133697509765625, -0.07480812072753906, -0.06827926635742188, -0.06175041198730469, -0.0552215576171875, -0.04869270324707031, -0.042163848876953125, -0.03563499450683594, -0.02910614013671875, -0.022577285766601562, -0.016048431396484375, -0.009519577026367188, -0.00299072265625, 0.0035381317138671875, 0.010066986083984375, 0.016595840454101562, 0.02312469482421875, 0.029653549194335938, 0.036182403564453125, 0.04271125793457031, 0.0492401123046875, 0.05576896667480469, 0.062297821044921875, 0.06882667541503906, 0.07535552978515625, 0.08188438415527344, 0.08841323852539062, 0.09494209289550781, 0.101470947265625, 0.10799980163574219, 0.11452865600585938, 0.12105751037597656, 0.12758636474609375, 0.13411521911621094, 0.14064407348632812, 0.1471729278564453, 0.1537017822265625, 0.1602306365966797, 0.16675949096679688, 0.17328834533691406, 0.17981719970703125, 0.18634605407714844, 0.19287490844726562, 0.1994037628173828, 0.2059326171875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 0.0, 8.0, 6.0, 7.0, 16.0, 7.0, 12.0, 17.0, 19.0, 24.0, 27.0, 34.0, 44.0, 45.0, 59.0, 55.0, 63.0, 75.0, 71.0, 72.0, 58.0, 46.0, 40.0, 35.0, 27.0, 25.0, 18.0, 22.0, 15.0, 9.0, 6.0, 6.0, 7.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001064300537109375, -0.0010314732789993286, -0.0009986460208892822, -0.0009658187627792358, -0.0009329915046691895, -0.0009001642465591431, -0.0008673369884490967, -0.0008345097303390503, -0.0008016824722290039, -0.0007688552141189575, -0.0007360279560089111, -0.0007032006978988647, -0.0006703734397888184, -0.000637546181678772, -0.0006047189235687256, -0.0005718916654586792, -0.0005390644073486328, -0.0005062371492385864, -0.00047340989112854004, -0.00044058263301849365, -0.00040775537490844727, -0.0003749281167984009, -0.0003421008586883545, -0.0003092736005783081, -0.0002764463424682617, -0.00024361908435821533, -0.00021079182624816895, -0.00017796456813812256, -0.00014513731002807617, -0.00011231005191802979, -7.94827938079834e-05, -4.665553569793701e-05, -1.3828277587890625e-05, 1.8998980522155762e-05, 5.182623863220215e-05, 8.465349674224854e-05, 0.00011748075485229492, 0.0001503080129623413, 0.0001831352710723877, 0.00021596252918243408, 0.00024878978729248047, 0.00028161704540252686, 0.00031444430351257324, 0.00034727156162261963, 0.000380098819732666, 0.0004129260778427124, 0.0004457533359527588, 0.0004785805940628052, 0.0005114078521728516, 0.000544235110282898, 0.0005770623683929443, 0.0006098896265029907, 0.0006427168846130371, 0.0006755441427230835, 0.0007083714008331299, 0.0007411986589431763, 0.0007740259170532227, 0.000806853175163269, 0.0008396804332733154, 0.0008725076913833618, 0.0009053349494934082, 0.0009381622076034546, 0.000970989465713501, 0.0010038167238235474, 0.0010366439819335938]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 8.0, 9.0, 12.0, 15.0, 25.0, 25.0, 30.0, 49.0, 79.0, 65.0, 109.0, 168.0, 222.0, 346.0, 610.0, 4725.0, 1030990.0, 9136.0, 716.0, 363.0, 212.0, 158.0, 125.0, 83.0, 57.0, 52.0, 38.0, 31.0, 21.0, 18.0, 19.0, 9.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247039794921875, -0.024009227752685547, -0.023314476013183594, -0.02261972427368164, -0.021924972534179688, -0.021230220794677734, -0.02053546905517578, -0.019840717315673828, -0.019145965576171875, -0.018451213836669922, -0.01775646209716797, -0.017061710357666016, -0.016366958618164062, -0.01567220687866211, -0.014977455139160156, -0.014282703399658203, -0.01358795166015625, -0.012893199920654297, -0.012198448181152344, -0.01150369644165039, -0.010808944702148438, -0.010114192962646484, -0.009419441223144531, -0.008724689483642578, -0.008029937744140625, -0.007335186004638672, -0.006640434265136719, -0.005945682525634766, -0.0052509307861328125, -0.004556179046630859, -0.0038614273071289062, -0.003166675567626953, -0.002471923828125, -0.0017771720886230469, -0.0010824203491210938, -0.0003876686096191406, 0.0003070831298828125, 0.0010018348693847656, 0.0016965866088867188, 0.002391338348388672, 0.003086090087890625, 0.003780841827392578, 0.004475593566894531, 0.005170345306396484, 0.0058650970458984375, 0.006559848785400391, 0.007254600524902344, 0.007949352264404297, 0.00864410400390625, 0.009338855743408203, 0.010033607482910156, 0.01072835922241211, 0.011423110961914062, 0.012117862701416016, 0.012812614440917969, 0.013507366180419922, 0.014202117919921875, 0.014896869659423828, 0.015591621398925781, 0.016286373138427734, 0.016981124877929688, 0.01767587661743164, 0.018370628356933594, 0.019065380096435547, 0.0197601318359375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 660.0, 349.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.017048466950654984, -0.016749100759625435, -0.016449736431241035, -0.016150370240211487, -0.015851005911827087, -0.015551640652120113, -0.01525227539241314, -0.01495290920138359, -0.014653544872999191, -0.014354179613292217, -0.014054814353585243, -0.01375544909387827, -0.013456083834171295, -0.013156718574464321, -0.012857353314757347, -0.012557987123727798, -0.012258621864020824, -0.01195925660431385, -0.011659891344606876, -0.011360526084899902, -0.011061160825192928, -0.010761795565485954, -0.01046243030577898, -0.010163065046072006, -0.009863698855042458, -0.009564333595335484, -0.00926496833562851, -0.008965603075921535, -0.008666237816214561, -0.008366872556507587, -0.008067507296800613, -0.007768141571432352, -0.007468776777386665, -0.007169411517679691, -0.006870046257972717, -0.006570680998265743, -0.006271315738558769, -0.005971950478851795, -0.005672584753483534, -0.00537321949377656, -0.005073854699730873, -0.004774489440023899, -0.004475124180316925, -0.004175758920609951, -0.0038763934280723333, -0.0035770281683653593, -0.0032776626758277416, -0.0029782974161207676, -0.00267893192358315, -0.002379566663876176, -0.002080201171338558, -0.0017808359116315842, -0.0014814706519246101, -0.001182105392217636, -0.0008827400160953403, -0.0005833746399730444, -0.00028400938026607037, 1.5355937648564577e-05, 0.0003147212555631995, 0.0006140865734778345, 0.0009134518913924694, 0.0012128171510994434, 0.0015121825272217393, 0.0018115479033440351, 0.002110913163051009]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 6.0, 13.0, 12.0, 11.0, 17.0, 16.0, 15.0, 25.0, 27.0, 36.0, 38.0, 32.0, 43.0, 48.0, 49.0, 34.0, 46.0, 50.0, 36.0, 35.0, 42.0, 31.0, 34.0, 35.0, 40.0, 25.0, 31.0, 31.0, 25.0, 21.0, 20.0, 8.0, 12.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000490725040435791, -0.00047256797552108765, -0.0004544109106063843, -0.0004362538456916809, -0.00041809678077697754, -0.00039993971586227417, -0.0003817826509475708, -0.00036362558603286743, -0.00034546852111816406, -0.0003273114562034607, -0.0003091543912887573, -0.00029099732637405396, -0.0002728402614593506, -0.0002546831965446472, -0.00023652613162994385, -0.00021836906671524048, -0.0002002120018005371, -0.00018205493688583374, -0.00016389787197113037, -0.000145740807056427, -0.00012758374214172363, -0.00010942667722702026, -9.12696123123169e-05, -7.311254739761353e-05, -5.4955482482910156e-05, -3.679841756820679e-05, -1.8641352653503418e-05, -4.842877388000488e-07, 1.767277717590332e-05, 3.582984209060669e-05, 5.398690700531006e-05, 7.214397192001343e-05, 9.03010368347168e-05, 0.00010845810174942017, 0.00012661516666412354, 0.0001447722315788269, 0.00016292929649353027, 0.00018108636140823364, 0.000199243426322937, 0.00021740049123764038, 0.00023555755615234375, 0.0002537146210670471, 0.0002718716859817505, 0.00029002875089645386, 0.0003081858158111572, 0.0003263428807258606, 0.00034449994564056396, 0.00036265701055526733, 0.0003808140754699707, 0.00039897114038467407, 0.00041712820529937744, 0.0004352852702140808, 0.0004534423351287842, 0.00047159940004348755, 0.0004897564649581909, 0.0005079135298728943, 0.0005260705947875977, 0.000544227659702301, 0.0005623847246170044, 0.0005805417895317078, 0.0005986988544464111, 0.0006168559193611145, 0.0006350129842758179, 0.0006531700491905212, 0.0006713271141052246]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 3.0, 8.0, 10.0, 12.0, 21.0, 18.0, 26.0, 16.0, 20.0, 17.0, 24.0, 19.0, 30.0, 28.0, 35.0, 32.0, 22.0, 41.0, 39.0, 32.0, 36.0, 29.0, 29.0, 29.0, 43.0, 45.0, 39.0, 26.0, 26.0, 34.0, 29.0, 20.0, 22.0, 21.0, 15.0, 10.0, 10.0, 12.0, 8.0, 4.0, 11.0, 4.0, 7.0, 3.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0], "bins": [-1.8408203125, -1.7857208251953125, -1.730621337890625, -1.6755218505859375, -1.62042236328125, -1.5653228759765625, -1.510223388671875, -1.4551239013671875, -1.4000244140625, -1.3449249267578125, -1.289825439453125, -1.2347259521484375, -1.17962646484375, -1.1245269775390625, -1.069427490234375, -1.0143280029296875, -0.959228515625, -0.9041290283203125, -0.849029541015625, -0.7939300537109375, -0.73883056640625, -0.6837310791015625, -0.628631591796875, -0.5735321044921875, -0.5184326171875, -0.4633331298828125, -0.408233642578125, -0.3531341552734375, -0.29803466796875, -0.2429351806640625, -0.187835693359375, -0.1327362060546875, -0.07763671875, -0.0225372314453125, 0.032562255859375, 0.0876617431640625, 0.14276123046875, 0.1978607177734375, 0.252960205078125, 0.3080596923828125, 0.3631591796875, 0.4182586669921875, 0.473358154296875, 0.5284576416015625, 0.58355712890625, 0.6386566162109375, 0.693756103515625, 0.7488555908203125, 0.803955078125, 0.8590545654296875, 0.914154052734375, 0.9692535400390625, 1.02435302734375, 1.0794525146484375, 1.134552001953125, 1.1896514892578125, 1.2447509765625, 1.2998504638671875, 1.354949951171875, 1.4100494384765625, 1.46514892578125, 1.5202484130859375, 1.575347900390625, 1.6304473876953125, 1.685546875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 16.0, 13.0, 28.0, 32.0, 92.0, 114.0, 194.0, 326.0, 614.0, 1058.0, 1637.0, 2920.0, 4977.0, 9849.0, 23242.0, 87268.0, 552430.0, 282595.0, 47833.0, 16038.0, 7528.0, 4145.0, 2235.0, 1354.0, 811.0, 492.0, 301.0, 178.0, 90.0, 55.0, 37.0, 13.0, 17.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.85205078125, -9.5322265625, -9.21240234375, -8.892578125, -8.57275390625, -8.2529296875, -7.93310546875, -7.61328125, -7.29345703125, -6.9736328125, -6.65380859375, -6.333984375, -6.01416015625, -5.6943359375, -5.37451171875, -5.0546875, -4.73486328125, -4.4150390625, -4.09521484375, -3.775390625, -3.45556640625, -3.1357421875, -2.81591796875, -2.49609375, -2.17626953125, -1.8564453125, -1.53662109375, -1.216796875, -0.89697265625, -0.5771484375, -0.25732421875, 0.0625, 0.38232421875, 0.7021484375, 1.02197265625, 1.341796875, 1.66162109375, 1.9814453125, 2.30126953125, 2.62109375, 2.94091796875, 3.2607421875, 3.58056640625, 3.900390625, 4.22021484375, 4.5400390625, 4.85986328125, 5.1796875, 5.49951171875, 5.8193359375, 6.13916015625, 6.458984375, 6.77880859375, 7.0986328125, 7.41845703125, 7.73828125, 8.05810546875, 8.3779296875, 8.69775390625, 9.017578125, 9.33740234375, 9.6572265625, 9.97705078125, 10.296875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 2.0, 7.0, 6.0, 15.0, 7.0, 10.0, 12.0, 18.0, 16.0, 25.0, 26.0, 24.0, 33.0, 43.0, 40.0, 41.0, 64.0, 87.0, 117.0, 222.0, 1500.0, 198.0, 86.0, 70.0, 54.0, 51.0, 36.0, 41.0, 26.0, 28.0, 30.0, 19.0, 17.0, 19.0, 10.0, 18.0, 8.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8359375, -6.6309814453125, -6.426025390625, -6.2210693359375, -6.01611328125, -5.8111572265625, -5.606201171875, -5.4012451171875, -5.1962890625, -4.9913330078125, -4.786376953125, -4.5814208984375, -4.37646484375, -4.1715087890625, -3.966552734375, -3.7615966796875, -3.556640625, -3.3516845703125, -3.146728515625, -2.9417724609375, -2.73681640625, -2.5318603515625, -2.326904296875, -2.1219482421875, -1.9169921875, -1.7120361328125, -1.507080078125, -1.3021240234375, -1.09716796875, -0.8922119140625, -0.687255859375, -0.4822998046875, -0.27734375, -0.0723876953125, 0.132568359375, 0.3375244140625, 0.54248046875, 0.7474365234375, 0.952392578125, 1.1573486328125, 1.3623046875, 1.5672607421875, 1.772216796875, 1.9771728515625, 2.18212890625, 2.3870849609375, 2.592041015625, 2.7969970703125, 3.001953125, 3.2069091796875, 3.411865234375, 3.6168212890625, 3.82177734375, 4.0267333984375, 4.231689453125, 4.4366455078125, 4.6416015625, 4.8465576171875, 5.051513671875, 5.2564697265625, 5.46142578125, 5.6663818359375, 5.871337890625, 6.0762939453125, 6.28125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 4.0, 9.0, 9.0, 10.0, 14.0, 8.0, 24.0, 23.0, 19.0, 30.0, 33.0, 42.0, 77.0, 146.0, 376.0, 1209.0, 15095.0, 3076451.0, 49425.0, 1723.0, 450.0, 162.0, 89.0, 52.0, 40.0, 36.0, 25.0, 21.0, 18.0, 17.0, 9.0, 11.0, 11.0, 3.0, 12.0, 9.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.234375, -28.279296875, -27.32421875, -26.369140625, -25.4140625, -24.458984375, -23.50390625, -22.548828125, -21.59375, -20.638671875, -19.68359375, -18.728515625, -17.7734375, -16.818359375, -15.86328125, -14.908203125, -13.953125, -12.998046875, -12.04296875, -11.087890625, -10.1328125, -9.177734375, -8.22265625, -7.267578125, -6.3125, -5.357421875, -4.40234375, -3.447265625, -2.4921875, -1.537109375, -0.58203125, 0.373046875, 1.328125, 2.283203125, 3.23828125, 4.193359375, 5.1484375, 6.103515625, 7.05859375, 8.013671875, 8.96875, 9.923828125, 10.87890625, 11.833984375, 12.7890625, 13.744140625, 14.69921875, 15.654296875, 16.609375, 17.564453125, 18.51953125, 19.474609375, 20.4296875, 21.384765625, 22.33984375, 23.294921875, 24.25, 25.205078125, 26.16015625, 27.115234375, 28.0703125, 29.025390625, 29.98046875, 30.935546875, 31.890625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 54.0, 604.0, 350.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.086029052734375, -43.640907287597656, -41.1957893371582, -38.750667572021484, -36.30554962158203, -33.86042785644531, -31.415307998657227, -28.97018814086914, -26.525068283081055, -24.07994842529297, -21.634828567504883, -19.189708709716797, -16.744586944580078, -14.299468040466309, -11.854347229003906, -9.40922737121582, -6.964107513427734, -4.518987655639648, -2.0738673210144043, 0.37125301361083984, 2.816372871398926, 5.261492729187012, 7.706613540649414, 10.1517333984375, 12.596853256225586, 15.041973114013672, 17.487092971801758, 19.932212829589844, 22.377334594726562, 24.822452545166016, 27.267574310302734, 29.71269416809082, 32.157814025878906, 34.602935791015625, 37.04805374145508, 39.4931755065918, 41.93829345703125, 44.38341522216797, 46.82853698730469, 49.27365493774414, 51.718772888183594, 54.16389465332031, 56.609012603759766, 59.054134368896484, 61.49925231933594, 63.944374084472656, 66.38949584960938, 68.83460998535156, 71.27973937988281, 73.72486114501953, 76.16998291015625, 78.61509704589844, 81.06021881103516, 83.50534057617188, 85.9504623413086, 88.39558410644531, 90.8406982421875, 93.28582000732422, 95.73094177246094, 98.17605590820312, 100.62117767333984, 103.06629943847656, 105.51142120361328, 107.95654296875, 110.40165710449219]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 6.0, 7.0, 14.0, 12.0, 16.0, 12.0, 27.0, 20.0, 31.0, 22.0, 36.0, 27.0, 32.0, 30.0, 35.0, 37.0, 33.0, 28.0, 32.0, 36.0, 40.0, 43.0, 40.0, 26.0, 41.0, 31.0, 31.0, 32.0, 32.0, 27.0, 17.0, 28.0, 19.0, 24.0, 18.0, 1.0, 8.0, 12.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.65854835510254, -17.054975509643555, -16.45140266418457, -15.847830772399902, -15.244257926940918, -14.640685081481934, -14.037113189697266, -13.433540344238281, -12.829967498779297, -12.226394653320312, -11.622821807861328, -11.01924991607666, -10.415677070617676, -9.812104225158691, -9.208532333374023, -8.604959487915039, -8.001386642456055, -7.39781379699707, -6.794241428375244, -6.190669059753418, -5.587096214294434, -4.983523368835449, -4.379951000213623, -3.776378631591797, -3.1728057861328125, -2.5692331790924072, -1.965660572052002, -1.3620879650115967, -0.7585153579711914, -0.15494275093078613, 0.44862985610961914, 1.0522022247314453, 1.6557769775390625, 2.2593495845794678, 2.862922191619873, 3.4664947986602783, 4.070067405700684, 4.673640251159668, 5.277212619781494, 5.88078498840332, 6.484357833862305, 7.087930679321289, 7.691503047943115, 8.295075416564941, 8.898648262023926, 9.50222110748291, 10.105792999267578, 10.709365844726562, 11.312938690185547, 11.916511535644531, 12.520084381103516, 13.123656272888184, 13.727229118347168, 14.330801963806152, 14.93437385559082, 15.537946701049805, 16.14151954650879, 16.745092391967773, 17.348665237426758, 17.952238082885742, 18.555809020996094, 19.159381866455078, 19.762954711914062, 20.366527557373047, 20.97010040283203]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 4.0, 5.0, 11.0, 9.0, 16.0, 19.0, 18.0, 14.0, 19.0, 17.0, 20.0, 27.0, 22.0, 20.0, 32.0, 26.0, 30.0, 33.0, 36.0, 27.0, 29.0, 44.0, 29.0, 31.0, 30.0, 35.0, 52.0, 37.0, 28.0, 29.0, 28.0, 24.0, 32.0, 19.0, 16.0, 19.0, 9.0, 17.0, 15.0, 5.0, 8.0, 9.0, 10.0, 5.0, 3.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.8232421875, -1.7660980224609375, -1.708953857421875, -1.6518096923828125, -1.59466552734375, -1.5375213623046875, -1.480377197265625, -1.4232330322265625, -1.3660888671875, -1.3089447021484375, -1.251800537109375, -1.1946563720703125, -1.13751220703125, -1.0803680419921875, -1.023223876953125, -0.9660797119140625, -0.908935546875, -0.8517913818359375, -0.794647216796875, -0.7375030517578125, -0.68035888671875, -0.6232147216796875, -0.566070556640625, -0.5089263916015625, -0.4517822265625, -0.3946380615234375, -0.337493896484375, -0.2803497314453125, -0.22320556640625, -0.1660614013671875, -0.108917236328125, -0.0517730712890625, 0.00537109375, 0.0625152587890625, 0.119659423828125, 0.1768035888671875, 0.23394775390625, 0.2910919189453125, 0.348236083984375, 0.4053802490234375, 0.4625244140625, 0.5196685791015625, 0.576812744140625, 0.6339569091796875, 0.69110107421875, 0.7482452392578125, 0.805389404296875, 0.8625335693359375, 0.919677734375, 0.9768218994140625, 1.033966064453125, 1.0911102294921875, 1.14825439453125, 1.2053985595703125, 1.262542724609375, 1.3196868896484375, 1.3768310546875, 1.4339752197265625, 1.491119384765625, 1.5482635498046875, 1.60540771484375, 1.6625518798828125, 1.719696044921875, 1.7768402099609375, 1.833984375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 5.0, 6.0, 7.0, 18.0, 11.0, 21.0, 33.0, 46.0, 51.0, 63.0, 92.0, 127.0, 166.0, 290.0, 465.0, 1002.0, 2852.0, 10323.0, 48766.0, 368108.0, 3181187.0, 502508.0, 59177.0, 12456.0, 3554.0, 1230.0, 591.0, 361.0, 210.0, 138.0, 107.0, 78.0, 50.0, 45.0, 32.0, 20.0, 21.0, 16.0, 9.0, 11.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.1875, -10.8214111328125, -10.455322265625, -10.0892333984375, -9.72314453125, -9.3570556640625, -8.990966796875, -8.6248779296875, -8.2587890625, -7.8927001953125, -7.526611328125, -7.1605224609375, -6.79443359375, -6.4283447265625, -6.062255859375, -5.6961669921875, -5.330078125, -4.9639892578125, -4.597900390625, -4.2318115234375, -3.86572265625, -3.4996337890625, -3.133544921875, -2.7674560546875, -2.4013671875, -2.0352783203125, -1.669189453125, -1.3031005859375, -0.93701171875, -0.5709228515625, -0.204833984375, 0.1612548828125, 0.52734375, 0.8934326171875, 1.259521484375, 1.6256103515625, 1.99169921875, 2.3577880859375, 2.723876953125, 3.0899658203125, 3.4560546875, 3.8221435546875, 4.188232421875, 4.5543212890625, 4.92041015625, 5.2864990234375, 5.652587890625, 6.0186767578125, 6.384765625, 6.7508544921875, 7.116943359375, 7.4830322265625, 7.84912109375, 8.2152099609375, 8.581298828125, 8.9473876953125, 9.3134765625, 9.6795654296875, 10.045654296875, 10.4117431640625, 10.77783203125, 11.1439208984375, 11.510009765625, 11.8760986328125, 12.2421875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 10.0, 7.0, 19.0, 32.0, 67.0, 100.0, 172.0, 274.0, 442.0, 718.0, 816.0, 585.0, 331.0, 208.0, 133.0, 78.0, 37.0, 25.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.890625, -14.442626953125, -13.99462890625, -13.546630859375, -13.0986328125, -12.650634765625, -12.20263671875, -11.754638671875, -11.306640625, -10.858642578125, -10.41064453125, -9.962646484375, -9.5146484375, -9.066650390625, -8.61865234375, -8.170654296875, -7.72265625, -7.274658203125, -6.82666015625, -6.378662109375, -5.9306640625, -5.482666015625, -5.03466796875, -4.586669921875, -4.138671875, -3.690673828125, -3.24267578125, -2.794677734375, -2.3466796875, -1.898681640625, -1.45068359375, -1.002685546875, -0.5546875, -0.106689453125, 0.34130859375, 0.789306640625, 1.2373046875, 1.685302734375, 2.13330078125, 2.581298828125, 3.029296875, 3.477294921875, 3.92529296875, 4.373291015625, 4.8212890625, 5.269287109375, 5.71728515625, 6.165283203125, 6.61328125, 7.061279296875, 7.50927734375, 7.957275390625, 8.4052734375, 8.853271484375, 9.30126953125, 9.749267578125, 10.197265625, 10.645263671875, 11.09326171875, 11.541259765625, 11.9892578125, 12.437255859375, 12.88525390625, 13.333251953125, 13.78125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 8.0, 13.0, 11.0, 32.0, 68.0, 109.0, 194.0, 458.0, 1474.0, 13421.0, 2186599.0, 1976721.0, 12824.0, 1430.0, 472.0, 219.0, 98.0, 54.0, 34.0, 23.0, 14.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.49267578125, -32.2041015625, -30.91552734375, -29.626953125, -28.33837890625, -27.0498046875, -25.76123046875, -24.47265625, -23.18408203125, -21.8955078125, -20.60693359375, -19.318359375, -18.02978515625, -16.7412109375, -15.45263671875, -14.1640625, -12.87548828125, -11.5869140625, -10.29833984375, -9.009765625, -7.72119140625, -6.4326171875, -5.14404296875, -3.85546875, -2.56689453125, -1.2783203125, 0.01025390625, 1.298828125, 2.58740234375, 3.8759765625, 5.16455078125, 6.453125, 7.74169921875, 9.0302734375, 10.31884765625, 11.607421875, 12.89599609375, 14.1845703125, 15.47314453125, 16.76171875, 18.05029296875, 19.3388671875, 20.62744140625, 21.916015625, 23.20458984375, 24.4931640625, 25.78173828125, 27.0703125, 28.35888671875, 29.6474609375, 30.93603515625, 32.224609375, 33.51318359375, 34.8017578125, 36.09033203125, 37.37890625, 38.66748046875, 39.9560546875, 41.24462890625, 42.533203125, 43.82177734375, 45.1103515625, 46.39892578125, 47.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 12.0, 46.0, 79.0, 142.0, 219.0, 231.0, 169.0, 69.0, 23.0, 10.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.769012451171875, -31.641738891601562, -29.514463424682617, -27.387187957763672, -25.25991439819336, -23.132640838623047, -21.0053653717041, -18.878089904785156, -16.750816345214844, -14.623541831970215, -12.496267318725586, -10.368992805480957, -8.241718292236328, -6.114443778991699, -3.9871692657470703, -1.8598947525024414, 0.2673797607421875, 2.3946542739868164, 4.521928787231445, 6.649203300476074, 8.776477813720703, 10.903752326965332, 13.031026840209961, 15.15830135345459, 17.28557586669922, 19.41284942626953, 21.540124893188477, 23.667400360107422, 25.794673919677734, 27.921947479248047, 30.049222946166992, 32.17649841308594, 34.30376434326172, 36.43103790283203, 38.558311462402344, 40.68558883666992, 42.812862396240234, 44.94013595581055, 47.067413330078125, 49.19468688964844, 51.32196044921875, 53.44923400878906, 55.576507568359375, 57.70378494262695, 59.831058502197266, 61.95833206176758, 64.08560943603516, 66.21288299560547, 68.34015655517578, 70.4674301147461, 72.5947036743164, 74.72197723388672, 76.84925842285156, 78.97653198242188, 81.10380554199219, 83.2310791015625, 85.35835266113281, 87.48562622070312, 89.61289978027344, 91.74017333984375, 93.86744689941406, 95.9947280883789, 98.12200164794922, 100.24927520751953, 102.37654876708984]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 7.0, 11.0, 4.0, 10.0, 17.0, 14.0, 22.0, 22.0, 20.0, 26.0, 26.0, 32.0, 22.0, 34.0, 39.0, 33.0, 45.0, 49.0, 41.0, 35.0, 44.0, 47.0, 36.0, 31.0, 46.0, 34.0, 35.0, 36.0, 30.0, 29.0, 19.0, 25.0, 21.0, 8.0, 18.0, 9.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-35.46125793457031, -34.537391662597656, -33.613529205322266, -32.689666748046875, -31.76580047607422, -30.841936111450195, -29.918071746826172, -28.99420738220215, -28.070343017578125, -27.1464786529541, -26.222614288330078, -25.298749923706055, -24.37488555908203, -23.451021194458008, -22.527156829833984, -21.60329246520996, -20.679428100585938, -19.755563735961914, -18.83169937133789, -17.907835006713867, -16.983970642089844, -16.06010627746582, -15.136241912841797, -14.212377548217773, -13.28851318359375, -12.364648818969727, -11.440784454345703, -10.51692008972168, -9.593055725097656, -8.669191360473633, -7.745326995849609, -6.821462631225586, -5.8975982666015625, -4.973733901977539, -4.049869537353516, -3.126005172729492, -2.2021408081054688, -1.2782764434814453, -0.3544120788574219, 0.5694522857666016, 1.493316650390625, 2.4171810150146484, 3.341045379638672, 4.264909744262695, 5.188774108886719, 6.112638473510742, 7.036502838134766, 7.960367202758789, 8.884231567382812, 9.808095932006836, 10.73196029663086, 11.655824661254883, 12.579689025878906, 13.50355339050293, 14.427417755126953, 15.351282119750977, 16.275146484375, 17.199010848999023, 18.122875213623047, 19.04673957824707, 19.970603942871094, 20.894468307495117, 21.81833267211914, 22.742197036743164, 23.666061401367188]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 15.0, 14.0, 16.0, 24.0, 18.0, 22.0, 21.0, 27.0, 37.0, 26.0, 43.0, 32.0, 30.0, 36.0, 44.0, 50.0, 29.0, 37.0, 51.0, 33.0, 45.0, 35.0, 24.0, 27.0, 26.0, 27.0, 37.0, 16.0, 20.0, 21.0, 17.0, 12.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.96209716796875, -1.8948974609375, -1.82769775390625, -1.760498046875, -1.69329833984375, -1.6260986328125, -1.55889892578125, -1.49169921875, -1.42449951171875, -1.3572998046875, -1.29010009765625, -1.222900390625, -1.15570068359375, -1.0885009765625, -1.02130126953125, -0.9541015625, -0.88690185546875, -0.8197021484375, -0.75250244140625, -0.685302734375, -0.61810302734375, -0.5509033203125, -0.48370361328125, -0.41650390625, -0.34930419921875, -0.2821044921875, -0.21490478515625, -0.147705078125, -0.08050537109375, -0.0133056640625, 0.05389404296875, 0.12109375, 0.18829345703125, 0.2554931640625, 0.32269287109375, 0.389892578125, 0.45709228515625, 0.5242919921875, 0.59149169921875, 0.65869140625, 0.72589111328125, 0.7930908203125, 0.86029052734375, 0.927490234375, 0.99468994140625, 1.0618896484375, 1.12908935546875, 1.1962890625, 1.26348876953125, 1.3306884765625, 1.39788818359375, 1.465087890625, 1.53228759765625, 1.5994873046875, 1.66668701171875, 1.73388671875, 1.80108642578125, 1.8682861328125, 1.93548583984375, 2.002685546875, 2.06988525390625, 2.1370849609375, 2.20428466796875, 2.271484375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 10.0, 17.0, 18.0, 27.0, 38.0, 61.0, 69.0, 103.0, 181.0, 248.0, 377.0, 576.0, 921.0, 1352.0, 2105.0, 3398.0, 5256.0, 8049.0, 12717.0, 19853.0, 31104.0, 47700.0, 73258.0, 108096.0, 146876.0, 165314.0, 137107.0, 98089.0, 65582.0, 43080.0, 27484.0, 17483.0, 11728.0, 7227.0, 4680.0, 2934.0, 1860.0, 1166.0, 785.0, 560.0, 350.0, 236.0, 155.0, 121.0, 57.0, 55.0, 34.0, 21.0, 21.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.279296875, -0.27092742919921875, -0.2625579833984375, -0.25418853759765625, -0.245819091796875, -0.23744964599609375, -0.2290802001953125, -0.22071075439453125, -0.21234130859375, -0.20397186279296875, -0.1956024169921875, -0.18723297119140625, -0.178863525390625, -0.17049407958984375, -0.1621246337890625, -0.15375518798828125, -0.1453857421875, -0.13701629638671875, -0.1286468505859375, -0.12027740478515625, -0.111907958984375, -0.10353851318359375, -0.0951690673828125, -0.08679962158203125, -0.07843017578125, -0.07006072998046875, -0.0616912841796875, -0.05332183837890625, -0.044952392578125, -0.03658294677734375, -0.0282135009765625, -0.01984405517578125, -0.011474609375, -0.00310516357421875, 0.0052642822265625, 0.01363372802734375, 0.022003173828125, 0.03037261962890625, 0.0387420654296875, 0.04711151123046875, 0.05548095703125, 0.06385040283203125, 0.0722198486328125, 0.08058929443359375, 0.088958740234375, 0.09732818603515625, 0.1056976318359375, 0.11406707763671875, 0.1224365234375, 0.13080596923828125, 0.1391754150390625, 0.14754486083984375, 0.155914306640625, 0.16428375244140625, 0.1726531982421875, 0.18102264404296875, 0.18939208984375, 0.19776153564453125, 0.2061309814453125, 0.21450042724609375, 0.222869873046875, 0.23123931884765625, 0.2396087646484375, 0.24797821044921875, 0.25634765625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 9.0, 6.0, 4.0, 9.0, 12.0, 15.0, 14.0, 14.0, 18.0, 26.0, 24.0, 25.0, 23.0, 36.0, 29.0, 35.0, 24.0, 44.0, 39.0, 38.0, 1067.0, 38.0, 48.0, 50.0, 35.0, 31.0, 31.0, 35.0, 33.0, 25.0, 27.0, 21.0, 24.0, 20.0, 15.0, 15.0, 5.0, 14.0, 8.0, 3.0, 4.0, 7.0, 10.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.4296875, -1.3868865966796875, -1.344085693359375, -1.3012847900390625, -1.25848388671875, -1.2156829833984375, -1.172882080078125, -1.1300811767578125, -1.0872802734375, -1.0444793701171875, -1.001678466796875, -0.9588775634765625, -0.91607666015625, -0.8732757568359375, -0.830474853515625, -0.7876739501953125, -0.744873046875, -0.7020721435546875, -0.659271240234375, -0.6164703369140625, -0.57366943359375, -0.5308685302734375, -0.488067626953125, -0.4452667236328125, -0.4024658203125, -0.3596649169921875, -0.316864013671875, -0.2740631103515625, -0.23126220703125, -0.1884613037109375, -0.145660400390625, -0.1028594970703125, -0.06005859375, -0.0172576904296875, 0.025543212890625, 0.0683441162109375, 0.11114501953125, 0.1539459228515625, 0.196746826171875, 0.2395477294921875, 0.2823486328125, 0.3251495361328125, 0.367950439453125, 0.4107513427734375, 0.45355224609375, 0.4963531494140625, 0.539154052734375, 0.5819549560546875, 0.624755859375, 0.6675567626953125, 0.710357666015625, 0.7531585693359375, 0.79595947265625, 0.8387603759765625, 0.881561279296875, 0.9243621826171875, 0.9671630859375, 1.0099639892578125, 1.052764892578125, 1.0955657958984375, 1.13836669921875, 1.1811676025390625, 1.223968505859375, 1.2667694091796875, 1.3095703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 9.0, 13.0, 16.0, 30.0, 47.0, 88.0, 134.0, 229.0, 320.0, 447.0, 744.0, 1098.0, 1655.0, 2684.0, 3976.0, 6300.0, 9942.0, 16093.0, 25217.0, 39864.0, 61856.0, 93532.0, 132450.0, 1210960.0, 153150.0, 115259.0, 79130.0, 51839.0, 32900.0, 20733.0, 13086.0, 8459.0, 5274.0, 3412.0, 2173.0, 1387.0, 902.0, 615.0, 395.0, 240.0, 168.0, 120.0, 66.0, 41.0, 28.0, 25.0, 11.0, 10.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1802978515625, -0.17444229125976562, -0.16858673095703125, -0.16273117065429688, -0.1568756103515625, -0.15102005004882812, -0.14516448974609375, -0.13930892944335938, -0.133453369140625, -0.12759780883789062, -0.12174224853515625, -0.11588668823242188, -0.1100311279296875, -0.10417556762695312, -0.09832000732421875, -0.09246444702148438, -0.08660888671875, -0.08075332641601562, -0.07489776611328125, -0.06904220581054688, -0.0631866455078125, -0.057331085205078125, -0.05147552490234375, -0.045619964599609375, -0.039764404296875, -0.033908843994140625, -0.02805328369140625, -0.022197723388671875, -0.0163421630859375, -0.010486602783203125, -0.00463104248046875, 0.001224517822265625, 0.007080078125, 0.012935638427734375, 0.01879119873046875, 0.024646759033203125, 0.0305023193359375, 0.036357879638671875, 0.04221343994140625, 0.048069000244140625, 0.053924560546875, 0.059780120849609375, 0.06563568115234375, 0.07149124145507812, 0.0773468017578125, 0.08320236206054688, 0.08905792236328125, 0.09491348266601562, 0.10076904296875, 0.10662460327148438, 0.11248016357421875, 0.11833572387695312, 0.1241912841796875, 0.13004684448242188, 0.13590240478515625, 0.14175796508789062, 0.147613525390625, 0.15346908569335938, 0.15932464599609375, 0.16518020629882812, 0.1710357666015625, 0.17689132690429688, 0.18274688720703125, 0.18860244750976562, 0.1944580078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 2.0, 5.0, 0.0, 7.0, 8.0, 11.0, 7.0, 6.0, 9.0, 18.0, 23.0, 37.0, 49.0, 44.0, 64.0, 60.0, 64.0, 69.0, 79.0, 74.0, 65.0, 61.0, 46.0, 47.0, 32.0, 22.0, 14.0, 18.0, 12.0, 9.0, 7.0, 7.0, 2.0, 9.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010499954223632812, -0.001010894775390625, -0.0009717941284179688, -0.0009326934814453125, -0.0008935928344726562, -0.0008544921875, -0.0008153915405273438, -0.0007762908935546875, -0.0007371902465820312, -0.000698089599609375, -0.0006589889526367188, -0.0006198883056640625, -0.0005807876586914062, -0.00054168701171875, -0.0005025863647460938, -0.0004634857177734375, -0.00042438507080078125, -0.000385284423828125, -0.00034618377685546875, -0.0003070831298828125, -0.00026798248291015625, -0.0002288818359375, -0.00018978118896484375, -0.0001506805419921875, -0.00011157989501953125, -7.2479248046875e-05, -3.337860107421875e-05, 5.7220458984375e-06, 4.482269287109375e-05, 8.392333984375e-05, 0.00012302398681640625, 0.0001621246337890625, 0.00020122528076171875, 0.000240325927734375, 0.00027942657470703125, 0.0003185272216796875, 0.00035762786865234375, 0.000396728515625, 0.00043582916259765625, 0.0004749298095703125, 0.0005140304565429688, 0.000553131103515625, 0.0005922317504882812, 0.0006313323974609375, 0.0006704330444335938, 0.00070953369140625, 0.0007486343383789062, 0.0007877349853515625, 0.0008268356323242188, 0.000865936279296875, 0.0009050369262695312, 0.0009441375732421875, 0.0009832382202148438, 0.0010223388671875, 0.0010614395141601562, 0.0011005401611328125, 0.0011396408081054688, 0.001178741455078125, 0.0012178421020507812, 0.0012569427490234375, 0.0012960433959960938, 0.00133514404296875, 0.0013742446899414062, 0.0014133453369140625, 0.0014524459838867188]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 11.0, 4.0, 11.0, 17.0, 11.0, 22.0, 47.0, 71.0, 68.0, 133.0, 175.0, 291.0, 717.0, 12144.0, 1005489.0, 27406.0, 1004.0, 288.0, 204.0, 120.0, 78.0, 56.0, 39.0, 31.0, 32.0, 20.0, 13.0, 11.0, 10.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.03515625, -0.03426814079284668, -0.03338003158569336, -0.03249192237854004, -0.03160381317138672, -0.0307157039642334, -0.029827594757080078, -0.028939485549926758, -0.028051376342773438, -0.027163267135620117, -0.026275157928466797, -0.025387048721313477, -0.024498939514160156, -0.023610830307006836, -0.022722721099853516, -0.021834611892700195, -0.020946502685546875, -0.020058393478393555, -0.019170284271240234, -0.018282175064086914, -0.017394065856933594, -0.016505956649780273, -0.015617847442626953, -0.014729738235473633, -0.013841629028320312, -0.012953519821166992, -0.012065410614013672, -0.011177301406860352, -0.010289192199707031, -0.009401082992553711, -0.00851297378540039, -0.00762486457824707, -0.00673675537109375, -0.00584864616394043, -0.004960536956787109, -0.004072427749633789, -0.0031843185424804688, -0.0022962093353271484, -0.0014081001281738281, -0.0005199909210205078, 0.0003681182861328125, 0.0012562274932861328, 0.002144336700439453, 0.0030324459075927734, 0.003920555114746094, 0.004808664321899414, 0.005696773529052734, 0.006584882736206055, 0.007472991943359375, 0.008361101150512695, 0.009249210357666016, 0.010137319564819336, 0.011025428771972656, 0.011913537979125977, 0.012801647186279297, 0.013689756393432617, 0.014577865600585938, 0.015465974807739258, 0.016354084014892578, 0.0172421932220459, 0.01813030242919922, 0.01901841163635254, 0.01990652084350586, 0.02079463005065918, 0.0216827392578125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 71.0, 796.0, 142.0, 4.0], "bins": [-0.023746449500322342, -0.023361224681138992, -0.022975999861955643, -0.022590773180127144, -0.022205548360943794, -0.021820323541760445, -0.021435096859931946, -0.021049872040748596, -0.020664647221565247, -0.020279422402381897, -0.019894197583198547, -0.01950897090137005, -0.0191237460821867, -0.01873852126300335, -0.01835329458117485, -0.0179680697619915, -0.01758284494280815, -0.0171976201236248, -0.016812395304441452, -0.016427168622612953, -0.016041943803429604, -0.015656718984246254, -0.01527149323374033, -0.014886267483234406, -0.014501042664051056, -0.014115817844867706, -0.013730592094361782, -0.013345366343855858, -0.012960141524672508, -0.012574916705489159, -0.012189690954983234, -0.01180446520447731, -0.01141924038529396, -0.011034015566110611, -0.010648789815604687, -0.010263564065098763, -0.009878339245915413, -0.009493114426732063, -0.009107888676226139, -0.008722662925720215, -0.008337438106536865, -0.007952213287353516, -0.007566987536847591, -0.0071817622520029545, -0.0067965369671583176, -0.006411311682313681, -0.006026086397469044, -0.005640861112624407, -0.005255636293441057, -0.00487041100859642, -0.004485185723751783, -0.0040999604389071465, -0.0037147351540625095, -0.0033295098692178726, -0.0029442845843732357, -0.002559059299528599, -0.002173834014683962, -0.001788608729839325, -0.001403383444994688, -0.0010181581601500511, -0.0006329328753054142, -0.0002477075904607773, 0.00013751769438385963, 0.0005227429792284966, 0.0009079683222807944]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 6.0, 5.0, 5.0, 11.0, 15.0, 8.0, 10.0, 22.0, 32.0, 18.0, 22.0, 30.0, 38.0, 39.0, 33.0, 38.0, 35.0, 48.0, 44.0, 52.0, 47.0, 39.0, 40.0, 48.0, 33.0, 35.0, 31.0, 37.0, 28.0, 18.0, 27.0, 17.0, 18.0, 17.0, 17.0, 6.0, 18.0, 4.0, 4.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006969571113586426, -0.0006767930462956429, -0.0006566289812326431, -0.0006364649161696434, -0.0006163008511066437, -0.000596136786043644, -0.0005759727209806442, -0.0005558086559176445, -0.0005356445908546448, -0.000515480525791645, -0.0004953164607286453, -0.0004751523956656456, -0.0004549883306026459, -0.00043482426553964615, -0.0004146602004766464, -0.0003944961354136467, -0.00037433207035064697, -0.00035416800528764725, -0.0003340039402246475, -0.0003138398751616478, -0.00029367581009864807, -0.00027351174503564835, -0.0002533476799726486, -0.0002331836149096489, -0.00021301954984664917, -0.00019285548478364944, -0.00017269141972064972, -0.00015252735465765, -0.00013236328959465027, -0.00011219922453165054, -9.203515946865082e-05, -7.187109440565109e-05, -5.170702934265137e-05, -3.154296427965164e-05, -1.1378899216651917e-05, 8.785165846347809e-06, 2.8949230909347534e-05, 4.911329597234726e-05, 6.927736103534698e-05, 8.944142609834671e-05, 0.00010960549116134644, 0.00012976955622434616, 0.00014993362128734589, 0.0001700976863503456, 0.00019026175141334534, 0.00021042581647634506, 0.0002305898815393448, 0.0002507539466023445, 0.00027091801166534424, 0.00029108207672834396, 0.0003112461417913437, 0.0003314102068543434, 0.00035157427191734314, 0.00037173833698034286, 0.0003919024020433426, 0.0004120664671063423, 0.00043223053216934204, 0.00045239459723234177, 0.0004725586622953415, 0.0004927227273583412, 0.0005128867924213409, 0.0005330508574843407, 0.0005532149225473404, 0.0005733789876103401, 0.0005935430526733398]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 15.0, 14.0, 16.0, 24.0, 18.0, 22.0, 21.0, 27.0, 37.0, 26.0, 43.0, 32.0, 30.0, 36.0, 43.0, 51.0, 29.0, 37.0, 51.0, 33.0, 45.0, 35.0, 24.0, 27.0, 26.0, 27.0, 37.0, 16.0, 20.0, 21.0, 17.0, 12.0, 11.0, 9.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.96209716796875, -1.8948974609375, -1.82769775390625, -1.760498046875, -1.69329833984375, -1.6260986328125, -1.55889892578125, -1.49169921875, -1.42449951171875, -1.3572998046875, -1.29010009765625, -1.222900390625, -1.15570068359375, -1.0885009765625, -1.02130126953125, -0.9541015625, -0.88690185546875, -0.8197021484375, -0.75250244140625, -0.685302734375, -0.61810302734375, -0.5509033203125, -0.48370361328125, -0.41650390625, -0.34930419921875, -0.2821044921875, -0.21490478515625, -0.147705078125, -0.08050537109375, -0.0133056640625, 0.05389404296875, 0.12109375, 0.18829345703125, 0.2554931640625, 0.32269287109375, 0.389892578125, 0.45709228515625, 0.5242919921875, 0.59149169921875, 0.65869140625, 0.72589111328125, 0.7930908203125, 0.86029052734375, 0.927490234375, 0.99468994140625, 1.0618896484375, 1.12908935546875, 1.1962890625, 1.26348876953125, 1.3306884765625, 1.39788818359375, 1.465087890625, 1.53228759765625, 1.5994873046875, 1.66668701171875, 1.73388671875, 1.80108642578125, 1.8682861328125, 1.93548583984375, 2.002685546875, 2.06988525390625, 2.1370849609375, 2.20428466796875, 2.271484375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 11.0, 18.0, 22.0, 28.0, 39.0, 63.0, 68.0, 126.0, 149.0, 251.0, 407.0, 600.0, 1000.0, 1622.0, 2953.0, 5884.0, 12240.0, 27274.0, 68024.0, 182632.0, 391188.0, 214733.0, 79589.0, 31371.0, 13762.0, 6389.0, 3304.0, 1792.0, 1058.0, 659.0, 426.0, 258.0, 196.0, 111.0, 88.0, 72.0, 38.0, 25.0, 13.0, 15.0, 13.0, 14.0, 8.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9223175048828125, -1.857330322265625, -1.7923431396484375, -1.72735595703125, -1.6623687744140625, -1.597381591796875, -1.5323944091796875, -1.4674072265625, -1.4024200439453125, -1.337432861328125, -1.2724456787109375, -1.20745849609375, -1.1424713134765625, -1.077484130859375, -1.0124969482421875, -0.947509765625, -0.8825225830078125, -0.817535400390625, -0.7525482177734375, -0.68756103515625, -0.6225738525390625, -0.557586669921875, -0.4925994873046875, -0.4276123046875, -0.3626251220703125, -0.297637939453125, -0.2326507568359375, -0.16766357421875, -0.1026763916015625, -0.037689208984375, 0.0272979736328125, 0.09228515625, 0.1572723388671875, 0.222259521484375, 0.2872467041015625, 0.35223388671875, 0.4172210693359375, 0.482208251953125, 0.5471954345703125, 0.6121826171875, 0.6771697998046875, 0.742156982421875, 0.8071441650390625, 0.87213134765625, 0.9371185302734375, 1.002105712890625, 1.0670928955078125, 1.132080078125, 1.1970672607421875, 1.262054443359375, 1.3270416259765625, 1.39202880859375, 1.4570159912109375, 1.522003173828125, 1.5869903564453125, 1.6519775390625, 1.7169647216796875, 1.781951904296875, 1.8469390869140625, 1.91192626953125, 1.9769134521484375, 2.041900634765625, 2.1068878173828125, 2.171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 5.0, 11.0, 21.0, 18.0, 13.0, 19.0, 23.0, 29.0, 27.0, 43.0, 30.0, 40.0, 41.0, 45.0, 77.0, 122.0, 439.0, 1459.0, 145.0, 72.0, 44.0, 42.0, 34.0, 41.0, 27.0, 28.0, 30.0, 22.0, 15.0, 12.0, 16.0, 13.0, 9.0, 7.0, 12.0, 3.0, 7.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.71875, -7.45263671875, -7.1865234375, -6.92041015625, -6.654296875, -6.38818359375, -6.1220703125, -5.85595703125, -5.58984375, -5.32373046875, -5.0576171875, -4.79150390625, -4.525390625, -4.25927734375, -3.9931640625, -3.72705078125, -3.4609375, -3.19482421875, -2.9287109375, -2.66259765625, -2.396484375, -2.13037109375, -1.8642578125, -1.59814453125, -1.33203125, -1.06591796875, -0.7998046875, -0.53369140625, -0.267578125, -0.00146484375, 0.2646484375, 0.53076171875, 0.796875, 1.06298828125, 1.3291015625, 1.59521484375, 1.861328125, 2.12744140625, 2.3935546875, 2.65966796875, 2.92578125, 3.19189453125, 3.4580078125, 3.72412109375, 3.990234375, 4.25634765625, 4.5224609375, 4.78857421875, 5.0546875, 5.32080078125, 5.5869140625, 5.85302734375, 6.119140625, 6.38525390625, 6.6513671875, 6.91748046875, 7.18359375, 7.44970703125, 7.7158203125, 7.98193359375, 8.248046875, 8.51416015625, 8.7802734375, 9.04638671875, 9.3125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 12.0, 12.0, 10.0, 12.0, 12.0, 18.0, 15.0, 40.0, 32.0, 35.0, 60.0, 69.0, 98.0, 213.0, 500.0, 1644.0, 26164.0, 3078801.0, 34866.0, 1844.0, 537.0, 221.0, 112.0, 64.0, 67.0, 43.0, 35.0, 29.0, 18.0, 24.0, 17.0, 10.0, 15.0, 15.0, 11.0, 5.0, 1.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.296875, -19.7412109375, -19.185546875, -18.6298828125, -18.07421875, -17.5185546875, -16.962890625, -16.4072265625, -15.8515625, -15.2958984375, -14.740234375, -14.1845703125, -13.62890625, -13.0732421875, -12.517578125, -11.9619140625, -11.40625, -10.8505859375, -10.294921875, -9.7392578125, -9.18359375, -8.6279296875, -8.072265625, -7.5166015625, -6.9609375, -6.4052734375, -5.849609375, -5.2939453125, -4.73828125, -4.1826171875, -3.626953125, -3.0712890625, -2.515625, -1.9599609375, -1.404296875, -0.8486328125, -0.29296875, 0.2626953125, 0.818359375, 1.3740234375, 1.9296875, 2.4853515625, 3.041015625, 3.5966796875, 4.15234375, 4.7080078125, 5.263671875, 5.8193359375, 6.375, 6.9306640625, 7.486328125, 8.0419921875, 8.59765625, 9.1533203125, 9.708984375, 10.2646484375, 10.8203125, 11.3759765625, 11.931640625, 12.4873046875, 13.04296875, 13.5986328125, 14.154296875, 14.7099609375, 15.265625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 21.0, 61.0, 89.0, 170.0, 192.0, 203.0, 144.0, 62.0, 36.0, 14.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.595901489257812, -12.172450065612793, -11.748998641967773, -11.32554817199707, -10.90209674835205, -10.478645324707031, -10.055193901062012, -9.631742477416992, -9.208291053771973, -8.784839630126953, -8.361388206481934, -7.937937259674072, -7.514485836029053, -7.091034889221191, -6.667583465576172, -6.244132041931152, -5.820681095123291, -5.3972296714782715, -4.97377872467041, -4.550327301025391, -4.126875877380371, -3.7034246921539307, -3.2799735069274902, -2.8565220832824707, -2.4330708980560303, -2.00961971282959, -1.5861682891845703, -1.1627171039581299, -0.7392657995223999, -0.3158144950866699, 0.10763669013977051, 0.53108811378479, 0.9545392990112305, 1.3779906034469604, 1.8014419078826904, 2.224893093109131, 2.6483445167541504, 3.071795701980591, 3.4952468872070312, 3.918698310852051, 4.34214973449707, 4.76560115814209, 5.189052104949951, 5.612503528594971, 6.03595495223999, 6.459405899047852, 6.882857322692871, 7.306308746337891, 7.729759693145752, 8.153210639953613, 8.576662063598633, 9.000113487243652, 9.423564910888672, 9.847016334533691, 10.270467758178711, 10.693918228149414, 11.117369651794434, 11.540821075439453, 11.964272499084473, 12.387723922729492, 12.811174392700195, 13.234625816345215, 13.658077239990234, 14.081528663635254, 14.504980087280273]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 0.0, 5.0, 6.0, 5.0, 10.0, 6.0, 20.0, 15.0, 14.0, 20.0, 27.0, 29.0, 43.0, 43.0, 50.0, 45.0, 51.0, 45.0, 49.0, 35.0, 41.0, 49.0, 46.0, 48.0, 44.0, 36.0, 33.0, 31.0, 28.0, 22.0, 29.0, 12.0, 11.0, 8.0, 8.0, 12.0, 9.0, 8.0, 8.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.994285583496094, -25.11273765563965, -24.231189727783203, -23.349641799926758, -22.468093872070312, -21.5865478515625, -20.704999923706055, -19.82345199584961, -18.941904067993164, -18.06035614013672, -17.178808212280273, -16.297260284423828, -15.4157133102417, -14.534165382385254, -13.652618408203125, -12.77107048034668, -11.889522552490234, -11.007974624633789, -10.126426696777344, -9.244879722595215, -8.36333179473877, -7.481783866882324, -6.600236415863037, -5.71868896484375, -4.837141036987305, -3.9555933475494385, -3.0740456581115723, -2.192497968673706, -1.3109502792358398, -0.42940235137939453, 0.4521450996398926, 1.3336925506591797, 2.215242385864258, 3.096790075302124, 3.9783377647399902, 4.859885215759277, 5.741433143615723, 6.622981071472168, 7.504528522491455, 8.386075973510742, 9.267623901367188, 10.149171829223633, 11.030719757080078, 11.912266731262207, 12.793814659118652, 13.675362586975098, 14.556909561157227, 15.438457489013672, 16.320005416870117, 17.201553344726562, 18.083101272583008, 18.964649200439453, 19.846195220947266, 20.727745056152344, 21.609291076660156, 22.4908390045166, 23.372386932373047, 24.253934860229492, 25.135482788085938, 26.017030715942383, 26.898578643798828, 27.78012466430664, 28.661672592163086, 29.54322052001953, 30.424768447875977]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 10.0, 9.0, 8.0, 16.0, 11.0, 22.0, 19.0, 22.0, 17.0, 21.0, 31.0, 36.0, 38.0, 26.0, 39.0, 32.0, 41.0, 44.0, 42.0, 41.0, 39.0, 39.0, 47.0, 30.0, 45.0, 21.0, 20.0, 39.0, 28.0, 31.0, 17.0, 25.0, 17.0, 8.0, 18.0, 8.0, 9.0, 11.0, 6.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.115234375, -2.045074462890625, -1.97491455078125, -1.904754638671875, -1.8345947265625, -1.764434814453125, -1.69427490234375, -1.624114990234375, -1.553955078125, -1.483795166015625, -1.41363525390625, -1.343475341796875, -1.2733154296875, -1.203155517578125, -1.13299560546875, -1.062835693359375, -0.99267578125, -0.922515869140625, -0.85235595703125, -0.782196044921875, -0.7120361328125, -0.641876220703125, -0.57171630859375, -0.501556396484375, -0.431396484375, -0.361236572265625, -0.29107666015625, -0.220916748046875, -0.1507568359375, -0.080596923828125, -0.01043701171875, 0.059722900390625, 0.1298828125, 0.200042724609375, 0.27020263671875, 0.340362548828125, 0.4105224609375, 0.480682373046875, 0.55084228515625, 0.621002197265625, 0.691162109375, 0.761322021484375, 0.83148193359375, 0.901641845703125, 0.9718017578125, 1.041961669921875, 1.11212158203125, 1.182281494140625, 1.25244140625, 1.322601318359375, 1.39276123046875, 1.462921142578125, 1.5330810546875, 1.603240966796875, 1.67340087890625, 1.743560791015625, 1.813720703125, 1.883880615234375, 1.95404052734375, 2.024200439453125, 2.0943603515625, 2.164520263671875, 2.23468017578125, 2.304840087890625, 2.375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 5.0, 14.0, 20.0, 19.0, 29.0, 31.0, 37.0, 43.0, 66.0, 53.0, 108.0, 202.0, 433.0, 1180.0, 3613.0, 14040.0, 68124.0, 544436.0, 3048829.0, 436993.0, 58200.0, 12220.0, 3305.0, 1146.0, 444.0, 216.0, 123.0, 77.0, 56.0, 47.0, 41.0, 22.0, 20.0, 28.0, 8.0, 12.0, 19.0, 3.0, 5.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.734375, -10.431640625, -10.12890625, -9.826171875, -9.5234375, -9.220703125, -8.91796875, -8.615234375, -8.3125, -8.009765625, -7.70703125, -7.404296875, -7.1015625, -6.798828125, -6.49609375, -6.193359375, -5.890625, -5.587890625, -5.28515625, -4.982421875, -4.6796875, -4.376953125, -4.07421875, -3.771484375, -3.46875, -3.166015625, -2.86328125, -2.560546875, -2.2578125, -1.955078125, -1.65234375, -1.349609375, -1.046875, -0.744140625, -0.44140625, -0.138671875, 0.1640625, 0.466796875, 0.76953125, 1.072265625, 1.375, 1.677734375, 1.98046875, 2.283203125, 2.5859375, 2.888671875, 3.19140625, 3.494140625, 3.796875, 4.099609375, 4.40234375, 4.705078125, 5.0078125, 5.310546875, 5.61328125, 5.916015625, 6.21875, 6.521484375, 6.82421875, 7.126953125, 7.4296875, 7.732421875, 8.03515625, 8.337890625, 8.640625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 6.0, 4.0, 0.0, 5.0, 16.0, 18.0, 21.0, 24.0, 35.0, 55.0, 56.0, 98.0, 128.0, 167.0, 200.0, 257.0, 385.0, 450.0, 469.0, 420.0, 344.0, 240.0, 206.0, 125.0, 96.0, 70.0, 52.0, 39.0, 29.0, 24.0, 15.0, 8.0, 10.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9453125, -5.6898193359375, -5.434326171875, -5.1788330078125, -4.92333984375, -4.6678466796875, -4.412353515625, -4.1568603515625, -3.9013671875, -3.6458740234375, -3.390380859375, -3.1348876953125, -2.87939453125, -2.6239013671875, -2.368408203125, -2.1129150390625, -1.857421875, -1.6019287109375, -1.346435546875, -1.0909423828125, -0.83544921875, -0.5799560546875, -0.324462890625, -0.0689697265625, 0.1865234375, 0.4420166015625, 0.697509765625, 0.9530029296875, 1.20849609375, 1.4639892578125, 1.719482421875, 1.9749755859375, 2.23046875, 2.4859619140625, 2.741455078125, 2.9969482421875, 3.25244140625, 3.5079345703125, 3.763427734375, 4.0189208984375, 4.2744140625, 4.5299072265625, 4.785400390625, 5.0408935546875, 5.29638671875, 5.5518798828125, 5.807373046875, 6.0628662109375, 6.318359375, 6.5738525390625, 6.829345703125, 7.0848388671875, 7.34033203125, 7.5958251953125, 7.851318359375, 8.1068115234375, 8.3623046875, 8.6177978515625, 8.873291015625, 9.1287841796875, 9.38427734375, 9.6397705078125, 9.895263671875, 10.1507568359375, 10.40625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 8.0, 3.0, 5.0, 14.0, 17.0, 28.0, 58.0, 109.0, 194.0, 449.0, 1398.0, 6555.0, 62080.0, 1413141.0, 2595083.0, 102806.0, 9487.0, 1763.0, 566.0, 225.0, 136.0, 61.0, 38.0, 26.0, 19.0, 13.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.61474609375, -17.9013671875, -17.18798828125, -16.474609375, -15.76123046875, -15.0478515625, -14.33447265625, -13.62109375, -12.90771484375, -12.1943359375, -11.48095703125, -10.767578125, -10.05419921875, -9.3408203125, -8.62744140625, -7.9140625, -7.20068359375, -6.4873046875, -5.77392578125, -5.060546875, -4.34716796875, -3.6337890625, -2.92041015625, -2.20703125, -1.49365234375, -0.7802734375, -0.06689453125, 0.646484375, 1.35986328125, 2.0732421875, 2.78662109375, 3.5, 4.21337890625, 4.9267578125, 5.64013671875, 6.353515625, 7.06689453125, 7.7802734375, 8.49365234375, 9.20703125, 9.92041015625, 10.6337890625, 11.34716796875, 12.060546875, 12.77392578125, 13.4873046875, 14.20068359375, 14.9140625, 15.62744140625, 16.3408203125, 17.05419921875, 17.767578125, 18.48095703125, 19.1943359375, 19.90771484375, 20.62109375, 21.33447265625, 22.0478515625, 22.76123046875, 23.474609375, 24.18798828125, 24.9013671875, 25.61474609375, 26.328125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 13.0, 25.0, 51.0, 81.0, 111.0, 157.0, 166.0, 139.0, 111.0, 60.0, 44.0, 28.0, 11.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.98526382446289, -27.415998458862305, -25.84673309326172, -24.2774658203125, -22.708202362060547, -21.138935089111328, -19.569669723510742, -18.000404357910156, -16.43113899230957, -14.861873626708984, -13.292608261108398, -11.723341941833496, -10.15407657623291, -8.584811210632324, -7.015544891357422, -5.446279525756836, -3.87701416015625, -2.307748556137085, -0.7384829521179199, 0.8307828903198242, 2.40004825592041, 3.969313621520996, 5.538579940795898, 7.107845306396484, 8.67711067199707, 10.246376037597656, 11.815641403198242, 13.384907722473145, 14.95417308807373, 16.5234375, 18.09270477294922, 19.661970138549805, 21.231231689453125, 22.80049705505371, 24.369762420654297, 25.939029693603516, 27.50829315185547, 29.077560424804688, 30.646825790405273, 32.21609115600586, 33.78535461425781, 35.35462188720703, 36.923885345458984, 38.4931526184082, 40.062416076660156, 41.631683349609375, 43.200950622558594, 44.77021408081055, 46.339481353759766, 47.908748626708984, 49.47801208496094, 51.047279357910156, 52.61654281616211, 54.18581008911133, 55.75507354736328, 57.3243408203125, 58.89360809326172, 60.46287536621094, 62.03213882446289, 63.60140609741211, 65.17066955566406, 66.73993682861328, 68.3092041015625, 69.87846374511719, 71.4477310180664]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 1.0, 7.0, 9.0, 9.0, 14.0, 15.0, 16.0, 25.0, 30.0, 27.0, 32.0, 35.0, 46.0, 46.0, 41.0, 35.0, 43.0, 33.0, 38.0, 56.0, 42.0, 34.0, 34.0, 24.0, 29.0, 40.0, 27.0, 20.0, 25.0, 24.0, 24.0, 25.0, 16.0, 8.0, 10.0, 14.0, 10.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.383392333984375, -23.56831169128418, -22.75322914123535, -21.938148498535156, -21.123065948486328, -20.307985305786133, -19.492904663085938, -18.67782211303711, -17.862741470336914, -17.04766082763672, -16.23257827758789, -15.417497634887695, -14.602416038513184, -13.787334442138672, -12.972253799438477, -12.157172203063965, -11.342090606689453, -10.527009010314941, -9.71192741394043, -8.896846771240234, -8.081765174865723, -7.266683578491211, -6.451602458953857, -5.636521339416504, -4.821439743041992, -4.0063581466674805, -3.191277027130127, -2.3761956691741943, -1.5611143112182617, -0.74603271484375, 0.06904840469360352, 0.884129524230957, 1.6992111206054688, 2.5142924785614014, 3.329373836517334, 4.1444549560546875, 4.959536552429199, 5.774618148803711, 6.5896992683410645, 7.404780387878418, 8.21986198425293, 9.034943580627441, 9.850025177001953, 10.665105819702148, 11.48018741607666, 12.295269012451172, 13.110349655151367, 13.925431251525879, 14.74051284790039, 15.555594444274902, 16.370676040649414, 17.18575668334961, 18.000839233398438, 18.815919876098633, 19.631000518798828, 20.446083068847656, 21.26116371154785, 22.076244354248047, 22.891326904296875, 23.70640754699707, 24.521488189697266, 25.336570739746094, 26.15165138244629, 26.966732025146484, 27.781814575195312]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 11.0, 5.0, 14.0, 19.0, 12.0, 16.0, 22.0, 25.0, 21.0, 26.0, 28.0, 25.0, 23.0, 31.0, 34.0, 39.0, 35.0, 40.0, 51.0, 47.0, 32.0, 47.0, 32.0, 35.0, 38.0, 36.0, 32.0, 19.0, 38.0, 17.0, 17.0, 23.0, 20.0, 16.0, 16.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.92926025390625, -1.8585205078125, -1.78778076171875, -1.717041015625, -1.64630126953125, -1.5755615234375, -1.50482177734375, -1.43408203125, -1.36334228515625, -1.2926025390625, -1.22186279296875, -1.151123046875, -1.08038330078125, -1.0096435546875, -0.93890380859375, -0.8681640625, -0.79742431640625, -0.7266845703125, -0.65594482421875, -0.585205078125, -0.51446533203125, -0.4437255859375, -0.37298583984375, -0.30224609375, -0.23150634765625, -0.1607666015625, -0.09002685546875, -0.019287109375, 0.05145263671875, 0.1221923828125, 0.19293212890625, 0.263671875, 0.33441162109375, 0.4051513671875, 0.47589111328125, 0.546630859375, 0.61737060546875, 0.6881103515625, 0.75885009765625, 0.82958984375, 0.90032958984375, 0.9710693359375, 1.04180908203125, 1.112548828125, 1.18328857421875, 1.2540283203125, 1.32476806640625, 1.3955078125, 1.46624755859375, 1.5369873046875, 1.60772705078125, 1.678466796875, 1.74920654296875, 1.8199462890625, 1.89068603515625, 1.96142578125, 2.03216552734375, 2.1029052734375, 2.17364501953125, 2.244384765625, 2.31512451171875, 2.3858642578125, 2.45660400390625, 2.52734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 8.0, 10.0, 12.0, 25.0, 36.0, 46.0, 74.0, 123.0, 146.0, 227.0, 331.0, 451.0, 664.0, 873.0, 1289.0, 1833.0, 2599.0, 3687.0, 5218.0, 7335.0, 10173.0, 14118.0, 19916.0, 27695.0, 38542.0, 53010.0, 71618.0, 93018.0, 113957.0, 124772.0, 112608.0, 91503.0, 69971.0, 51672.0, 37346.0, 26670.0, 19321.0, 13742.0, 9708.0, 7122.0, 4937.0, 3595.0, 2548.0, 1738.0, 1266.0, 905.0, 665.0, 473.0, 321.0, 183.0, 158.0, 93.0, 80.0, 54.0, 26.0, 28.0, 9.0, 8.0, 9.0, 2.0, 4.0], "bins": [-0.22216796875, -0.21532249450683594, -0.20847702026367188, -0.2016315460205078, -0.19478607177734375, -0.1879405975341797, -0.18109512329101562, -0.17424964904785156, -0.1674041748046875, -0.16055870056152344, -0.15371322631835938, -0.1468677520751953, -0.14002227783203125, -0.1331768035888672, -0.12633132934570312, -0.11948585510253906, -0.112640380859375, -0.10579490661621094, -0.09894943237304688, -0.09210395812988281, -0.08525848388671875, -0.07841300964355469, -0.07156753540039062, -0.06472206115722656, -0.0578765869140625, -0.05103111267089844, -0.044185638427734375, -0.03734016418457031, -0.03049468994140625, -0.023649215698242188, -0.016803741455078125, -0.009958267211914062, -0.00311279296875, 0.0037326812744140625, 0.010578155517578125, 0.017423629760742188, 0.02426910400390625, 0.031114578247070312, 0.037960052490234375, 0.04480552673339844, 0.0516510009765625, 0.05849647521972656, 0.06534194946289062, 0.07218742370605469, 0.07903289794921875, 0.08587837219238281, 0.09272384643554688, 0.09956932067871094, 0.106414794921875, 0.11326026916503906, 0.12010574340820312, 0.1269512176513672, 0.13379669189453125, 0.1406421661376953, 0.14748764038085938, 0.15433311462402344, 0.1611785888671875, 0.16802406311035156, 0.17486953735351562, 0.1817150115966797, 0.18856048583984375, 0.1954059600830078, 0.20225143432617188, 0.20909690856933594, 0.2159423828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 7.0, 8.0, 12.0, 4.0, 18.0, 21.0, 23.0, 26.0, 29.0, 25.0, 29.0, 33.0, 45.0, 34.0, 40.0, 36.0, 29.0, 1071.0, 57.0, 53.0, 51.0, 45.0, 40.0, 38.0, 32.0, 32.0, 35.0, 19.0, 21.0, 14.0, 13.0, 16.0, 10.0, 7.0, 8.0, 8.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4716796875, -1.4220428466796875, -1.372406005859375, -1.3227691650390625, -1.27313232421875, -1.2234954833984375, -1.173858642578125, -1.1242218017578125, -1.0745849609375, -1.0249481201171875, -0.975311279296875, -0.9256744384765625, -0.87603759765625, -0.8264007568359375, -0.776763916015625, -0.7271270751953125, -0.677490234375, -0.6278533935546875, -0.578216552734375, -0.5285797119140625, -0.47894287109375, -0.4293060302734375, -0.379669189453125, -0.3300323486328125, -0.2803955078125, -0.2307586669921875, -0.181121826171875, -0.1314849853515625, -0.08184814453125, -0.0322113037109375, 0.017425537109375, 0.0670623779296875, 0.11669921875, 0.1663360595703125, 0.215972900390625, 0.2656097412109375, 0.31524658203125, 0.3648834228515625, 0.414520263671875, 0.4641571044921875, 0.5137939453125, 0.5634307861328125, 0.613067626953125, 0.6627044677734375, 0.71234130859375, 0.7619781494140625, 0.811614990234375, 0.8612518310546875, 0.910888671875, 0.9605255126953125, 1.010162353515625, 1.0597991943359375, 1.10943603515625, 1.1590728759765625, 1.208709716796875, 1.2583465576171875, 1.3079833984375, 1.3576202392578125, 1.407257080078125, 1.4568939208984375, 1.50653076171875, 1.5561676025390625, 1.605804443359375, 1.6554412841796875, 1.705078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 8.0, 10.0, 21.0, 32.0, 30.0, 56.0, 87.0, 121.0, 169.0, 234.0, 356.0, 561.0, 902.0, 1368.0, 2136.0, 3296.0, 5350.0, 8334.0, 13381.0, 21592.0, 34767.0, 55242.0, 86611.0, 128185.0, 1012532.0, 365840.0, 126089.0, 84409.0, 54426.0, 34304.0, 21086.0, 13201.0, 8084.0, 5070.0, 3247.0, 2043.0, 1291.0, 861.0, 598.0, 381.0, 266.0, 184.0, 130.0, 83.0, 64.0, 36.0, 15.0, 16.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2049560546875, -0.19854736328125, -0.192138671875, -0.18572998046875, -0.1793212890625, -0.17291259765625, -0.16650390625, -0.16009521484375, -0.1536865234375, -0.14727783203125, -0.140869140625, -0.13446044921875, -0.1280517578125, -0.12164306640625, -0.115234375, -0.10882568359375, -0.1024169921875, -0.09600830078125, -0.089599609375, -0.08319091796875, -0.0767822265625, -0.07037353515625, -0.06396484375, -0.05755615234375, -0.0511474609375, -0.04473876953125, -0.038330078125, -0.03192138671875, -0.0255126953125, -0.01910400390625, -0.0126953125, -0.00628662109375, 0.0001220703125, 0.00653076171875, 0.012939453125, 0.01934814453125, 0.0257568359375, 0.03216552734375, 0.03857421875, 0.04498291015625, 0.0513916015625, 0.05780029296875, 0.064208984375, 0.07061767578125, 0.0770263671875, 0.08343505859375, 0.08984375, 0.09625244140625, 0.1026611328125, 0.10906982421875, 0.115478515625, 0.12188720703125, 0.1282958984375, 0.13470458984375, 0.14111328125, 0.14752197265625, 0.1539306640625, 0.16033935546875, 0.166748046875, 0.17315673828125, 0.1795654296875, 0.18597412109375, 0.1923828125, 0.19879150390625, 0.2052001953125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 1.0, 5.0, 8.0, 14.0, 11.0, 14.0, 14.0, 14.0, 23.0, 22.0, 35.0, 30.0, 36.0, 48.0, 41.0, 41.0, 35.0, 47.0, 38.0, 57.0, 56.0, 46.0, 42.0, 49.0, 45.0, 43.0, 18.0, 21.0, 38.0, 20.0, 17.0, 8.0, 15.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010223388671875, -0.0009914636611938477, -0.0009605884552001953, -0.000929713249206543, -0.0008988380432128906, -0.0008679628372192383, -0.0008370876312255859, -0.0008062124252319336, -0.0007753372192382812, -0.0007444620132446289, -0.0007135868072509766, -0.0006827116012573242, -0.0006518363952636719, -0.0006209611892700195, -0.0005900859832763672, -0.0005592107772827148, -0.0005283355712890625, -0.0004974603652954102, -0.0004665851593017578, -0.00043570995330810547, -0.0004048347473144531, -0.0003739595413208008, -0.00034308433532714844, -0.0003122091293334961, -0.00028133392333984375, -0.0002504587173461914, -0.00021958351135253906, -0.00018870830535888672, -0.00015783309936523438, -0.00012695789337158203, -9.608268737792969e-05, -6.520748138427734e-05, -3.4332275390625e-05, -3.4570693969726562e-06, 2.7418136596679688e-05, 5.829334259033203e-05, 8.916854858398438e-05, 0.00012004375457763672, 0.00015091896057128906, 0.0001817941665649414, 0.00021266937255859375, 0.0002435445785522461, 0.00027441978454589844, 0.0003052949905395508, 0.0003361701965332031, 0.00036704540252685547, 0.0003979206085205078, 0.00042879581451416016, 0.0004596710205078125, 0.0004905462265014648, 0.0005214214324951172, 0.0005522966384887695, 0.0005831718444824219, 0.0006140470504760742, 0.0006449222564697266, 0.0006757974624633789, 0.0007066726684570312, 0.0007375478744506836, 0.0007684230804443359, 0.0007992982864379883, 0.0008301734924316406, 0.000861048698425293, 0.0008919239044189453, 0.0009227991104125977, 0.00095367431640625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 11.0, 6.0, 13.0, 16.0, 26.0, 40.0, 33.0, 58.0, 86.0, 108.0, 114.0, 192.0, 370.0, 1444.0, 15230.0, 662852.0, 355502.0, 10366.0, 1088.0, 336.0, 170.0, 116.0, 75.0, 51.0, 40.0, 37.0, 38.0, 25.0, 14.0, 22.0, 10.0, 7.0, 7.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.024200439453125, -0.023487091064453125, -0.02277374267578125, -0.022060394287109375, -0.0213470458984375, -0.020633697509765625, -0.01992034912109375, -0.019207000732421875, -0.01849365234375, -0.017780303955078125, -0.01706695556640625, -0.016353607177734375, -0.0156402587890625, -0.014926910400390625, -0.01421356201171875, -0.013500213623046875, -0.012786865234375, -0.012073516845703125, -0.01136016845703125, -0.010646820068359375, -0.0099334716796875, -0.009220123291015625, -0.00850677490234375, -0.007793426513671875, -0.007080078125, -0.006366729736328125, -0.00565338134765625, -0.004940032958984375, -0.0042266845703125, -0.003513336181640625, -0.00279998779296875, -0.002086639404296875, -0.001373291015625, -0.000659942626953125, 5.340576171875e-05, 0.000766754150390625, 0.0014801025390625, 0.002193450927734375, 0.00290679931640625, 0.003620147705078125, 0.00433349609375, 0.005046844482421875, 0.00576019287109375, 0.006473541259765625, 0.0071868896484375, 0.007900238037109375, 0.00861358642578125, 0.009326934814453125, 0.010040283203125, 0.010753631591796875, 0.01146697998046875, 0.012180328369140625, 0.0128936767578125, 0.013607025146484375, 0.01432037353515625, 0.015033721923828125, 0.0157470703125, 0.016460418701171875, 0.01717376708984375, 0.017887115478515625, 0.0186004638671875, 0.019313812255859375, 0.02002716064453125, 0.020740509033203125, 0.021453857421875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 14.0, 206.0, 677.0, 107.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0265224389731884, -0.026052378118038177, -0.025582315400242805, -0.025112254545092583, -0.02464219182729721, -0.024172130972146988, -0.023702070116996765, -0.023232007399201393, -0.02276194654405117, -0.022291885688900948, -0.021821822971105576, -0.021351762115955353, -0.02088169939815998, -0.020411638543009758, -0.019941575825214386, -0.019471514970064163, -0.01900145411491394, -0.018531393259763718, -0.018061330541968346, -0.017591269686818123, -0.01712120696902275, -0.016651146113872528, -0.016181085258722305, -0.015711022540926933, -0.015240959823131561, -0.014770898036658764, -0.014300836250185966, -0.013830775395035744, -0.013360713608562946, -0.012890651822090149, -0.012420590035617352, -0.011950528249144554, -0.011480468325316906, -0.011010406538844109, -0.010540344752371311, -0.010070282965898514, -0.009600222110748291, -0.009130160324275494, -0.008660098537802696, -0.008190036751329899, -0.0077199749648571014, -0.007249913178384304, -0.006779851857572794, -0.006309790071099997, -0.0058397287502884865, -0.005369666963815689, -0.004899605177342892, -0.004429543390870094, -0.0039594825357198715, -0.0034894209820777178, -0.003019359428435564, -0.0025492976419627666, -0.002079236088320613, -0.0016091745346784592, -0.0011391127482056618, -0.000669051194563508, -0.00019898940809071064, 0.000271072203759104, 0.0007411338156089187, 0.0012111954856663942, 0.001681257039308548, 0.0021513185929507017, 0.002621380379423499, 0.003091441933065653, 0.0035615034867078066]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 8.0, 20.0, 16.0, 20.0, 20.0, 28.0, 35.0, 31.0, 34.0, 46.0, 44.0, 37.0, 45.0, 62.0, 39.0, 57.0, 57.0, 49.0, 52.0, 52.0, 35.0, 34.0, 33.0, 20.0, 22.0, 19.0, 23.0, 10.0, 11.0, 12.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005894899368286133, -0.0005647763609886169, -0.0005400627851486206, -0.0005153492093086243, -0.0004906356334686279, -0.0004659220576286316, -0.00044120848178863525, -0.0004164949059486389, -0.0003917813301086426, -0.00036706775426864624, -0.0003423541784286499, -0.00031764060258865356, -0.0002929270267486572, -0.0002682134509086609, -0.00024349987506866455, -0.0002187862992286682, -0.00019407272338867188, -0.00016935914754867554, -0.0001446455717086792, -0.00011993199586868286, -9.521842002868652e-05, -7.050484418869019e-05, -4.579126834869385e-05, -2.107769250869751e-05, 3.635883331298828e-06, 2.8349459171295166e-05, 5.3063035011291504e-05, 7.777661085128784e-05, 0.00010249018669128418, 0.00012720376253128052, 0.00015191733837127686, 0.0001766309142112732, 0.00020134449005126953, 0.00022605806589126587, 0.0002507716417312622, 0.00027548521757125854, 0.0003001987934112549, 0.0003249123692512512, 0.00034962594509124756, 0.0003743395209312439, 0.00039905309677124023, 0.00042376667261123657, 0.0004484802484512329, 0.00047319382429122925, 0.0004979074001312256, 0.0005226209759712219, 0.0005473345518112183, 0.0005720481276512146, 0.0005967617034912109, 0.0006214752793312073, 0.0006461888551712036, 0.0006709024310112, 0.0006956160068511963, 0.0007203295826911926, 0.000745043158531189, 0.0007697567343711853, 0.0007944703102111816, 0.000819183886051178, 0.0008438974618911743, 0.0008686110377311707, 0.000893324613571167, 0.0009180381894111633, 0.0009427517652511597, 0.000967465341091156, 0.0009921789169311523]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 11.0, 5.0, 14.0, 19.0, 12.0, 16.0, 22.0, 25.0, 21.0, 26.0, 28.0, 25.0, 23.0, 31.0, 34.0, 39.0, 35.0, 40.0, 51.0, 47.0, 32.0, 47.0, 32.0, 35.0, 38.0, 36.0, 32.0, 19.0, 38.0, 17.0, 17.0, 23.0, 20.0, 16.0, 16.0, 11.0, 7.0, 6.0, 7.0, 7.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.92926025390625, -1.8585205078125, -1.78778076171875, -1.717041015625, -1.64630126953125, -1.5755615234375, -1.50482177734375, -1.43408203125, -1.36334228515625, -1.2926025390625, -1.22186279296875, -1.151123046875, -1.08038330078125, -1.0096435546875, -0.93890380859375, -0.8681640625, -0.79742431640625, -0.7266845703125, -0.65594482421875, -0.585205078125, -0.51446533203125, -0.4437255859375, -0.37298583984375, -0.30224609375, -0.23150634765625, -0.1607666015625, -0.09002685546875, -0.019287109375, 0.05145263671875, 0.1221923828125, 0.19293212890625, 0.263671875, 0.33441162109375, 0.4051513671875, 0.47589111328125, 0.546630859375, 0.61737060546875, 0.6881103515625, 0.75885009765625, 0.82958984375, 0.90032958984375, 0.9710693359375, 1.04180908203125, 1.112548828125, 1.18328857421875, 1.2540283203125, 1.32476806640625, 1.3955078125, 1.46624755859375, 1.5369873046875, 1.60772705078125, 1.678466796875, 1.74920654296875, 1.8199462890625, 1.89068603515625, 1.96142578125, 2.03216552734375, 2.1029052734375, 2.17364501953125, 2.244384765625, 2.31512451171875, 2.3858642578125, 2.45660400390625, 2.52734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 8.0, 12.0, 23.0, 34.0, 46.0, 80.0, 110.0, 230.0, 447.0, 765.0, 1352.0, 2405.0, 4274.0, 8127.0, 16028.0, 36311.0, 113795.0, 484418.0, 266419.0, 64033.0, 24312.0, 11644.0, 6031.0, 3389.0, 1799.0, 1012.0, 600.0, 362.0, 176.0, 120.0, 65.0, 39.0, 34.0, 18.0, 12.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.865234375, -2.7803955078125, -2.695556640625, -2.6107177734375, -2.52587890625, -2.4410400390625, -2.356201171875, -2.2713623046875, -2.1865234375, -2.1016845703125, -2.016845703125, -1.9320068359375, -1.84716796875, -1.7623291015625, -1.677490234375, -1.5926513671875, -1.5078125, -1.4229736328125, -1.338134765625, -1.2532958984375, -1.16845703125, -1.0836181640625, -0.998779296875, -0.9139404296875, -0.8291015625, -0.7442626953125, -0.659423828125, -0.5745849609375, -0.48974609375, -0.4049072265625, -0.320068359375, -0.2352294921875, -0.150390625, -0.0655517578125, 0.019287109375, 0.1041259765625, 0.18896484375, 0.2738037109375, 0.358642578125, 0.4434814453125, 0.5283203125, 0.6131591796875, 0.697998046875, 0.7828369140625, 0.86767578125, 0.9525146484375, 1.037353515625, 1.1221923828125, 1.20703125, 1.2918701171875, 1.376708984375, 1.4615478515625, 1.54638671875, 1.6312255859375, 1.716064453125, 1.8009033203125, 1.8857421875, 1.9705810546875, 2.055419921875, 2.1402587890625, 2.22509765625, 2.3099365234375, 2.394775390625, 2.4796142578125, 2.564453125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 5.0, 7.0, 7.0, 17.0, 10.0, 18.0, 13.0, 25.0, 33.0, 27.0, 31.0, 30.0, 48.0, 41.0, 43.0, 52.0, 63.0, 117.0, 237.0, 1598.0, 126.0, 69.0, 44.0, 44.0, 34.0, 38.0, 24.0, 29.0, 27.0, 27.0, 20.0, 17.0, 14.0, 8.0, 13.0, 13.0, 13.0, 9.0, 9.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.74609375, -6.50726318359375, -6.2684326171875, -6.02960205078125, -5.790771484375, -5.55194091796875, -5.3131103515625, -5.07427978515625, -4.83544921875, -4.59661865234375, -4.3577880859375, -4.11895751953125, -3.880126953125, -3.64129638671875, -3.4024658203125, -3.16363525390625, -2.9248046875, -2.68597412109375, -2.4471435546875, -2.20831298828125, -1.969482421875, -1.73065185546875, -1.4918212890625, -1.25299072265625, -1.01416015625, -0.77532958984375, -0.5364990234375, -0.29766845703125, -0.058837890625, 0.17999267578125, 0.4188232421875, 0.65765380859375, 0.896484375, 1.13531494140625, 1.3741455078125, 1.61297607421875, 1.851806640625, 2.09063720703125, 2.3294677734375, 2.56829833984375, 2.80712890625, 3.04595947265625, 3.2847900390625, 3.52362060546875, 3.762451171875, 4.00128173828125, 4.2401123046875, 4.47894287109375, 4.7177734375, 4.95660400390625, 5.1954345703125, 5.43426513671875, 5.673095703125, 5.91192626953125, 6.1507568359375, 6.38958740234375, 6.62841796875, 6.86724853515625, 7.1060791015625, 7.34490966796875, 7.583740234375, 7.82257080078125, 8.0614013671875, 8.30023193359375, 8.5390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 8.0, 7.0, 19.0, 10.0, 15.0, 16.0, 14.0, 26.0, 28.0, 41.0, 71.0, 78.0, 158.0, 274.0, 545.0, 1129.0, 3636.0, 19534.0, 545822.0, 2531742.0, 34274.0, 5260.0, 1561.0, 593.0, 284.0, 168.0, 105.0, 63.0, 51.0, 35.0, 35.0, 20.0, 26.0, 12.0, 12.0, 6.0, 5.0, 6.0, 6.0, 7.0, 4.0, 6.0], "bins": [-18.53125, -18.08056640625, -17.6298828125, -17.17919921875, -16.728515625, -16.27783203125, -15.8271484375, -15.37646484375, -14.92578125, -14.47509765625, -14.0244140625, -13.57373046875, -13.123046875, -12.67236328125, -12.2216796875, -11.77099609375, -11.3203125, -10.86962890625, -10.4189453125, -9.96826171875, -9.517578125, -9.06689453125, -8.6162109375, -8.16552734375, -7.71484375, -7.26416015625, -6.8134765625, -6.36279296875, -5.912109375, -5.46142578125, -5.0107421875, -4.56005859375, -4.109375, -3.65869140625, -3.2080078125, -2.75732421875, -2.306640625, -1.85595703125, -1.4052734375, -0.95458984375, -0.50390625, -0.05322265625, 0.3974609375, 0.84814453125, 1.298828125, 1.74951171875, 2.2001953125, 2.65087890625, 3.1015625, 3.55224609375, 4.0029296875, 4.45361328125, 4.904296875, 5.35498046875, 5.8056640625, 6.25634765625, 6.70703125, 7.15771484375, 7.6083984375, 8.05908203125, 8.509765625, 8.96044921875, 9.4111328125, 9.86181640625, 10.3125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 21.0, 86.0, 216.0, 317.0, 240.0, 88.0, 28.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.368688583374023, -12.221512794494629, -11.07433795928955, -9.927162170410156, -8.779987335205078, -7.632811546325684, -6.485635757446289, -5.338460922241211, -4.191285133361816, -3.04410982131958, -1.8969342708587646, -0.7497587203979492, 0.3974165916442871, 1.5445919036865234, 2.691767692565918, 3.838942527770996, 4.986118316650391, 6.133293628692627, 7.280468940734863, 8.427644729614258, 9.574819564819336, 10.72199535369873, 11.869171142578125, 13.016345977783203, 14.163521766662598, 15.310697555541992, 16.45787239074707, 17.60504913330078, 18.75222396850586, 19.899398803710938, 21.046573638916016, 22.193748474121094, 23.340927124023438, 24.488101959228516, 25.635278701782227, 26.782453536987305, 27.929628372192383, 29.076805114746094, 30.223979949951172, 31.37115478515625, 32.51832962036133, 33.665504455566406, 34.812679290771484, 35.95985412597656, 37.107032775878906, 38.254207611083984, 39.40138244628906, 40.54855728149414, 41.69573211669922, 42.8429069519043, 43.990081787109375, 45.13726043701172, 46.2844352722168, 47.431610107421875, 48.57878494262695, 49.72595977783203, 50.873138427734375, 52.02031326293945, 53.16748809814453, 54.314666748046875, 55.46184158325195, 56.60901641845703, 57.75619125366211, 58.90336608886719, 60.050540924072266]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 8.0, 5.0, 11.0, 15.0, 17.0, 19.0, 15.0, 21.0, 23.0, 35.0, 29.0, 29.0, 32.0, 46.0, 52.0, 49.0, 44.0, 38.0, 52.0, 46.0, 39.0, 46.0, 33.0, 26.0, 30.0, 32.0, 36.0, 18.0, 27.0, 16.0, 17.0, 14.0, 13.0, 19.0, 10.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.566871643066406, -26.690608978271484, -25.81434440612793, -24.938081741333008, -24.061817169189453, -23.18555450439453, -22.30929183959961, -21.433027267456055, -20.556764602661133, -19.68050193786621, -18.804237365722656, -17.927974700927734, -17.05171012878418, -16.175447463989258, -15.29918384552002, -14.422920227050781, -13.546656608581543, -12.670392990112305, -11.794129371643066, -10.917865753173828, -10.041603088378906, -9.165339469909668, -8.28907585144043, -7.41281270980835, -6.536549091339111, -5.660285472869873, -4.784022331237793, -3.9077587127685547, -3.0314953327178955, -2.1552319526672363, -1.278968334197998, -0.40270519256591797, 0.4735584259033203, 1.3498218059539795, 2.2260851860046387, 3.102348804473877, 3.978612184524536, 4.854875564575195, 5.731139183044434, 6.607402324676514, 7.483665943145752, 8.359929084777832, 9.23619270324707, 10.112456321716309, 10.988719940185547, 11.864982604980469, 12.741247177124023, 13.617509841918945, 14.493773460388184, 15.370037078857422, 16.246299743652344, 17.1225643157959, 17.99882698059082, 18.875091552734375, 19.751354217529297, 20.62761688232422, 21.503881454467773, 22.380144119262695, 23.25640869140625, 24.132671356201172, 25.008935928344727, 25.88519859313965, 26.761463165283203, 27.637725830078125, 28.513988494873047]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 5.0, 5.0, 7.0, 6.0, 13.0, 19.0, 13.0, 11.0, 19.0, 23.0, 19.0, 25.0, 28.0, 28.0, 26.0, 28.0, 35.0, 33.0, 35.0, 40.0, 44.0, 47.0, 42.0, 37.0, 42.0, 34.0, 37.0, 29.0, 43.0, 33.0, 29.0, 17.0, 19.0, 27.0, 13.0, 16.0, 18.0, 15.0, 6.0, 5.0, 7.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.034027099609375, -1.96063232421875, -1.887237548828125, -1.8138427734375, -1.740447998046875, -1.66705322265625, -1.593658447265625, -1.520263671875, -1.446868896484375, -1.37347412109375, -1.300079345703125, -1.2266845703125, -1.153289794921875, -1.07989501953125, -1.006500244140625, -0.93310546875, -0.859710693359375, -0.78631591796875, -0.712921142578125, -0.6395263671875, -0.566131591796875, -0.49273681640625, -0.419342041015625, -0.345947265625, -0.272552490234375, -0.19915771484375, -0.125762939453125, -0.0523681640625, 0.021026611328125, 0.09442138671875, 0.167816162109375, 0.2412109375, 0.314605712890625, 0.38800048828125, 0.461395263671875, 0.5347900390625, 0.608184814453125, 0.68157958984375, 0.754974365234375, 0.828369140625, 0.901763916015625, 0.97515869140625, 1.048553466796875, 1.1219482421875, 1.195343017578125, 1.26873779296875, 1.342132568359375, 1.41552734375, 1.488922119140625, 1.56231689453125, 1.635711669921875, 1.7091064453125, 1.782501220703125, 1.85589599609375, 1.929290771484375, 2.002685546875, 2.076080322265625, 2.14947509765625, 2.222869873046875, 2.2962646484375, 2.369659423828125, 2.44305419921875, 2.516448974609375, 2.58984375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 8.0, 3.0, 3.0, 8.0, 8.0, 7.0, 10.0, 18.0, 22.0, 17.0, 32.0, 42.0, 43.0, 43.0, 78.0, 84.0, 149.0, 291.0, 765.0, 2499.0, 8142.0, 31866.0, 178035.0, 2098984.0, 1687693.0, 147619.0, 27349.0, 6851.0, 2062.0, 713.0, 271.0, 150.0, 93.0, 71.0, 43.0, 53.0, 28.0, 23.0, 17.0, 16.0, 21.0, 17.0, 8.0, 4.0, 6.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9375, -8.6287841796875, -8.320068359375, -8.0113525390625, -7.70263671875, -7.3939208984375, -7.085205078125, -6.7764892578125, -6.4677734375, -6.1590576171875, -5.850341796875, -5.5416259765625, -5.23291015625, -4.9241943359375, -4.615478515625, -4.3067626953125, -3.998046875, -3.6893310546875, -3.380615234375, -3.0718994140625, -2.76318359375, -2.4544677734375, -2.145751953125, -1.8370361328125, -1.5283203125, -1.2196044921875, -0.910888671875, -0.6021728515625, -0.29345703125, 0.0152587890625, 0.323974609375, 0.6326904296875, 0.94140625, 1.2501220703125, 1.558837890625, 1.8675537109375, 2.17626953125, 2.4849853515625, 2.793701171875, 3.1024169921875, 3.4111328125, 3.7198486328125, 4.028564453125, 4.3372802734375, 4.64599609375, 4.9547119140625, 5.263427734375, 5.5721435546875, 5.880859375, 6.1895751953125, 6.498291015625, 6.8070068359375, 7.11572265625, 7.4244384765625, 7.733154296875, 8.0418701171875, 8.3505859375, 8.6593017578125, 8.968017578125, 9.2767333984375, 9.58544921875, 9.8941650390625, 10.202880859375, 10.5115966796875, 10.8203125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 14.0, 18.0, 26.0, 33.0, 47.0, 60.0, 84.0, 110.0, 155.0, 203.0, 267.0, 415.0, 441.0, 487.0, 429.0, 321.0, 253.0, 187.0, 139.0, 103.0, 71.0, 56.0, 30.0, 34.0, 21.0, 16.0, 6.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.6015625, -10.3377685546875, -10.073974609375, -9.8101806640625, -9.54638671875, -9.2825927734375, -9.018798828125, -8.7550048828125, -8.4912109375, -8.2274169921875, -7.963623046875, -7.6998291015625, -7.43603515625, -7.1722412109375, -6.908447265625, -6.6446533203125, -6.380859375, -6.1170654296875, -5.853271484375, -5.5894775390625, -5.32568359375, -5.0618896484375, -4.798095703125, -4.5343017578125, -4.2705078125, -4.0067138671875, -3.742919921875, -3.4791259765625, -3.21533203125, -2.9515380859375, -2.687744140625, -2.4239501953125, -2.16015625, -1.8963623046875, -1.632568359375, -1.3687744140625, -1.10498046875, -0.8411865234375, -0.577392578125, -0.3135986328125, -0.0498046875, 0.2139892578125, 0.477783203125, 0.7415771484375, 1.00537109375, 1.2691650390625, 1.532958984375, 1.7967529296875, 2.060546875, 2.3243408203125, 2.588134765625, 2.8519287109375, 3.11572265625, 3.3795166015625, 3.643310546875, 3.9071044921875, 4.1708984375, 4.4346923828125, 4.698486328125, 4.9622802734375, 5.22607421875, 5.4898681640625, 5.753662109375, 6.0174560546875, 6.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 9.0, 8.0, 14.0, 17.0, 20.0, 33.0, 60.0, 87.0, 109.0, 200.0, 299.0, 580.0, 1436.0, 4692.0, 25354.0, 229115.0, 2929243.0, 914420.0, 73730.0, 10385.0, 2457.0, 888.0, 454.0, 224.0, 144.0, 89.0, 70.0, 55.0, 30.0, 22.0, 8.0, 7.0, 11.0, 10.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.9207763671875, -14.318115234375, -13.7154541015625, -13.11279296875, -12.5101318359375, -11.907470703125, -11.3048095703125, -10.7021484375, -10.0994873046875, -9.496826171875, -8.8941650390625, -8.29150390625, -7.6888427734375, -7.086181640625, -6.4835205078125, -5.880859375, -5.2781982421875, -4.675537109375, -4.0728759765625, -3.47021484375, -2.8675537109375, -2.264892578125, -1.6622314453125, -1.0595703125, -0.4569091796875, 0.145751953125, 0.7484130859375, 1.35107421875, 1.9537353515625, 2.556396484375, 3.1590576171875, 3.76171875, 4.3643798828125, 4.967041015625, 5.5697021484375, 6.17236328125, 6.7750244140625, 7.377685546875, 7.9803466796875, 8.5830078125, 9.1856689453125, 9.788330078125, 10.3909912109375, 10.99365234375, 11.5963134765625, 12.198974609375, 12.8016357421875, 13.404296875, 14.0069580078125, 14.609619140625, 15.2122802734375, 15.81494140625, 16.4176025390625, 17.020263671875, 17.6229248046875, 18.2255859375, 18.8282470703125, 19.430908203125, 20.0335693359375, 20.63623046875, 21.2388916015625, 21.841552734375, 22.4442138671875, 23.046875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 17.0, 36.0, 65.0, 114.0, 164.0, 176.0, 150.0, 140.0, 69.0, 37.0, 18.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.77677917480469, -64.78504943847656, -62.79331970214844, -60.80158996582031, -58.80986404418945, -56.81813430786133, -54.8264045715332, -52.83467483520508, -50.84294891357422, -48.851219177246094, -46.85948944091797, -44.867759704589844, -42.876033782958984, -40.88430404663086, -38.892574310302734, -36.90084457397461, -34.909114837646484, -32.91738510131836, -30.925657272338867, -28.933927536010742, -26.94219970703125, -24.950469970703125, -22.958740234375, -20.967010498046875, -18.975282669067383, -16.983552932739258, -14.991825103759766, -13.00009536743164, -11.008366584777832, -9.016637802124023, -7.024908065795898, -5.03317928314209, -3.0414466857910156, -1.049717664718628, 0.9420113563537598, 2.9337406158447266, 4.925469398498535, 6.917198181152344, 8.908927917480469, 10.900656700134277, 12.892385482788086, 14.884114265441895, 16.875843048095703, 18.867572784423828, 20.859302520751953, 22.851030349731445, 24.84276008605957, 26.834487915039062, 28.826217651367188, 30.817947387695312, 32.80967712402344, 34.80140686035156, 36.79313278198242, 38.78486251831055, 40.77659225463867, 42.7683219909668, 44.760047912597656, 46.75177764892578, 48.743507385253906, 50.73523712158203, 52.72696304321289, 54.718692779541016, 56.71042251586914, 58.702152252197266, 60.69388198852539]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 10.0, 16.0, 16.0, 18.0, 19.0, 21.0, 20.0, 26.0, 28.0, 38.0, 45.0, 35.0, 30.0, 46.0, 35.0, 39.0, 41.0, 44.0, 43.0, 35.0, 31.0, 41.0, 40.0, 30.0, 38.0, 25.0, 22.0, 14.0, 12.0, 13.0, 20.0, 17.0, 18.0, 13.0, 7.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.56378173828125, -26.69440460205078, -25.825027465820312, -24.955650329589844, -24.086273193359375, -23.216896057128906, -22.347518920898438, -21.47814178466797, -20.6087646484375, -19.73938751220703, -18.870010375976562, -18.000633239746094, -17.131256103515625, -16.261878967285156, -15.392501831054688, -14.523124694824219, -13.65374755859375, -12.784370422363281, -11.914993286132812, -11.045616149902344, -10.176239013671875, -9.306861877441406, -8.437484741210938, -7.568107604980469, -6.69873046875, -5.829353332519531, -4.9599761962890625, -4.090599060058594, -3.221221923828125, -2.3518447875976562, -1.4824676513671875, -0.6130905151367188, 0.25628662109375, 1.1256637573242188, 1.9950408935546875, 2.8644180297851562, 3.733795166015625, 4.603172302246094, 5.4725494384765625, 6.341926574707031, 7.2113037109375, 8.080680847167969, 8.950057983398438, 9.819435119628906, 10.688812255859375, 11.558189392089844, 12.427566528320312, 13.296943664550781, 14.16632080078125, 15.035697937011719, 15.905075073242188, 16.774452209472656, 17.643829345703125, 18.513206481933594, 19.382583618164062, 20.25196075439453, 21.121337890625, 21.99071502685547, 22.860092163085938, 23.729469299316406, 24.598846435546875, 25.468223571777344, 26.337600708007812, 27.20697784423828, 28.07635498046875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 8.0, 8.0, 9.0, 13.0, 21.0, 12.0, 14.0, 24.0, 19.0, 31.0, 29.0, 28.0, 30.0, 31.0, 30.0, 36.0, 35.0, 36.0, 39.0, 40.0, 37.0, 37.0, 47.0, 38.0, 35.0, 36.0, 25.0, 28.0, 19.0, 25.0, 29.0, 20.0, 24.0, 7.0, 13.0, 9.0, 14.0, 11.0, 10.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9443359375, -1.8712615966796875, -1.798187255859375, -1.7251129150390625, -1.65203857421875, -1.5789642333984375, -1.505889892578125, -1.4328155517578125, -1.3597412109375, -1.2866668701171875, -1.213592529296875, -1.1405181884765625, -1.06744384765625, -0.9943695068359375, -0.921295166015625, -0.8482208251953125, -0.775146484375, -0.7020721435546875, -0.628997802734375, -0.5559234619140625, -0.48284912109375, -0.4097747802734375, -0.336700439453125, -0.2636260986328125, -0.1905517578125, -0.1174774169921875, -0.044403076171875, 0.0286712646484375, 0.10174560546875, 0.1748199462890625, 0.247894287109375, 0.3209686279296875, 0.39404296875, 0.4671173095703125, 0.540191650390625, 0.6132659912109375, 0.68634033203125, 0.7594146728515625, 0.832489013671875, 0.9055633544921875, 0.9786376953125, 1.0517120361328125, 1.124786376953125, 1.1978607177734375, 1.27093505859375, 1.3440093994140625, 1.417083740234375, 1.4901580810546875, 1.563232421875, 1.6363067626953125, 1.709381103515625, 1.7824554443359375, 1.85552978515625, 1.9286041259765625, 2.001678466796875, 2.0747528076171875, 2.1478271484375, 2.2209014892578125, 2.293975830078125, 2.3670501708984375, 2.44012451171875, 2.5131988525390625, 2.586273193359375, 2.6593475341796875, 2.732421875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 13.0, 26.0, 24.0, 49.0, 72.0, 106.0, 173.0, 244.0, 387.0, 547.0, 848.0, 1152.0, 1794.0, 2705.0, 3884.0, 6025.0, 8923.0, 13030.0, 19534.0, 29039.0, 42398.0, 61555.0, 87450.0, 118289.0, 145158.0, 139889.0, 110411.0, 80356.0, 56747.0, 38043.0, 25989.0, 17576.0, 11868.0, 7935.0, 5322.0, 3629.0, 2464.0, 1614.0, 1032.0, 741.0, 479.0, 331.0, 252.0, 138.0, 117.0, 67.0, 53.0, 30.0, 24.0, 10.0, 5.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.302734375, -0.2937965393066406, -0.28485870361328125, -0.2759208679199219, -0.2669830322265625, -0.2580451965332031, -0.24910736083984375, -0.24016952514648438, -0.231231689453125, -0.22229385375976562, -0.21335601806640625, -0.20441818237304688, -0.1954803466796875, -0.18654251098632812, -0.17760467529296875, -0.16866683959960938, -0.15972900390625, -0.15079116821289062, -0.14185333251953125, -0.13291549682617188, -0.1239776611328125, -0.11503982543945312, -0.10610198974609375, -0.09716415405273438, -0.088226318359375, -0.07928848266601562, -0.07035064697265625, -0.061412811279296875, -0.0524749755859375, -0.043537139892578125, -0.03459930419921875, -0.025661468505859375, -0.0167236328125, -0.007785797119140625, 0.00115203857421875, 0.010089874267578125, 0.0190277099609375, 0.027965545654296875, 0.03690338134765625, 0.045841217041015625, 0.054779052734375, 0.06371688842773438, 0.07265472412109375, 0.08159255981445312, 0.0905303955078125, 0.09946823120117188, 0.10840606689453125, 0.11734390258789062, 0.12628173828125, 0.13521957397460938, 0.14415740966796875, 0.15309524536132812, 0.1620330810546875, 0.17097091674804688, 0.17990875244140625, 0.18884658813476562, 0.197784423828125, 0.20672225952148438, 0.21566009521484375, 0.22459793090820312, 0.2335357666015625, 0.24247360229492188, 0.25141143798828125, 0.2603492736816406, 0.269287109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 5.0, 9.0, 12.0, 16.0, 15.0, 10.0, 8.0, 21.0, 19.0, 31.0, 19.0, 39.0, 32.0, 41.0, 37.0, 37.0, 51.0, 59.0, 43.0, 1054.0, 35.0, 31.0, 37.0, 36.0, 33.0, 38.0, 35.0, 39.0, 31.0, 28.0, 17.0, 20.0, 15.0, 10.0, 11.0, 10.0, 6.0, 6.0, 6.0, 5.0, 1.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4468994140625, -1.393798828125, -1.3406982421875, -1.28759765625, -1.2344970703125, -1.181396484375, -1.1282958984375, -1.0751953125, -1.0220947265625, -0.968994140625, -0.9158935546875, -0.86279296875, -0.8096923828125, -0.756591796875, -0.7034912109375, -0.650390625, -0.5972900390625, -0.544189453125, -0.4910888671875, -0.43798828125, -0.3848876953125, -0.331787109375, -0.2786865234375, -0.2255859375, -0.1724853515625, -0.119384765625, -0.0662841796875, -0.01318359375, 0.0399169921875, 0.093017578125, 0.1461181640625, 0.19921875, 0.2523193359375, 0.305419921875, 0.3585205078125, 0.41162109375, 0.4647216796875, 0.517822265625, 0.5709228515625, 0.6240234375, 0.6771240234375, 0.730224609375, 0.7833251953125, 0.83642578125, 0.8895263671875, 0.942626953125, 0.9957275390625, 1.048828125, 1.1019287109375, 1.155029296875, 1.2081298828125, 1.26123046875, 1.3143310546875, 1.367431640625, 1.4205322265625, 1.4736328125, 1.5267333984375, 1.579833984375, 1.6329345703125, 1.68603515625, 1.7391357421875, 1.792236328125, 1.8453369140625, 1.8984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 9.0, 3.0, 6.0, 9.0, 14.0, 23.0, 38.0, 66.0, 68.0, 113.0, 154.0, 225.0, 298.0, 479.0, 738.0, 1032.0, 1590.0, 2459.0, 3770.0, 5652.0, 8646.0, 13682.0, 21226.0, 33041.0, 51507.0, 78181.0, 113812.0, 149207.0, 1207617.0, 131314.0, 94180.0, 62540.0, 40792.0, 26590.0, 16805.0, 10918.0, 6935.0, 4476.0, 2986.0, 1965.0, 1294.0, 832.0, 547.0, 431.0, 265.0, 194.0, 128.0, 92.0, 68.0, 39.0, 24.0, 18.0, 14.0, 11.0, 6.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.19970703125, -0.1933135986328125, -0.186920166015625, -0.1805267333984375, -0.17413330078125, -0.1677398681640625, -0.161346435546875, -0.1549530029296875, -0.1485595703125, -0.1421661376953125, -0.135772705078125, -0.1293792724609375, -0.12298583984375, -0.1165924072265625, -0.110198974609375, -0.1038055419921875, -0.097412109375, -0.0910186767578125, -0.084625244140625, -0.0782318115234375, -0.07183837890625, -0.0654449462890625, -0.059051513671875, -0.0526580810546875, -0.0462646484375, -0.0398712158203125, -0.033477783203125, -0.0270843505859375, -0.02069091796875, -0.0142974853515625, -0.007904052734375, -0.0015106201171875, 0.0048828125, 0.0112762451171875, 0.017669677734375, 0.0240631103515625, 0.03045654296875, 0.0368499755859375, 0.043243408203125, 0.0496368408203125, 0.0560302734375, 0.0624237060546875, 0.068817138671875, 0.0752105712890625, 0.08160400390625, 0.0879974365234375, 0.094390869140625, 0.1007843017578125, 0.107177734375, 0.1135711669921875, 0.119964599609375, 0.1263580322265625, 0.13275146484375, 0.1391448974609375, 0.145538330078125, 0.1519317626953125, 0.1583251953125, 0.1647186279296875, 0.171112060546875, 0.1775054931640625, 0.18389892578125, 0.1902923583984375, 0.196685791015625, 0.2030792236328125, 0.20947265625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 10.0, 12.0, 15.0, 23.0, 35.0, 48.0, 50.0, 77.0, 82.0, 99.0, 99.0, 104.0, 92.0, 75.0, 41.0, 38.0, 30.0, 19.0, 9.0, 13.0, 6.0, 3.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0022735595703125, -0.0022094398736953735, -0.002145320177078247, -0.0020812004804611206, -0.002017080783843994, -0.0019529610872268677, -0.0018888413906097412, -0.0018247216939926147, -0.0017606019973754883, -0.0016964823007583618, -0.0016323626041412354, -0.0015682429075241089, -0.0015041232109069824, -0.001440003514289856, -0.0013758838176727295, -0.001311764121055603, -0.0012476444244384766, -0.00118352472782135, -0.0011194050312042236, -0.0010552853345870972, -0.0009911656379699707, -0.0009270459413528442, -0.0008629262447357178, -0.0007988065481185913, -0.0007346868515014648, -0.0006705671548843384, -0.0006064474582672119, -0.0005423277616500854, -0.000478208065032959, -0.0004140883684158325, -0.00034996867179870605, -0.0002858489751815796, -0.00022172927856445312, -0.00015760958194732666, -9.34898853302002e-05, -2.937018871307373e-05, 3.4749507904052734e-05, 9.88692045211792e-05, 0.00016298890113830566, 0.00022710859775543213, 0.0002912282943725586, 0.00035534799098968506, 0.0004194676876068115, 0.000483587384223938, 0.0005477070808410645, 0.0006118267774581909, 0.0006759464740753174, 0.0007400661706924438, 0.0008041858673095703, 0.0008683055639266968, 0.0009324252605438232, 0.0009965449571609497, 0.0010606646537780762, 0.0011247843503952026, 0.001188904047012329, 0.0012530237436294556, 0.001317143440246582, 0.0013812631368637085, 0.001445382833480835, 0.0015095025300979614, 0.0015736222267150879, 0.0016377419233322144, 0.0017018616199493408, 0.0017659813165664673, 0.0018301010131835938]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 8.0, 5.0, 15.0, 16.0, 18.0, 23.0, 47.0, 37.0, 94.0, 124.0, 192.0, 358.0, 1277.0, 15769.0, 737461.0, 283391.0, 8012.0, 863.0, 256.0, 168.0, 123.0, 77.0, 51.0, 37.0, 36.0, 16.0, 14.0, 9.0, 9.0, 8.0, 9.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.031690120697021484, -0.03072643280029297, -0.029762744903564453, -0.028799057006835938, -0.027835369110107422, -0.026871681213378906, -0.02590799331665039, -0.024944305419921875, -0.02398061752319336, -0.023016929626464844, -0.022053241729736328, -0.021089553833007812, -0.020125865936279297, -0.01916217803955078, -0.018198490142822266, -0.01723480224609375, -0.016271114349365234, -0.015307426452636719, -0.014343738555908203, -0.013380050659179688, -0.012416362762451172, -0.011452674865722656, -0.01048898696899414, -0.009525299072265625, -0.00856161117553711, -0.007597923278808594, -0.006634235382080078, -0.0056705474853515625, -0.004706859588623047, -0.0037431716918945312, -0.0027794837951660156, -0.0018157958984375, -0.0008521080017089844, 0.00011157989501953125, 0.0010752677917480469, 0.0020389556884765625, 0.003002643585205078, 0.003966331481933594, 0.004930019378662109, 0.005893707275390625, 0.006857395172119141, 0.007821083068847656, 0.008784770965576172, 0.009748458862304688, 0.010712146759033203, 0.011675834655761719, 0.012639522552490234, 0.01360321044921875, 0.014566898345947266, 0.015530586242675781, 0.016494274139404297, 0.017457962036132812, 0.018421649932861328, 0.019385337829589844, 0.02034902572631836, 0.021312713623046875, 0.02227640151977539, 0.023240089416503906, 0.024203777313232422, 0.025167465209960938, 0.026131153106689453, 0.02709484100341797, 0.028058528900146484, 0.029022216796875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 6.0, 7.0, 17.0, 18.0, 35.0, 99.0, 165.0, 233.0, 202.0, 113.0, 67.0, 25.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00420135073363781, -0.00405042665079236, -0.003899502335116267, -0.003748578019440174, -0.0035976539365947247, -0.0034467296209186316, -0.0032958053052425385, -0.003144881222397089, -0.002993956906720996, -0.002843032591044903, -0.0026921085081994534, -0.0025411841925233603, -0.002390259876847267, -0.0022393357940018177, -0.0020884114783257246, -0.0019374872790649533, -0.001786563079804182, -0.0016356388805434108, -0.0014847146812826395, -0.0013337903656065464, -0.0011828661663457751, -0.0010319419670850039, -0.0008810177096165717, -0.0007300934521481395, -0.0005791692528873682, -0.00042824502452276647, -0.00027732079615816474, -0.000126396567793563, 2.4527660571038723e-05, 0.00017545185983181, 0.0003263761173002422, 0.0004773003747686744, 0.0006282245740294456, 0.0007791487732902169, 0.0009300730307586491, 0.0010809972882270813, 0.0012319214874878526, 0.0013828456867486238, 0.001533770002424717, 0.0016846942016854882, 0.0018356184009462595, 0.0019865427166223526, 0.002137466799467802, 0.002288391115143895, 0.0024393154308199883, 0.0025902395136654377, 0.002741163829341531, 0.002892088145017624, 0.0030430122278630733, 0.0031939365435391665, 0.003344860626384616, 0.003495784942060709, 0.0036467090249061584, 0.0037976333405822515, 0.003948557656258345, 0.004099481739103794, 0.004250406287610531, 0.00440133037045598, 0.004552254918962717, 0.0047031790018081665, 0.004854103084653616, 0.005005027167499065, 0.005155951716005802, 0.005306875798851252, 0.005457799881696701]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 13.0, 7.0, 13.0, 19.0, 17.0, 19.0, 18.0, 28.0, 23.0, 38.0, 35.0, 38.0, 33.0, 45.0, 46.0, 47.0, 44.0, 42.0, 25.0, 33.0, 26.0, 45.0, 37.0, 46.0, 32.0, 27.0, 23.0, 32.0, 17.0, 16.0, 21.0, 17.0, 11.0, 10.0, 8.0, 11.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011556148529052734, -0.001118888147175312, -0.0010821614414453506, -0.0010454347357153893, -0.0010087080299854279, -0.0009719813242554665, -0.0009352546185255051, -0.0008985279127955437, -0.0008618012070655823, -0.0008250745013356209, -0.0007883477956056595, -0.0007516210898756981, -0.0007148943841457367, -0.0006781676784157753, -0.0006414409726858139, -0.0006047142669558525, -0.0005679875612258911, -0.0005312608554959297, -0.0004945341497659683, -0.00045780744403600693, -0.00042108073830604553, -0.00038435403257608414, -0.00034762732684612274, -0.00031090062111616135, -0.00027417391538619995, -0.00023744720965623856, -0.00020072050392627716, -0.00016399379819631577, -0.00012726709246635437, -9.054038673639297e-05, -5.381368100643158e-05, -1.7086975276470184e-05, 1.963973045349121e-05, 5.6366436183452606e-05, 9.3093141913414e-05, 0.0001298198476433754, 0.0001665465533733368, 0.0002032732591032982, 0.00023999996483325958, 0.000276726670563221, 0.0003134533762931824, 0.00035018008202314377, 0.00038690678775310516, 0.00042363349348306656, 0.00046036019921302795, 0.0004970869049429893, 0.0005338136106729507, 0.0005705403164029121, 0.0006072670221328735, 0.0006439937278628349, 0.0006807204335927963, 0.0007174471393227577, 0.0007541738450527191, 0.0007909005507826805, 0.0008276272565126419, 0.0008643539622426033, 0.0009010806679725647, 0.0009378073737025261, 0.0009745340794324875, 0.0010112607851624489, 0.0010479874908924103, 0.0010847141966223717, 0.001121440902352333, 0.0011581676080822945, 0.0011948943138122559]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 8.0, 8.0, 9.0, 13.0, 21.0, 12.0, 14.0, 24.0, 19.0, 31.0, 29.0, 28.0, 30.0, 31.0, 30.0, 36.0, 35.0, 36.0, 39.0, 40.0, 37.0, 37.0, 47.0, 38.0, 35.0, 36.0, 25.0, 28.0, 19.0, 25.0, 29.0, 20.0, 24.0, 7.0, 13.0, 9.0, 14.0, 11.0, 10.0, 8.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9443359375, -1.8712615966796875, -1.798187255859375, -1.7251129150390625, -1.65203857421875, -1.5789642333984375, -1.505889892578125, -1.4328155517578125, -1.3597412109375, -1.2866668701171875, -1.213592529296875, -1.1405181884765625, -1.06744384765625, -0.9943695068359375, -0.921295166015625, -0.8482208251953125, -0.775146484375, -0.7020721435546875, -0.628997802734375, -0.5559234619140625, -0.48284912109375, -0.4097747802734375, -0.336700439453125, -0.2636260986328125, -0.1905517578125, -0.1174774169921875, -0.044403076171875, 0.0286712646484375, 0.10174560546875, 0.1748199462890625, 0.247894287109375, 0.3209686279296875, 0.39404296875, 0.4671173095703125, 0.540191650390625, 0.6132659912109375, 0.68634033203125, 0.7594146728515625, 0.832489013671875, 0.9055633544921875, 0.9786376953125, 1.0517120361328125, 1.124786376953125, 1.1978607177734375, 1.27093505859375, 1.3440093994140625, 1.417083740234375, 1.4901580810546875, 1.563232421875, 1.6363067626953125, 1.709381103515625, 1.7824554443359375, 1.85552978515625, 1.9286041259765625, 2.001678466796875, 2.0747528076171875, 2.1478271484375, 2.2209014892578125, 2.293975830078125, 2.3670501708984375, 2.44012451171875, 2.5131988525390625, 2.586273193359375, 2.6593475341796875, 2.732421875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 16.0, 37.0, 78.0, 135.0, 195.0, 406.0, 688.0, 1399.0, 2736.0, 5778.0, 12431.0, 29581.0, 86321.0, 393155.0, 379245.0, 84022.0, 28724.0, 12459.0, 5554.0, 2693.0, 1340.0, 735.0, 354.0, 197.0, 105.0, 66.0, 35.0, 21.0, 20.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.503204345703125, -2.42242431640625, -2.341644287109375, -2.2608642578125, -2.180084228515625, -2.09930419921875, -2.018524169921875, -1.937744140625, -1.856964111328125, -1.77618408203125, -1.695404052734375, -1.6146240234375, -1.533843994140625, -1.45306396484375, -1.372283935546875, -1.29150390625, -1.210723876953125, -1.12994384765625, -1.049163818359375, -0.9683837890625, -0.887603759765625, -0.80682373046875, -0.726043701171875, -0.645263671875, -0.564483642578125, -0.48370361328125, -0.402923583984375, -0.3221435546875, -0.241363525390625, -0.16058349609375, -0.079803466796875, 0.0009765625, 0.081756591796875, 0.16253662109375, 0.243316650390625, 0.3240966796875, 0.404876708984375, 0.48565673828125, 0.566436767578125, 0.647216796875, 0.727996826171875, 0.80877685546875, 0.889556884765625, 0.9703369140625, 1.051116943359375, 1.13189697265625, 1.212677001953125, 1.29345703125, 1.374237060546875, 1.45501708984375, 1.535797119140625, 1.6165771484375, 1.697357177734375, 1.77813720703125, 1.858917236328125, 1.939697265625, 2.020477294921875, 2.10125732421875, 2.182037353515625, 2.2628173828125, 2.343597412109375, 2.42437744140625, 2.505157470703125, 2.5859375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 9.0, 11.0, 15.0, 18.0, 27.0, 27.0, 32.0, 46.0, 46.0, 47.0, 58.0, 70.0, 152.0, 1810.0, 220.0, 85.0, 60.0, 43.0, 48.0, 41.0, 32.0, 34.0, 21.0, 19.0, 11.0, 18.0, 10.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.3984375, -9.03125, -8.6640625, -8.296875, -7.9296875, -7.5625, -7.1953125, -6.828125, -6.4609375, -6.09375, -5.7265625, -5.359375, -4.9921875, -4.625, -4.2578125, -3.890625, -3.5234375, -3.15625, -2.7890625, -2.421875, -2.0546875, -1.6875, -1.3203125, -0.953125, -0.5859375, -0.21875, 0.1484375, 0.515625, 0.8828125, 1.25, 1.6171875, 1.984375, 2.3515625, 2.71875, 3.0859375, 3.453125, 3.8203125, 4.1875, 4.5546875, 4.921875, 5.2890625, 5.65625, 6.0234375, 6.390625, 6.7578125, 7.125, 7.4921875, 7.859375, 8.2265625, 8.59375, 8.9609375, 9.328125, 9.6953125, 10.0625, 10.4296875, 10.796875, 11.1640625, 11.53125, 11.8984375, 12.265625, 12.6328125, 13.0, 13.3671875, 13.734375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 14.0, 16.0, 15.0, 13.0, 28.0, 34.0, 49.0, 59.0, 118.0, 177.0, 372.0, 1195.0, 14927.0, 2992445.0, 131883.0, 3111.0, 552.0, 238.0, 144.0, 92.0, 54.0, 34.0, 28.0, 22.0, 21.0, 15.0, 11.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.515625, -20.9454345703125, -20.375244140625, -19.8050537109375, -19.23486328125, -18.6646728515625, -18.094482421875, -17.5242919921875, -16.9541015625, -16.3839111328125, -15.813720703125, -15.2435302734375, -14.67333984375, -14.1031494140625, -13.532958984375, -12.9627685546875, -12.392578125, -11.8223876953125, -11.252197265625, -10.6820068359375, -10.11181640625, -9.5416259765625, -8.971435546875, -8.4012451171875, -7.8310546875, -7.2608642578125, -6.690673828125, -6.1204833984375, -5.55029296875, -4.9801025390625, -4.409912109375, -3.8397216796875, -3.26953125, -2.6993408203125, -2.129150390625, -1.5589599609375, -0.98876953125, -0.4185791015625, 0.151611328125, 0.7218017578125, 1.2919921875, 1.8621826171875, 2.432373046875, 3.0025634765625, 3.57275390625, 4.1429443359375, 4.713134765625, 5.2833251953125, 5.853515625, 6.4237060546875, 6.993896484375, 7.5640869140625, 8.13427734375, 8.7044677734375, 9.274658203125, 9.8448486328125, 10.4150390625, 10.9852294921875, 11.555419921875, 12.1256103515625, 12.69580078125, 13.2659912109375, 13.836181640625, 14.4063720703125, 14.9765625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 35.0, 671.0, 304.0, 9.0, 0.0, 1.0], "bins": [-150.18838500976562, -147.67611694335938, -145.1638641357422, -142.651611328125, -140.13934326171875, -137.6270751953125, -135.1148223876953, -132.60256958007812, -130.09030151367188, -127.57804107666016, -125.06578063964844, -122.55352020263672, -120.041259765625, -117.52899932861328, -115.01673889160156, -112.50447845458984, -109.99221801757812, -107.4799575805664, -104.96769714355469, -102.45543670654297, -99.94317626953125, -97.43091583251953, -94.91865539550781, -92.4063949584961, -89.89413452148438, -87.38187408447266, -84.86961364746094, -82.35735321044922, -79.8450927734375, -77.33283233642578, -74.82057189941406, -72.30831146240234, -69.79605102539062, -67.2837905883789, -64.77153015136719, -62.25926971435547, -59.74700927734375, -57.23474884033203, -54.72248840332031, -52.210227966308594, -49.697967529296875, -47.185707092285156, -44.67344665527344, -42.16118621826172, -39.64892578125, -37.13666534423828, -34.62440490722656, -32.112144470214844, -29.599885940551758, -27.08762550354004, -24.57536506652832, -22.0631046295166, -19.550844192504883, -17.038583755493164, -14.526323318481445, -12.014062881469727, -9.501802444458008, -6.989542007446289, -4.47728157043457, -1.9650211334228516, 0.5472393035888672, 3.059499740600586, 5.571760177612305, 8.084020614624023, 10.596281051635742]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 12.0, 6.0, 12.0, 14.0, 23.0, 20.0, 25.0, 29.0, 15.0, 25.0, 24.0, 33.0, 34.0, 37.0, 35.0, 49.0, 41.0, 42.0, 31.0, 26.0, 31.0, 37.0, 43.0, 35.0, 37.0, 34.0, 25.0, 25.0, 23.0, 22.0, 20.0, 17.0, 15.0, 17.0, 14.0, 6.0, 12.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-26.18975067138672, -25.385900497436523, -24.582050323486328, -23.778200149536133, -22.974349975585938, -22.170499801635742, -21.366649627685547, -20.56279945373535, -19.758949279785156, -18.95509910583496, -18.151248931884766, -17.34739875793457, -16.543548583984375, -15.73969841003418, -14.935848236083984, -14.131998062133789, -13.328147888183594, -12.524297714233398, -11.720447540283203, -10.916597366333008, -10.112747192382812, -9.308897018432617, -8.505046844482422, -7.701196670532227, -6.897346496582031, -6.093496322631836, -5.289646148681641, -4.485795974731445, -3.68194580078125, -2.8780956268310547, -2.0742454528808594, -1.270395278930664, -0.46654510498046875, 0.33730506896972656, 1.1411552429199219, 1.9450054168701172, 2.7488555908203125, 3.552705764770508, 4.356555938720703, 5.160406112670898, 5.964256286621094, 6.768106460571289, 7.571956634521484, 8.37580680847168, 9.179656982421875, 9.98350715637207, 10.787357330322266, 11.591207504272461, 12.395057678222656, 13.198907852172852, 14.002758026123047, 14.806608200073242, 15.610458374023438, 16.414308547973633, 17.218158721923828, 18.022008895874023, 18.82585906982422, 19.629709243774414, 20.43355941772461, 21.237409591674805, 22.041259765625, 22.845109939575195, 23.64896011352539, 24.452810287475586, 25.25666046142578]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 4.0, 3.0, 2.0, 9.0, 9.0, 10.0, 15.0, 14.0, 21.0, 14.0, 20.0, 21.0, 28.0, 30.0, 34.0, 27.0, 32.0, 32.0, 40.0, 28.0, 45.0, 34.0, 38.0, 43.0, 48.0, 41.0, 37.0, 34.0, 37.0, 39.0, 21.0, 24.0, 20.0, 25.0, 23.0, 16.0, 11.0, 14.0, 14.0, 15.0, 7.0, 6.0, 4.0, 4.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.052734375, -1.975250244140625, -1.89776611328125, -1.820281982421875, -1.7427978515625, -1.665313720703125, -1.58782958984375, -1.510345458984375, -1.432861328125, -1.355377197265625, -1.27789306640625, -1.200408935546875, -1.1229248046875, -1.045440673828125, -0.96795654296875, -0.890472412109375, -0.81298828125, -0.735504150390625, -0.65802001953125, -0.580535888671875, -0.5030517578125, -0.425567626953125, -0.34808349609375, -0.270599365234375, -0.193115234375, -0.115631103515625, -0.03814697265625, 0.039337158203125, 0.1168212890625, 0.194305419921875, 0.27178955078125, 0.349273681640625, 0.4267578125, 0.504241943359375, 0.58172607421875, 0.659210205078125, 0.7366943359375, 0.814178466796875, 0.89166259765625, 0.969146728515625, 1.046630859375, 1.124114990234375, 1.20159912109375, 1.279083251953125, 1.3565673828125, 1.434051513671875, 1.51153564453125, 1.589019775390625, 1.66650390625, 1.743988037109375, 1.82147216796875, 1.898956298828125, 1.9764404296875, 2.053924560546875, 2.13140869140625, 2.208892822265625, 2.286376953125, 2.363861083984375, 2.44134521484375, 2.518829345703125, 2.5963134765625, 2.673797607421875, 2.75128173828125, 2.828765869140625, 2.90625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 10.0, 7.0, 11.0, 13.0, 17.0, 23.0, 48.0, 62.0, 140.0, 284.0, 759.0, 1971.0, 5787.0, 18006.0, 62428.0, 276773.0, 2004541.0, 1541099.0, 209327.0, 50393.0, 14907.0, 4715.0, 1725.0, 637.0, 274.0, 121.0, 71.0, 43.0, 28.0, 21.0, 9.0, 11.0, 10.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.75848388671875, -6.5247802734375, -6.29107666015625, -6.057373046875, -5.82366943359375, -5.5899658203125, -5.35626220703125, -5.12255859375, -4.88885498046875, -4.6551513671875, -4.42144775390625, -4.187744140625, -3.95404052734375, -3.7203369140625, -3.48663330078125, -3.2529296875, -3.01922607421875, -2.7855224609375, -2.55181884765625, -2.318115234375, -2.08441162109375, -1.8507080078125, -1.61700439453125, -1.38330078125, -1.14959716796875, -0.9158935546875, -0.68218994140625, -0.448486328125, -0.21478271484375, 0.0189208984375, 0.25262451171875, 0.486328125, 0.72003173828125, 0.9537353515625, 1.18743896484375, 1.421142578125, 1.65484619140625, 1.8885498046875, 2.12225341796875, 2.35595703125, 2.58966064453125, 2.8233642578125, 3.05706787109375, 3.290771484375, 3.52447509765625, 3.7581787109375, 3.99188232421875, 4.2255859375, 4.45928955078125, 4.6929931640625, 4.92669677734375, 5.160400390625, 5.39410400390625, 5.6278076171875, 5.86151123046875, 6.09521484375, 6.32891845703125, 6.5626220703125, 6.79632568359375, 7.030029296875, 7.26373291015625, 7.4974365234375, 7.73114013671875, 7.96484375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 17.0, 21.0, 50.0, 82.0, 118.0, 185.0, 283.0, 468.0, 677.0, 726.0, 507.0, 387.0, 203.0, 121.0, 85.0, 53.0, 21.0, 16.0, 20.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.8046875, -15.4105224609375, -15.016357421875, -14.6221923828125, -14.22802734375, -13.8338623046875, -13.439697265625, -13.0455322265625, -12.6513671875, -12.2572021484375, -11.863037109375, -11.4688720703125, -11.07470703125, -10.6805419921875, -10.286376953125, -9.8922119140625, -9.498046875, -9.1038818359375, -8.709716796875, -8.3155517578125, -7.92138671875, -7.5272216796875, -7.133056640625, -6.7388916015625, -6.3447265625, -5.9505615234375, -5.556396484375, -5.1622314453125, -4.76806640625, -4.3739013671875, -3.979736328125, -3.5855712890625, -3.19140625, -2.7972412109375, -2.403076171875, -2.0089111328125, -1.61474609375, -1.2205810546875, -0.826416015625, -0.4322509765625, -0.0380859375, 0.3560791015625, 0.750244140625, 1.1444091796875, 1.53857421875, 1.9327392578125, 2.326904296875, 2.7210693359375, 3.115234375, 3.5093994140625, 3.903564453125, 4.2977294921875, 4.69189453125, 5.0860595703125, 5.480224609375, 5.8743896484375, 6.2685546875, 6.6627197265625, 7.056884765625, 7.4510498046875, 7.84521484375, 8.2393798828125, 8.633544921875, 9.0277099609375, 9.421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 6.0, 14.0, 28.0, 19.0, 43.0, 52.0, 87.0, 144.0, 200.0, 372.0, 723.0, 1915.0, 9284.0, 103093.0, 2664354.0, 1346351.0, 58133.0, 6467.0, 1518.0, 633.0, 306.0, 165.0, 100.0, 90.0, 39.0, 43.0, 31.0, 22.0, 12.0, 14.0, 7.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.421875, -24.693359375, -23.96484375, -23.236328125, -22.5078125, -21.779296875, -21.05078125, -20.322265625, -19.59375, -18.865234375, -18.13671875, -17.408203125, -16.6796875, -15.951171875, -15.22265625, -14.494140625, -13.765625, -13.037109375, -12.30859375, -11.580078125, -10.8515625, -10.123046875, -9.39453125, -8.666015625, -7.9375, -7.208984375, -6.48046875, -5.751953125, -5.0234375, -4.294921875, -3.56640625, -2.837890625, -2.109375, -1.380859375, -0.65234375, 0.076171875, 0.8046875, 1.533203125, 2.26171875, 2.990234375, 3.71875, 4.447265625, 5.17578125, 5.904296875, 6.6328125, 7.361328125, 8.08984375, 8.818359375, 9.546875, 10.275390625, 11.00390625, 11.732421875, 12.4609375, 13.189453125, 13.91796875, 14.646484375, 15.375, 16.103515625, 16.83203125, 17.560546875, 18.2890625, 19.017578125, 19.74609375, 20.474609375, 21.203125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 27.0, 67.0, 146.0, 276.0, 243.0, 145.0, 75.0, 19.0, 8.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.09095764160156, -162.89561462402344, -159.70028686523438, -156.50494384765625, -153.3096160888672, -150.11427307128906, -146.9189453125, -143.72360229492188, -140.5282745361328, -137.3329315185547, -134.13760375976562, -130.9422607421875, -127.74693298339844, -124.55159759521484, -121.35626220703125, -118.16092681884766, -114.96559143066406, -111.77025604248047, -108.57492065429688, -105.37958526611328, -102.18424987792969, -98.9889144897461, -95.7935791015625, -92.5982437133789, -89.40290069580078, -86.20756530761719, -83.0122299194336, -79.81689453125, -76.6215591430664, -73.42622375488281, -70.23088836669922, -67.03555297851562, -63.8402214050293, -60.6448860168457, -57.44955062866211, -54.254215240478516, -51.05887985229492, -47.86354446411133, -44.66820526123047, -41.472869873046875, -38.27753448486328, -35.08219909667969, -31.886863708496094, -28.6915283203125, -25.496192932128906, -22.300857543945312, -19.105520248413086, -15.910184860229492, -12.714851379394531, -9.519515991210938, -6.3241801261901855, -3.1288442611694336, 0.06649112701416016, 3.261826515197754, 6.457162857055664, 9.652498245239258, 12.847833633422852, 16.043169021606445, 19.23850440979004, 22.433841705322266, 25.62917709350586, 28.824512481689453, 32.01984786987305, 35.21518325805664, 38.410518646240234]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 6.0, 10.0, 8.0, 8.0, 5.0, 6.0, 17.0, 20.0, 18.0, 11.0, 21.0, 33.0, 28.0, 24.0, 35.0, 43.0, 27.0, 30.0, 36.0, 43.0, 40.0, 42.0, 35.0, 45.0, 47.0, 36.0, 38.0, 32.0, 28.0, 40.0, 21.0, 23.0, 19.0, 14.0, 16.0, 23.0, 13.0, 7.0, 12.0, 8.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.056198120117188, -25.192293167114258, -24.328386306762695, -23.464481353759766, -22.600574493408203, -21.736669540405273, -20.872764587402344, -20.00885772705078, -19.14495277404785, -18.281047821044922, -17.41714096069336, -16.55323600769043, -15.689330101013184, -14.825424194335938, -13.961519241333008, -13.097613334655762, -12.233707427978516, -11.36980152130127, -10.505895614624023, -9.641990661621094, -8.778084754943848, -7.914178848266602, -7.050273418426514, -6.186367988586426, -5.32246208190918, -4.458556175231934, -3.5946507453918457, -2.7307450771331787, -1.8668394088745117, -1.0029335021972656, -0.13902807235717773, 0.7248773574829102, 1.5887832641601562, 2.4526889324188232, 3.3165946006774902, 4.180500030517578, 5.044405937194824, 5.90831184387207, 6.772217273712158, 7.636122703552246, 8.500028610229492, 9.363934516906738, 10.227840423583984, 11.091745376586914, 11.95565128326416, 12.819557189941406, 13.683462142944336, 14.547368049621582, 15.411273956298828, 16.275178909301758, 17.13908576965332, 18.00299072265625, 18.866897583007812, 19.730802536010742, 20.594707489013672, 21.458614349365234, 22.322519302368164, 23.186424255371094, 24.050331115722656, 24.914236068725586, 25.778141021728516, 26.642047882080078, 27.505952835083008, 28.369857788085938, 29.2337646484375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 3.0, 4.0, 10.0, 19.0, 16.0, 12.0, 18.0, 16.0, 17.0, 28.0, 19.0, 19.0, 23.0, 23.0, 32.0, 33.0, 44.0, 40.0, 46.0, 39.0, 40.0, 42.0, 48.0, 34.0, 35.0, 32.0, 34.0, 29.0, 30.0, 20.0, 31.0, 29.0, 24.0, 25.0, 8.0, 11.0, 9.0, 10.0, 7.0, 11.0, 10.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.251953125, -2.1708984375, -2.08984375, -2.0087890625, -1.927734375, -1.8466796875, -1.765625, -1.6845703125, -1.603515625, -1.5224609375, -1.44140625, -1.3603515625, -1.279296875, -1.1982421875, -1.1171875, -1.0361328125, -0.955078125, -0.8740234375, -0.79296875, -0.7119140625, -0.630859375, -0.5498046875, -0.46875, -0.3876953125, -0.306640625, -0.2255859375, -0.14453125, -0.0634765625, 0.017578125, 0.0986328125, 0.1796875, 0.2607421875, 0.341796875, 0.4228515625, 0.50390625, 0.5849609375, 0.666015625, 0.7470703125, 0.828125, 0.9091796875, 0.990234375, 1.0712890625, 1.15234375, 1.2333984375, 1.314453125, 1.3955078125, 1.4765625, 1.5576171875, 1.638671875, 1.7197265625, 1.80078125, 1.8818359375, 1.962890625, 2.0439453125, 2.125, 2.2060546875, 2.287109375, 2.3681640625, 2.44921875, 2.5302734375, 2.611328125, 2.6923828125, 2.7734375, 2.8544921875, 2.935546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 17.0, 28.0, 45.0, 80.0, 123.0, 212.0, 270.0, 396.0, 620.0, 940.0, 1428.0, 2172.0, 3121.0, 4728.0, 7021.0, 10629.0, 16062.0, 23916.0, 36422.0, 53999.0, 77824.0, 109150.0, 139693.0, 149890.0, 123990.0, 91797.0, 64037.0, 42895.0, 29008.0, 19505.0, 12868.0, 8602.0, 5820.0, 3789.0, 2538.0, 1679.0, 1072.0, 750.0, 460.0, 355.0, 236.0, 115.0, 78.0, 63.0, 36.0, 25.0, 16.0, 14.0, 8.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.31103515625, -0.3010749816894531, -0.29111480712890625, -0.2811546325683594, -0.2711944580078125, -0.2612342834472656, -0.25127410888671875, -0.24131393432617188, -0.231353759765625, -0.22139358520507812, -0.21143341064453125, -0.20147323608398438, -0.1915130615234375, -0.18155288696289062, -0.17159271240234375, -0.16163253784179688, -0.15167236328125, -0.14171218872070312, -0.13175201416015625, -0.12179183959960938, -0.1118316650390625, -0.10187149047851562, -0.09191131591796875, -0.08195114135742188, -0.071990966796875, -0.062030792236328125, -0.05207061767578125, -0.042110443115234375, -0.0321502685546875, -0.022190093994140625, -0.01222991943359375, -0.002269744873046875, 0.0076904296875, 0.017650604248046875, 0.02761077880859375, 0.037570953369140625, 0.0475311279296875, 0.057491302490234375, 0.06745147705078125, 0.07741165161132812, 0.087371826171875, 0.09733200073242188, 0.10729217529296875, 0.11725234985351562, 0.1272125244140625, 0.13717269897460938, 0.14713287353515625, 0.15709304809570312, 0.16705322265625, 0.17701339721679688, 0.18697357177734375, 0.19693374633789062, 0.2068939208984375, 0.21685409545898438, 0.22681427001953125, 0.23677444458007812, 0.246734619140625, 0.2566947937011719, 0.26665496826171875, 0.2766151428222656, 0.2865753173828125, 0.2965354919433594, 0.30649566650390625, 0.3164558410644531, 0.326416015625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 10.0, 12.0, 9.0, 9.0, 10.0, 16.0, 17.0, 16.0, 31.0, 25.0, 22.0, 40.0, 33.0, 37.0, 45.0, 37.0, 44.0, 35.0, 34.0, 1078.0, 35.0, 29.0, 40.0, 45.0, 22.0, 31.0, 29.0, 36.0, 29.0, 25.0, 28.0, 18.0, 13.0, 10.0, 9.0, 4.0, 9.0, 4.0, 8.0, 10.0, 4.0, 2.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 3.0], "bins": [-1.849609375, -1.795379638671875, -1.74114990234375, -1.686920166015625, -1.6326904296875, -1.578460693359375, -1.52423095703125, -1.470001220703125, -1.415771484375, -1.361541748046875, -1.30731201171875, -1.253082275390625, -1.1988525390625, -1.144622802734375, -1.09039306640625, -1.036163330078125, -0.98193359375, -0.927703857421875, -0.87347412109375, -0.819244384765625, -0.7650146484375, -0.710784912109375, -0.65655517578125, -0.602325439453125, -0.548095703125, -0.493865966796875, -0.43963623046875, -0.385406494140625, -0.3311767578125, -0.276947021484375, -0.22271728515625, -0.168487548828125, -0.1142578125, -0.060028076171875, -0.00579833984375, 0.048431396484375, 0.1026611328125, 0.156890869140625, 0.21112060546875, 0.265350341796875, 0.319580078125, 0.373809814453125, 0.42803955078125, 0.482269287109375, 0.5364990234375, 0.590728759765625, 0.64495849609375, 0.699188232421875, 0.75341796875, 0.807647705078125, 0.86187744140625, 0.916107177734375, 0.9703369140625, 1.024566650390625, 1.07879638671875, 1.133026123046875, 1.187255859375, 1.241485595703125, 1.29571533203125, 1.349945068359375, 1.4041748046875, 1.458404541015625, 1.51263427734375, 1.566864013671875, 1.62109375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 3.0, 6.0, 13.0, 19.0, 21.0, 36.0, 68.0, 92.0, 122.0, 229.0, 330.0, 489.0, 770.0, 1134.0, 1759.0, 2584.0, 4092.0, 6058.0, 9678.0, 15116.0, 23232.0, 35673.0, 55027.0, 81885.0, 118382.0, 175339.0, 1182375.0, 125501.0, 88414.0, 59002.0, 38633.0, 25279.0, 16110.0, 10402.0, 6718.0, 4274.0, 2788.0, 1954.0, 1153.0, 770.0, 509.0, 355.0, 246.0, 177.0, 104.0, 78.0, 42.0, 32.0, 23.0, 20.0, 10.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.223388671875, -0.21642684936523438, -0.20946502685546875, -0.20250320434570312, -0.1955413818359375, -0.18857955932617188, -0.18161773681640625, -0.17465591430664062, -0.167694091796875, -0.16073226928710938, -0.15377044677734375, -0.14680862426757812, -0.1398468017578125, -0.13288497924804688, -0.12592315673828125, -0.11896133422851562, -0.11199951171875, -0.10503768920898438, -0.09807586669921875, -0.09111404418945312, -0.0841522216796875, -0.07719039916992188, -0.07022857666015625, -0.06326675415039062, -0.056304931640625, -0.049343109130859375, -0.04238128662109375, -0.035419464111328125, -0.0284576416015625, -0.021495819091796875, -0.01453399658203125, -0.007572174072265625, -0.0006103515625, 0.006351470947265625, 0.01331329345703125, 0.020275115966796875, 0.0272369384765625, 0.034198760986328125, 0.04116058349609375, 0.048122406005859375, 0.055084228515625, 0.062046051025390625, 0.06900787353515625, 0.07596969604492188, 0.0829315185546875, 0.08989334106445312, 0.09685516357421875, 0.10381698608398438, 0.11077880859375, 0.11774063110351562, 0.12470245361328125, 0.13166427612304688, 0.1386260986328125, 0.14558792114257812, 0.15254974365234375, 0.15951156616210938, 0.166473388671875, 0.17343521118164062, 0.18039703369140625, 0.18735885620117188, 0.1943206787109375, 0.20128250122070312, 0.20824432373046875, 0.21520614624023438, 0.22216796875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 10.0, 17.0, 24.0, 25.0, 43.0, 64.0, 98.0, 173.0, 169.0, 116.0, 59.0, 40.0, 30.0, 26.0, 19.0, 9.0, 15.0, 8.0, 9.0, 1.0, 3.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0044403076171875, -0.0042972564697265625, -0.004154205322265625, -0.0040111541748046875, -0.00386810302734375, -0.0037250518798828125, -0.003582000732421875, -0.0034389495849609375, -0.0032958984375, -0.0031528472900390625, -0.003009796142578125, -0.0028667449951171875, -0.00272369384765625, -0.0025806427001953125, -0.002437591552734375, -0.0022945404052734375, -0.0021514892578125, -0.0020084381103515625, -0.001865386962890625, -0.0017223358154296875, -0.00157928466796875, -0.0014362335205078125, -0.001293182373046875, -0.0011501312255859375, -0.001007080078125, -0.0008640289306640625, -0.000720977783203125, -0.0005779266357421875, -0.00043487548828125, -0.0002918243408203125, -0.000148773193359375, -5.7220458984375e-06, 0.0001373291015625, 0.0002803802490234375, 0.000423431396484375, 0.0005664825439453125, 0.00070953369140625, 0.0008525848388671875, 0.000995635986328125, 0.0011386871337890625, 0.00128173828125, 0.0014247894287109375, 0.001567840576171875, 0.0017108917236328125, 0.00185394287109375, 0.0019969940185546875, 0.002140045166015625, 0.0022830963134765625, 0.0024261474609375, 0.0025691986083984375, 0.002712249755859375, 0.0028553009033203125, 0.00299835205078125, 0.0031414031982421875, 0.003284454345703125, 0.0034275054931640625, 0.003570556640625, 0.0037136077880859375, 0.003856658935546875, 0.0039997100830078125, 0.00414276123046875, 0.0042858123779296875, 0.004428863525390625, 0.0045719146728515625, 0.0047149658203125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 7.0, 4.0, 5.0, 5.0, 7.0, 16.0, 15.0, 24.0, 35.0, 58.0, 73.0, 163.0, 522.0, 4486.0, 648347.0, 390022.0, 3875.0, 471.0, 161.0, 111.0, 49.0, 27.0, 23.0, 15.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0858154296875, -0.08321285247802734, -0.08061027526855469, -0.07800769805908203, -0.07540512084960938, -0.07280254364013672, -0.07019996643066406, -0.0675973892211914, -0.06499481201171875, -0.062392234802246094, -0.05978965759277344, -0.05718708038330078, -0.054584503173828125, -0.05198192596435547, -0.04937934875488281, -0.046776771545410156, -0.0441741943359375, -0.041571617126464844, -0.03896903991699219, -0.03636646270751953, -0.033763885498046875, -0.03116130828857422, -0.028558731079101562, -0.025956153869628906, -0.02335357666015625, -0.020750999450683594, -0.018148422241210938, -0.015545845031738281, -0.012943267822265625, -0.010340690612792969, -0.0077381134033203125, -0.005135536193847656, -0.002532958984375, 6.961822509765625e-05, 0.0026721954345703125, 0.005274772644042969, 0.007877349853515625, 0.010479927062988281, 0.013082504272460938, 0.015685081481933594, 0.01828765869140625, 0.020890235900878906, 0.023492813110351562, 0.02609539031982422, 0.028697967529296875, 0.03130054473876953, 0.03390312194824219, 0.036505699157714844, 0.0391082763671875, 0.041710853576660156, 0.04431343078613281, 0.04691600799560547, 0.049518585205078125, 0.05212116241455078, 0.05472373962402344, 0.057326316833496094, 0.05992889404296875, 0.0625314712524414, 0.06513404846191406, 0.06773662567138672, 0.07033920288085938, 0.07294178009033203, 0.07554435729980469, 0.07814693450927734, 0.08074951171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 6.0, 8.0, 13.0, 19.0, 30.0, 35.0, 55.0, 85.0, 136.0, 156.0, 153.0, 115.0, 74.0, 47.0, 25.0, 17.0, 11.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.008963936939835548, -0.008772906847298145, -0.008581876754760742, -0.008390846662223339, -0.008199816569685936, -0.008008786477148533, -0.00781775638461113, -0.007626726292073727, -0.0074356961995363235, -0.0072446661069989204, -0.007053636014461517, -0.006862605921924114, -0.006671575829386711, -0.006480545736849308, -0.006289515644311905, -0.006098485551774502, -0.005907454993575811, -0.005716424901038408, -0.005525394808501005, -0.005334364715963602, -0.005143334623426199, -0.004952304530888796, -0.0047612739726901054, -0.004570243880152702, -0.004379213787615299, -0.004188183695077896, -0.003997153602540493, -0.00380612351000309, -0.003615093417465687, -0.0034240633249282837, -0.003233032999560237, -0.003042002907022834, -0.0028509730473160744, -0.0026599429547786713, -0.002468912862241268, -0.002277882769703865, -0.002086852677166462, -0.001895822468213737, -0.001704792259261012, -0.001513762166723609, -0.0013227320741862059, -0.0011317019816488028, -0.0009406718309037387, -0.0007496416801586747, -0.0005586115876212716, -0.0003675814950838685, -0.00017655128613114357, 1.4478806406259537e-05, 0.00020550889894366264, 0.0003965390205848962, 0.0005875691422261298, 0.0007785992929711938, 0.0009696293855085969, 0.001160659478046, 0.001351689686998725, 0.001542719779536128, 0.0017337498720735312, 0.0019247799646109343, 0.0021158100571483374, 0.002306840382516384, 0.0024978704750537872, 0.0026889005675911903, 0.0028799306601285934, 0.0030709607526659966, 0.0032619908452033997]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 7.0, 5.0, 3.0, 9.0, 16.0, 15.0, 21.0, 10.0, 24.0, 25.0, 24.0, 25.0, 34.0, 34.0, 35.0, 41.0, 39.0, 38.0, 44.0, 36.0, 35.0, 37.0, 35.0, 35.0, 23.0, 34.0, 35.0, 31.0, 26.0, 28.0, 34.0, 33.0, 27.0, 19.0, 11.0, 16.0, 5.0, 9.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.001646876335144043, -0.0015959041193127632, -0.0015449319034814835, -0.0014939596876502037, -0.001442987471818924, -0.0013920152559876442, -0.0013410430401563644, -0.0012900708243250847, -0.001239098608493805, -0.0011881263926625252, -0.0011371541768312454, -0.0010861819609999657, -0.001035209745168686, -0.0009842375293374062, -0.0009332653135061264, -0.0008822930976748466, -0.0008313208818435669, -0.0007803486660122871, -0.0007293764501810074, -0.0006784042343497276, -0.0006274320185184479, -0.0005764598026871681, -0.0005254875868558884, -0.0004745153710246086, -0.00042354315519332886, -0.0003725709393620491, -0.00032159872353076935, -0.0002706265076994896, -0.00021965429186820984, -0.00016868207603693008, -0.00011770986020565033, -6.673764437437057e-05, -1.576542854309082e-05, 3.5206787288188934e-05, 8.617900311946869e-05, 0.00013715121895074844, 0.0001881234347820282, 0.00023909565061330795, 0.0002900678664445877, 0.00034104008227586746, 0.0003920122981071472, 0.00044298451393842697, 0.0004939567297697067, 0.0005449289456009865, 0.0005959011614322662, 0.000646873377263546, 0.0006978455930948257, 0.0007488178089261055, 0.0007997900247573853, 0.000850762240588665, 0.0009017344564199448, 0.0009527066722512245, 0.0010036788880825043, 0.001054651103913784, 0.0011056233197450638, 0.0011565955355763435, 0.0012075677514076233, 0.001258539967238903, 0.0013095121830701828, 0.0013604843989014626, 0.0014114566147327423, 0.001462428830564022, 0.0015134010463953018, 0.0015643732622265816, 0.0016153454780578613]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 3.0, 4.0, 10.0, 19.0, 16.0, 12.0, 18.0, 16.0, 17.0, 28.0, 19.0, 19.0, 23.0, 23.0, 32.0, 33.0, 44.0, 40.0, 47.0, 38.0, 40.0, 42.0, 48.0, 34.0, 35.0, 32.0, 34.0, 29.0, 30.0, 20.0, 31.0, 29.0, 24.0, 25.0, 8.0, 11.0, 9.0, 10.0, 7.0, 11.0, 10.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.251953125, -2.1708984375, -2.08984375, -2.0087890625, -1.927734375, -1.8466796875, -1.765625, -1.6845703125, -1.603515625, -1.5224609375, -1.44140625, -1.3603515625, -1.279296875, -1.1982421875, -1.1171875, -1.0361328125, -0.955078125, -0.8740234375, -0.79296875, -0.7119140625, -0.630859375, -0.5498046875, -0.46875, -0.3876953125, -0.306640625, -0.2255859375, -0.14453125, -0.0634765625, 0.017578125, 0.0986328125, 0.1796875, 0.2607421875, 0.341796875, 0.4228515625, 0.50390625, 0.5849609375, 0.666015625, 0.7470703125, 0.828125, 0.9091796875, 0.990234375, 1.0712890625, 1.15234375, 1.2333984375, 1.314453125, 1.3955078125, 1.4765625, 1.5576171875, 1.638671875, 1.7197265625, 1.80078125, 1.8818359375, 1.962890625, 2.0439453125, 2.125, 2.2060546875, 2.287109375, 2.3681640625, 2.44921875, 2.5302734375, 2.611328125, 2.6923828125, 2.7734375, 2.8544921875, 2.935546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 5.0, 10.0, 12.0, 13.0, 19.0, 32.0, 41.0, 56.0, 108.0, 123.0, 192.0, 311.0, 481.0, 719.0, 1039.0, 1676.0, 2503.0, 4078.0, 6820.0, 12398.0, 26693.0, 78319.0, 315170.0, 420861.0, 108036.0, 33667.0, 14557.0, 7753.0, 4589.0, 2887.0, 1853.0, 1140.0, 830.0, 509.0, 339.0, 215.0, 137.0, 104.0, 75.0, 55.0, 41.0, 27.0, 19.0, 11.0, 12.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.265625, -3.169921875, -3.07421875, -2.978515625, -2.8828125, -2.787109375, -2.69140625, -2.595703125, -2.5, -2.404296875, -2.30859375, -2.212890625, -2.1171875, -2.021484375, -1.92578125, -1.830078125, -1.734375, -1.638671875, -1.54296875, -1.447265625, -1.3515625, -1.255859375, -1.16015625, -1.064453125, -0.96875, -0.873046875, -0.77734375, -0.681640625, -0.5859375, -0.490234375, -0.39453125, -0.298828125, -0.203125, -0.107421875, -0.01171875, 0.083984375, 0.1796875, 0.275390625, 0.37109375, 0.466796875, 0.5625, 0.658203125, 0.75390625, 0.849609375, 0.9453125, 1.041015625, 1.13671875, 1.232421875, 1.328125, 1.423828125, 1.51953125, 1.615234375, 1.7109375, 1.806640625, 1.90234375, 1.998046875, 2.09375, 2.189453125, 2.28515625, 2.380859375, 2.4765625, 2.572265625, 2.66796875, 2.763671875, 2.859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 6.0, 12.0, 9.0, 18.0, 24.0, 11.0, 18.0, 17.0, 38.0, 27.0, 28.0, 39.0, 56.0, 38.0, 51.0, 98.0, 205.0, 1581.0, 244.0, 79.0, 66.0, 41.0, 54.0, 44.0, 34.0, 27.0, 28.0, 26.0, 20.0, 18.0, 9.0, 16.0, 9.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.8756103515625, -8.563720703125, -8.2518310546875, -7.93994140625, -7.6280517578125, -7.316162109375, -7.0042724609375, -6.6923828125, -6.3804931640625, -6.068603515625, -5.7567138671875, -5.44482421875, -5.1329345703125, -4.821044921875, -4.5091552734375, -4.197265625, -3.8853759765625, -3.573486328125, -3.2615966796875, -2.94970703125, -2.6378173828125, -2.325927734375, -2.0140380859375, -1.7021484375, -1.3902587890625, -1.078369140625, -0.7664794921875, -0.45458984375, -0.1427001953125, 0.169189453125, 0.4810791015625, 0.79296875, 1.1048583984375, 1.416748046875, 1.7286376953125, 2.04052734375, 2.3524169921875, 2.664306640625, 2.9761962890625, 3.2880859375, 3.5999755859375, 3.911865234375, 4.2237548828125, 4.53564453125, 4.8475341796875, 5.159423828125, 5.4713134765625, 5.783203125, 6.0950927734375, 6.406982421875, 6.7188720703125, 7.03076171875, 7.3426513671875, 7.654541015625, 7.9664306640625, 8.2783203125, 8.5902099609375, 8.902099609375, 9.2139892578125, 9.52587890625, 9.8377685546875, 10.149658203125, 10.4615478515625, 10.7734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 5.0, 2.0, 10.0, 15.0, 10.0, 9.0, 15.0, 21.0, 23.0, 32.0, 35.0, 47.0, 70.0, 89.0, 170.0, 215.0, 405.0, 1355.0, 8081.0, 109528.0, 2948705.0, 68328.0, 6286.0, 1103.0, 393.0, 220.0, 131.0, 78.0, 60.0, 57.0, 36.0, 37.0, 18.0, 22.0, 18.0, 9.0, 19.0, 9.0, 6.0, 9.0, 5.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-15.1328125, -14.666259765625, -14.19970703125, -13.733154296875, -13.2666015625, -12.800048828125, -12.33349609375, -11.866943359375, -11.400390625, -10.933837890625, -10.46728515625, -10.000732421875, -9.5341796875, -9.067626953125, -8.60107421875, -8.134521484375, -7.66796875, -7.201416015625, -6.73486328125, -6.268310546875, -5.8017578125, -5.335205078125, -4.86865234375, -4.402099609375, -3.935546875, -3.468994140625, -3.00244140625, -2.535888671875, -2.0693359375, -1.602783203125, -1.13623046875, -0.669677734375, -0.203125, 0.263427734375, 0.72998046875, 1.196533203125, 1.6630859375, 2.129638671875, 2.59619140625, 3.062744140625, 3.529296875, 3.995849609375, 4.46240234375, 4.928955078125, 5.3955078125, 5.862060546875, 6.32861328125, 6.795166015625, 7.26171875, 7.728271484375, 8.19482421875, 8.661376953125, 9.1279296875, 9.594482421875, 10.06103515625, 10.527587890625, 10.994140625, 11.460693359375, 11.92724609375, 12.393798828125, 12.8603515625, 13.326904296875, 13.79345703125, 14.260009765625, 14.7265625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 224.0, 711.0, 76.0], "bins": [-222.7293701171875, -219.15403747558594, -215.57870483398438, -212.0033721923828, -208.42803955078125, -204.8527069091797, -201.27737426757812, -197.70204162597656, -194.126708984375, -190.55137634277344, -186.97604370117188, -183.4007110595703, -179.82537841796875, -176.2500457763672, -172.67471313476562, -169.09938049316406, -165.5240478515625, -161.94871520996094, -158.37338256835938, -154.7980499267578, -151.22271728515625, -147.6473846435547, -144.07205200195312, -140.49671936035156, -136.92138671875, -133.34605407714844, -129.77072143554688, -126.19538879394531, -122.62005615234375, -119.04472351074219, -115.46939086914062, -111.89405822753906, -108.31873321533203, -104.74340057373047, -101.1680679321289, -97.59273529052734, -94.01740264892578, -90.44207000732422, -86.86673736572266, -83.2914047241211, -79.71607971191406, -76.1407470703125, -72.56541442871094, -68.99008178710938, -65.41474914550781, -61.83941650390625, -58.26408386230469, -54.688751220703125, -51.11341857910156, -47.5380859375, -43.96275329589844, -40.387420654296875, -36.81208801269531, -33.23675537109375, -29.66142463684082, -26.086091995239258, -22.510757446289062, -18.9354248046875, -15.360092163085938, -11.784760475158691, -8.209427833557129, -4.634096145629883, -1.0587635040283203, 2.516569137573242, 6.091900825500488]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 9.0, 11.0, 23.0, 18.0, 14.0, 24.0, 25.0, 18.0, 17.0, 25.0, 30.0, 35.0, 33.0, 30.0, 31.0, 35.0, 36.0, 40.0, 31.0, 41.0, 37.0, 33.0, 30.0, 38.0, 30.0, 24.0, 24.0, 34.0, 23.0, 30.0, 19.0, 21.0, 19.0, 11.0, 14.0, 8.0, 11.0, 6.0, 3.0, 7.0, 4.0, 7.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0], "bins": [-29.643850326538086, -28.738550186157227, -27.833251953125, -26.92795181274414, -26.022653579711914, -25.117353439331055, -24.212055206298828, -23.30675506591797, -22.40145492553711, -21.49615478515625, -20.590856552124023, -19.685556411743164, -18.780258178710938, -17.874958038330078, -16.96965789794922, -16.064359664916992, -15.159061431884766, -14.253762245178223, -13.34846305847168, -12.44316291809082, -11.537864685058594, -10.632564544677734, -9.727265357971191, -8.821966171264648, -7.9166669845581055, -7.0113677978515625, -6.1060686111450195, -5.200768947601318, -4.295469760894775, -3.3901705741882324, -2.4848709106445312, -1.5795717239379883, -0.6742744445800781, 0.2310248613357544, 1.136324167251587, 2.041623592376709, 2.946922779083252, 3.852221965789795, 4.757521629333496, 5.662820816040039, 6.568120002746582, 7.473419189453125, 8.378718376159668, 9.284017562866211, 10.18931770324707, 11.094615936279297, 11.999916076660156, 12.9052152633667, 13.810514450073242, 14.715813636779785, 15.621112823486328, 16.526412963867188, 17.431711196899414, 18.337011337280273, 19.2423095703125, 20.14760971069336, 21.05290985107422, 21.958209991455078, 22.863508224487305, 23.768808364868164, 24.67410659790039, 25.57940673828125, 26.48470687866211, 27.390005111694336, 28.295303344726562]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 5.0, 7.0, 10.0, 7.0, 12.0, 19.0, 11.0, 18.0, 21.0, 14.0, 20.0, 22.0, 28.0, 17.0, 24.0, 34.0, 41.0, 37.0, 37.0, 35.0, 48.0, 42.0, 40.0, 33.0, 38.0, 39.0, 28.0, 29.0, 36.0, 27.0, 37.0, 33.0, 16.0, 21.0, 26.0, 14.0, 8.0, 12.0, 8.0, 11.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2578125, -2.1766357421875, -2.095458984375, -2.0142822265625, -1.93310546875, -1.8519287109375, -1.770751953125, -1.6895751953125, -1.6083984375, -1.5272216796875, -1.446044921875, -1.3648681640625, -1.28369140625, -1.2025146484375, -1.121337890625, -1.0401611328125, -0.958984375, -0.8778076171875, -0.796630859375, -0.7154541015625, -0.63427734375, -0.5531005859375, -0.471923828125, -0.3907470703125, -0.3095703125, -0.2283935546875, -0.147216796875, -0.0660400390625, 0.01513671875, 0.0963134765625, 0.177490234375, 0.2586669921875, 0.33984375, 0.4210205078125, 0.502197265625, 0.5833740234375, 0.66455078125, 0.7457275390625, 0.826904296875, 0.9080810546875, 0.9892578125, 1.0704345703125, 1.151611328125, 1.2327880859375, 1.31396484375, 1.3951416015625, 1.476318359375, 1.5574951171875, 1.638671875, 1.7198486328125, 1.801025390625, 1.8822021484375, 1.96337890625, 2.0445556640625, 2.125732421875, 2.2069091796875, 2.2880859375, 2.3692626953125, 2.450439453125, 2.5316162109375, 2.61279296875, 2.6939697265625, 2.775146484375, 2.8563232421875, 2.9375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 4.0, 3.0, 5.0, 9.0, 4.0, 12.0, 7.0, 12.0, 16.0, 26.0, 29.0, 38.0, 70.0, 102.0, 175.0, 437.0, 956.0, 2328.0, 6365.0, 18682.0, 60895.0, 249611.0, 1593092.0, 1865852.0, 293271.0, 69472.0, 20996.0, 6924.0, 2668.0, 1089.0, 480.0, 266.0, 127.0, 78.0, 40.0, 31.0, 25.0, 21.0, 9.0, 8.0, 10.0, 9.0, 7.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.1640625, -6.933349609375, -6.70263671875, -6.471923828125, -6.2412109375, -6.010498046875, -5.77978515625, -5.549072265625, -5.318359375, -5.087646484375, -4.85693359375, -4.626220703125, -4.3955078125, -4.164794921875, -3.93408203125, -3.703369140625, -3.47265625, -3.241943359375, -3.01123046875, -2.780517578125, -2.5498046875, -2.319091796875, -2.08837890625, -1.857666015625, -1.626953125, -1.396240234375, -1.16552734375, -0.934814453125, -0.7041015625, -0.473388671875, -0.24267578125, -0.011962890625, 0.21875, 0.449462890625, 0.68017578125, 0.910888671875, 1.1416015625, 1.372314453125, 1.60302734375, 1.833740234375, 2.064453125, 2.295166015625, 2.52587890625, 2.756591796875, 2.9873046875, 3.218017578125, 3.44873046875, 3.679443359375, 3.91015625, 4.140869140625, 4.37158203125, 4.602294921875, 4.8330078125, 5.063720703125, 5.29443359375, 5.525146484375, 5.755859375, 5.986572265625, 6.21728515625, 6.447998046875, 6.6787109375, 6.909423828125, 7.14013671875, 7.370849609375, 7.6015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 7.0, 11.0, 17.0, 20.0, 22.0, 33.0, 54.0, 74.0, 73.0, 114.0, 129.0, 200.0, 249.0, 330.0, 422.0, 517.0, 417.0, 329.0, 268.0, 202.0, 145.0, 105.0, 80.0, 54.0, 50.0, 37.0, 24.0, 23.0, 11.0, 12.0, 13.0, 3.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.1494140625, -8.884765625, -8.6201171875, -8.35546875, -8.0908203125, -7.826171875, -7.5615234375, -7.296875, -7.0322265625, -6.767578125, -6.5029296875, -6.23828125, -5.9736328125, -5.708984375, -5.4443359375, -5.1796875, -4.9150390625, -4.650390625, -4.3857421875, -4.12109375, -3.8564453125, -3.591796875, -3.3271484375, -3.0625, -2.7978515625, -2.533203125, -2.2685546875, -2.00390625, -1.7392578125, -1.474609375, -1.2099609375, -0.9453125, -0.6806640625, -0.416015625, -0.1513671875, 0.11328125, 0.3779296875, 0.642578125, 0.9072265625, 1.171875, 1.4365234375, 1.701171875, 1.9658203125, 2.23046875, 2.4951171875, 2.759765625, 3.0244140625, 3.2890625, 3.5537109375, 3.818359375, 4.0830078125, 4.34765625, 4.6123046875, 4.876953125, 5.1416015625, 5.40625, 5.6708984375, 5.935546875, 6.2001953125, 6.46484375, 6.7294921875, 6.994140625, 7.2587890625, 7.5234375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 20.0, 32.0, 49.0, 61.0, 90.0, 145.0, 224.0, 420.0, 921.0, 2547.0, 10319.0, 60975.0, 581395.0, 3052186.0, 424720.0, 47671.0, 8384.0, 2261.0, 819.0, 384.0, 219.0, 129.0, 88.0, 75.0, 41.0, 31.0, 21.0, 6.0, 10.0, 1.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.89794921875, -16.3427734375, -15.78759765625, -15.232421875, -14.67724609375, -14.1220703125, -13.56689453125, -13.01171875, -12.45654296875, -11.9013671875, -11.34619140625, -10.791015625, -10.23583984375, -9.6806640625, -9.12548828125, -8.5703125, -8.01513671875, -7.4599609375, -6.90478515625, -6.349609375, -5.79443359375, -5.2392578125, -4.68408203125, -4.12890625, -3.57373046875, -3.0185546875, -2.46337890625, -1.908203125, -1.35302734375, -0.7978515625, -0.24267578125, 0.3125, 0.86767578125, 1.4228515625, 1.97802734375, 2.533203125, 3.08837890625, 3.6435546875, 4.19873046875, 4.75390625, 5.30908203125, 5.8642578125, 6.41943359375, 6.974609375, 7.52978515625, 8.0849609375, 8.64013671875, 9.1953125, 9.75048828125, 10.3056640625, 10.86083984375, 11.416015625, 11.97119140625, 12.5263671875, 13.08154296875, 13.63671875, 14.19189453125, 14.7470703125, 15.30224609375, 15.857421875, 16.41259765625, 16.9677734375, 17.52294921875, 18.078125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 7.0, 14.0, 12.0, 20.0, 27.0, 44.0, 57.0, 73.0, 82.0, 79.0, 82.0, 98.0, 102.0, 81.0, 81.0, 32.0, 40.0, 33.0, 15.0, 14.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.496315002441406, -45.19872283935547, -43.90113067626953, -42.60354232788086, -41.30595016479492, -40.008358001708984, -38.71076583862305, -37.41317367553711, -36.11558532714844, -34.8179931640625, -33.52040100097656, -32.22281265258789, -30.925220489501953, -29.627628326416016, -28.330036163330078, -27.03244400024414, -25.734851837158203, -24.437259674072266, -23.13966941833496, -21.842077255249023, -20.54448699951172, -19.24689483642578, -17.949302673339844, -16.651710510253906, -15.354120254516602, -14.05652904510498, -12.75893783569336, -11.461345672607422, -10.1637544631958, -8.86616325378418, -7.5685715675354, -6.270979881286621, -4.973392486572266, -3.6758010387420654, -2.3782095909118652, -1.080618143081665, 0.21697330474853516, 1.5145645141601562, 2.8121562004089355, 4.109747886657715, 5.407339096069336, 6.704930305480957, 8.002521514892578, 9.300113677978516, 10.597704887390137, 11.895296096801758, 13.192888259887695, 14.490479469299316, 15.788070678710938, 17.085662841796875, 18.38325309753418, 19.680845260620117, 20.978435516357422, 22.27602767944336, 23.573619842529297, 24.871212005615234, 26.16880226135254, 27.466394424438477, 28.76398468017578, 30.06157684326172, 31.359169006347656, 32.656761169433594, 33.954349517822266, 35.2519416809082, 36.54953384399414]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 4.0, 9.0, 10.0, 7.0, 4.0, 20.0, 12.0, 20.0, 16.0, 28.0, 16.0, 27.0, 32.0, 32.0, 36.0, 40.0, 42.0, 39.0, 46.0, 34.0, 32.0, 43.0, 40.0, 39.0, 41.0, 42.0, 33.0, 41.0, 27.0, 26.0, 27.0, 25.0, 17.0, 16.0, 13.0, 12.0, 8.0, 5.0, 7.0, 5.0, 6.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.886066436767578, -27.024349212646484, -26.162633895874023, -25.30091667175293, -24.439199447631836, -23.577484130859375, -22.71576690673828, -21.854049682617188, -20.992334365844727, -20.130617141723633, -19.268901824951172, -18.407184600830078, -17.545467376708984, -16.683752059936523, -15.82203483581543, -14.960318565368652, -14.098601341247559, -13.236885070800781, -12.375167846679688, -11.51345157623291, -10.651735305786133, -9.790018081665039, -8.928301811218262, -8.066585540771484, -7.204868793487549, -6.343152046203613, -5.481435775756836, -4.6197190284729, -3.758002519607544, -2.8962860107421875, -2.034569263458252, -1.1728529930114746, -0.31113624572753906, 0.5505803227424622, 1.4122968912124634, 2.2740135192871094, 3.135730028152466, 3.9974465370178223, 4.859163284301758, 5.720879554748535, 6.582596302032471, 7.444313049316406, 8.306029319763184, 9.167745590209961, 10.029462814331055, 10.891179084777832, 11.75289535522461, 12.614612579345703, 13.47632884979248, 14.338045120239258, 15.199762344360352, 16.061477661132812, 16.923194885253906, 17.784912109375, 18.646629333496094, 19.508344650268555, 20.37006187438965, 21.231779098510742, 22.093494415283203, 22.955211639404297, 23.81692886352539, 24.67864418029785, 25.540361404418945, 26.402076721191406, 27.2637939453125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 7.0, 6.0, 14.0, 14.0, 20.0, 17.0, 23.0, 25.0, 22.0, 19.0, 23.0, 34.0, 32.0, 35.0, 34.0, 30.0, 37.0, 41.0, 43.0, 38.0, 41.0, 42.0, 38.0, 34.0, 31.0, 35.0, 41.0, 25.0, 21.0, 23.0, 9.0, 30.0, 19.0, 13.0, 7.0, 19.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.478607177734375, -2.39276123046875, -2.306915283203125, -2.2210693359375, -2.135223388671875, -2.04937744140625, -1.963531494140625, -1.877685546875, -1.791839599609375, -1.70599365234375, -1.620147705078125, -1.5343017578125, -1.448455810546875, -1.36260986328125, -1.276763916015625, -1.19091796875, -1.105072021484375, -1.01922607421875, -0.933380126953125, -0.8475341796875, -0.761688232421875, -0.67584228515625, -0.589996337890625, -0.504150390625, -0.418304443359375, -0.33245849609375, -0.246612548828125, -0.1607666015625, -0.074920654296875, 0.01092529296875, 0.096771240234375, 0.1826171875, 0.268463134765625, 0.35430908203125, 0.440155029296875, 0.5260009765625, 0.611846923828125, 0.69769287109375, 0.783538818359375, 0.869384765625, 0.955230712890625, 1.04107666015625, 1.126922607421875, 1.2127685546875, 1.298614501953125, 1.38446044921875, 1.470306396484375, 1.55615234375, 1.641998291015625, 1.72784423828125, 1.813690185546875, 1.8995361328125, 1.985382080078125, 2.07122802734375, 2.157073974609375, 2.242919921875, 2.328765869140625, 2.41461181640625, 2.500457763671875, 2.5863037109375, 2.672149658203125, 2.75799560546875, 2.843841552734375, 2.9296875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 27.0, 25.0, 41.0, 77.0, 116.0, 152.0, 234.0, 405.0, 553.0, 858.0, 1321.0, 1935.0, 2974.0, 4473.0, 7091.0, 10711.0, 16661.0, 24968.0, 38253.0, 57530.0, 83798.0, 115941.0, 145616.0, 148402.0, 120641.0, 88238.0, 60298.0, 40160.0, 26552.0, 17266.0, 11466.0, 7572.0, 4887.0, 3252.0, 2053.0, 1389.0, 920.0, 580.0, 390.0, 230.0, 171.0, 93.0, 71.0, 57.0, 38.0, 18.0, 18.0, 9.0, 10.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.369873046875, -0.3579673767089844, -0.34606170654296875, -0.3341560363769531, -0.3222503662109375, -0.3103446960449219, -0.29843902587890625, -0.2865333557128906, -0.274627685546875, -0.2627220153808594, -0.25081634521484375, -0.23891067504882812, -0.2270050048828125, -0.21509933471679688, -0.20319366455078125, -0.19128799438476562, -0.17938232421875, -0.16747665405273438, -0.15557098388671875, -0.14366531372070312, -0.1317596435546875, -0.11985397338867188, -0.10794830322265625, -0.09604263305664062, -0.084136962890625, -0.07223129272460938, -0.06032562255859375, -0.048419952392578125, -0.0365142822265625, -0.024608612060546875, -0.01270294189453125, -0.000797271728515625, 0.0111083984375, 0.023014068603515625, 0.03491973876953125, 0.046825408935546875, 0.0587310791015625, 0.07063674926757812, 0.08254241943359375, 0.09444808959960938, 0.106353759765625, 0.11825942993164062, 0.13016510009765625, 0.14207077026367188, 0.1539764404296875, 0.16588211059570312, 0.17778778076171875, 0.18969345092773438, 0.20159912109375, 0.21350479125976562, 0.22541046142578125, 0.23731613159179688, 0.2492218017578125, 0.2611274719238281, 0.27303314208984375, 0.2849388122558594, 0.296844482421875, 0.3087501525878906, 0.32065582275390625, 0.3325614929199219, 0.3444671630859375, 0.3563728332519531, 0.36827850341796875, 0.3801841735839844, 0.39208984375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 5.0, 1.0, 7.0, 7.0, 6.0, 14.0, 11.0, 15.0, 17.0, 21.0, 16.0, 23.0, 30.0, 28.0, 32.0, 28.0, 36.0, 37.0, 34.0, 38.0, 42.0, 36.0, 1065.0, 34.0, 34.0, 40.0, 48.0, 29.0, 29.0, 31.0, 28.0, 25.0, 34.0, 31.0, 13.0, 25.0, 18.0, 12.0, 9.0, 3.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.029296875, -1.96820068359375, -1.9071044921875, -1.84600830078125, -1.784912109375, -1.72381591796875, -1.6627197265625, -1.60162353515625, -1.54052734375, -1.47943115234375, -1.4183349609375, -1.35723876953125, -1.296142578125, -1.23504638671875, -1.1739501953125, -1.11285400390625, -1.0517578125, -0.99066162109375, -0.9295654296875, -0.86846923828125, -0.807373046875, -0.74627685546875, -0.6851806640625, -0.62408447265625, -0.56298828125, -0.50189208984375, -0.4407958984375, -0.37969970703125, -0.318603515625, -0.25750732421875, -0.1964111328125, -0.13531494140625, -0.07421875, -0.01312255859375, 0.0479736328125, 0.10906982421875, 0.170166015625, 0.23126220703125, 0.2923583984375, 0.35345458984375, 0.41455078125, 0.47564697265625, 0.5367431640625, 0.59783935546875, 0.658935546875, 0.72003173828125, 0.7811279296875, 0.84222412109375, 0.9033203125, 0.96441650390625, 1.0255126953125, 1.08660888671875, 1.147705078125, 1.20880126953125, 1.2698974609375, 1.33099365234375, 1.39208984375, 1.45318603515625, 1.5142822265625, 1.57537841796875, 1.636474609375, 1.69757080078125, 1.7586669921875, 1.81976318359375, 1.880859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 7.0, 8.0, 16.0, 29.0, 31.0, 59.0, 84.0, 118.0, 147.0, 226.0, 307.0, 492.0, 684.0, 943.0, 1439.0, 2188.0, 3270.0, 4841.0, 7301.0, 10975.0, 16750.0, 25171.0, 37759.0, 55531.0, 79866.0, 110052.0, 140382.0, 1190928.0, 121864.0, 90592.0, 64018.0, 43556.0, 28972.0, 19533.0, 12884.0, 8651.0, 5607.0, 3900.0, 2553.0, 1756.0, 1136.0, 767.0, 512.0, 382.0, 284.0, 155.0, 123.0, 92.0, 68.0, 34.0, 27.0, 18.0, 15.0, 12.0, 8.0, 5.0, 2.0, 2.0], "bins": [-0.2366943359375, -0.22956275939941406, -0.22243118286132812, -0.2152996063232422, -0.20816802978515625, -0.2010364532470703, -0.19390487670898438, -0.18677330017089844, -0.1796417236328125, -0.17251014709472656, -0.16537857055664062, -0.1582469940185547, -0.15111541748046875, -0.1439838409423828, -0.13685226440429688, -0.12972068786621094, -0.122589111328125, -0.11545753479003906, -0.10832595825195312, -0.10119438171386719, -0.09406280517578125, -0.08693122863769531, -0.07979965209960938, -0.07266807556152344, -0.0655364990234375, -0.05840492248535156, -0.051273345947265625, -0.04414176940917969, -0.03701019287109375, -0.029878616333007812, -0.022747039794921875, -0.015615463256835938, -0.00848388671875, -0.0013523101806640625, 0.005779266357421875, 0.012910842895507812, 0.02004241943359375, 0.027173995971679688, 0.034305572509765625, 0.04143714904785156, 0.0485687255859375, 0.05570030212402344, 0.06283187866210938, 0.06996345520019531, 0.07709503173828125, 0.08422660827636719, 0.09135818481445312, 0.09848976135253906, 0.105621337890625, 0.11275291442871094, 0.11988449096679688, 0.1270160675048828, 0.13414764404296875, 0.1412792205810547, 0.14841079711914062, 0.15554237365722656, 0.1626739501953125, 0.16980552673339844, 0.17693710327148438, 0.1840686798095703, 0.19120025634765625, 0.1983318328857422, 0.20546340942382812, 0.21259498596191406, 0.2197265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 12.0, 11.0, 11.0, 17.0, 14.0, 21.0, 20.0, 28.0, 56.0, 60.0, 81.0, 80.0, 88.0, 101.0, 80.0, 73.0, 48.0, 37.0, 31.0, 19.0, 16.0, 17.0, 16.0, 4.0, 6.0, 10.0, 2.0, 10.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003780364990234375, -0.003661513328552246, -0.003542661666870117, -0.0034238100051879883, -0.0033049583435058594, -0.0031861066818237305, -0.0030672550201416016, -0.0029484033584594727, -0.0028295516967773438, -0.002710700035095215, -0.002591848373413086, -0.002472996711730957, -0.002354145050048828, -0.0022352933883666992, -0.0021164417266845703, -0.0019975900650024414, -0.0018787384033203125, -0.0017598867416381836, -0.0016410350799560547, -0.0015221834182739258, -0.0014033317565917969, -0.001284480094909668, -0.001165628433227539, -0.0010467767715454102, -0.0009279251098632812, -0.0008090734481811523, -0.0006902217864990234, -0.0005713701248168945, -0.0004525184631347656, -0.0003336668014526367, -0.0002148151397705078, -9.59634780883789e-05, 2.288818359375e-05, 0.0001417398452758789, 0.0002605915069580078, 0.0003794431686401367, 0.0004982948303222656, 0.0006171464920043945, 0.0007359981536865234, 0.0008548498153686523, 0.0009737014770507812, 0.0010925531387329102, 0.001211404800415039, 0.001330256462097168, 0.0014491081237792969, 0.0015679597854614258, 0.0016868114471435547, 0.0018056631088256836, 0.0019245147705078125, 0.0020433664321899414, 0.0021622180938720703, 0.0022810697555541992, 0.002399921417236328, 0.002518773078918457, 0.002637624740600586, 0.002756476402282715, 0.0028753280639648438, 0.0029941797256469727, 0.0031130313873291016, 0.0032318830490112305, 0.0033507347106933594, 0.0034695863723754883, 0.003588438034057617, 0.003707289695739746, 0.003826141357421875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 8.0, 7.0, 7.0, 12.0, 7.0, 7.0, 12.0, 19.0, 21.0, 29.0, 17.0, 34.0, 76.0, 102.0, 175.0, 418.0, 1886.0, 19522.0, 894594.0, 124697.0, 5317.0, 859.0, 263.0, 144.0, 74.0, 54.0, 51.0, 27.0, 20.0, 16.0, 14.0, 16.0, 10.0, 8.0, 4.0, 3.0, 4.0, 4.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0716552734375, -0.06953239440917969, -0.06740951538085938, -0.06528663635253906, -0.06316375732421875, -0.06104087829589844, -0.058917999267578125, -0.05679512023925781, -0.0546722412109375, -0.05254936218261719, -0.050426483154296875, -0.04830360412597656, -0.04618072509765625, -0.04405784606933594, -0.041934967041015625, -0.03981208801269531, -0.037689208984375, -0.03556632995605469, -0.033443450927734375, -0.03132057189941406, -0.02919769287109375, -0.027074813842773438, -0.024951934814453125, -0.022829055786132812, -0.0207061767578125, -0.018583297729492188, -0.016460418701171875, -0.014337539672851562, -0.01221466064453125, -0.010091781616210938, -0.007968902587890625, -0.0058460235595703125, -0.00372314453125, -0.0016002655029296875, 0.000522613525390625, 0.0026454925537109375, 0.00476837158203125, 0.0068912506103515625, 0.009014129638671875, 0.011137008666992188, 0.0132598876953125, 0.015382766723632812, 0.017505645751953125, 0.019628524780273438, 0.02175140380859375, 0.023874282836914062, 0.025997161865234375, 0.028120040893554688, 0.030242919921875, 0.03236579895019531, 0.034488677978515625, 0.03661155700683594, 0.03873443603515625, 0.04085731506347656, 0.042980194091796875, 0.04510307312011719, 0.0472259521484375, 0.04934883117675781, 0.051471710205078125, 0.05359458923339844, 0.05571746826171875, 0.05784034729003906, 0.059963226318359375, 0.06208610534667969, 0.064208984375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 6.0, 8.0, 16.0, 34.0, 41.0, 72.0, 131.0, 174.0, 185.0, 124.0, 87.0, 38.0, 29.0, 21.0, 11.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005816508084535599, -0.005526387132704258, -0.00523626571521163, -0.004946144297719002, -0.004656023345887661, -0.00436590239405632, -0.004075780976563692, -0.0037856597919017076, -0.003495538607239723, -0.0032054174225777388, -0.0029152962379157543, -0.00262517505325377, -0.0023350538685917854, -0.002044932683929801, -0.0017548114992678165, -0.001464690314605832, -0.0011745691299438477, -0.0008844479452818632, -0.0005943267606198788, -0.0003042055759578943, -1.4084391295909882e-05, 0.00027603679336607456, 0.000566157978028059, 0.0008562791626900434, 0.001146400347352028, 0.0014365215320140123, 0.0017266427166759968, 0.0020167639013379812, 0.0023068850859999657, 0.00259700627066195, 0.0028871274553239346, 0.003177248639985919, 0.003467368893325329, 0.0037574900779873133, 0.004047611262649298, 0.004337732680141926, 0.004627853631973267, 0.004917974583804607, 0.0052080960012972355, 0.005498217418789864, 0.005788338370621204, 0.006078459322452545, 0.006368580739945173, 0.006658702157437801, 0.006948823109269142, 0.007238944061100483, 0.007529065478593111, 0.00781918689608574, 0.00810930784791708, 0.00839942879974842, 0.008689550682902336, 0.008979671634733677, 0.009269792586565018, 0.009559913538396358, 0.0098500344902277, 0.010140156373381615, 0.010430277325212955, 0.010720398277044296, 0.011010520160198212, 0.011300641112029552, 0.011590762063860893, 0.011880883015692234, 0.012171003967523575, 0.01246112585067749, 0.012751246802508831]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 9.0, 11.0, 14.0, 7.0, 9.0, 16.0, 22.0, 13.0, 24.0, 21.0, 27.0, 22.0, 26.0, 29.0, 26.0, 44.0, 37.0, 41.0, 37.0, 42.0, 40.0, 40.0, 36.0, 35.0, 24.0, 33.0, 20.0, 32.0, 32.0, 25.0, 22.0, 26.0, 24.0, 23.0, 11.0, 25.0, 12.0, 16.0, 7.0, 6.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.001846909523010254, -0.001790374517440796, -0.0017338395118713379, -0.0016773045063018799, -0.0016207695007324219, -0.0015642344951629639, -0.0015076994895935059, -0.0014511644840240479, -0.0013946294784545898, -0.0013380944728851318, -0.0012815594673156738, -0.0012250244617462158, -0.0011684894561767578, -0.0011119544506072998, -0.0010554194450378418, -0.0009988844394683838, -0.0009423494338989258, -0.0008858144283294678, -0.0008292794227600098, -0.0007727444171905518, -0.0007162094116210938, -0.0006596744060516357, -0.0006031394004821777, -0.0005466043949127197, -0.0004900693893432617, -0.0004335343837738037, -0.0003769993782043457, -0.0003204643726348877, -0.0002639293670654297, -0.00020739436149597168, -0.00015085935592651367, -9.432435035705566e-05, -3.7789344787597656e-05, 1.874566078186035e-05, 7.528066635131836e-05, 0.00013181567192077637, 0.00018835067749023438, 0.0002448856830596924, 0.0003014206886291504, 0.0003579556941986084, 0.0004144906997680664, 0.0004710257053375244, 0.0005275607109069824, 0.0005840957164764404, 0.0006406307220458984, 0.0006971657276153564, 0.0007537007331848145, 0.0008102357387542725, 0.0008667707443237305, 0.0009233057498931885, 0.0009798407554626465, 0.0010363757610321045, 0.0010929107666015625, 0.0011494457721710205, 0.0012059807777404785, 0.0012625157833099365, 0.0013190507888793945, 0.0013755857944488525, 0.0014321208000183105, 0.0014886558055877686, 0.0015451908111572266, 0.0016017258167266846, 0.0016582608222961426, 0.0017147958278656006, 0.0017713308334350586]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 5.0, 9.0, 7.0, 6.0, 14.0, 14.0, 20.0, 17.0, 23.0, 25.0, 22.0, 19.0, 23.0, 34.0, 32.0, 35.0, 34.0, 30.0, 37.0, 42.0, 42.0, 38.0, 41.0, 42.0, 38.0, 34.0, 30.0, 36.0, 41.0, 25.0, 21.0, 23.0, 9.0, 30.0, 19.0, 13.0, 7.0, 19.0, 7.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.478607177734375, -2.39276123046875, -2.306915283203125, -2.2210693359375, -2.135223388671875, -2.04937744140625, -1.963531494140625, -1.877685546875, -1.791839599609375, -1.70599365234375, -1.620147705078125, -1.5343017578125, -1.448455810546875, -1.36260986328125, -1.276763916015625, -1.19091796875, -1.105072021484375, -1.01922607421875, -0.933380126953125, -0.8475341796875, -0.761688232421875, -0.67584228515625, -0.589996337890625, -0.504150390625, -0.418304443359375, -0.33245849609375, -0.246612548828125, -0.1607666015625, -0.074920654296875, 0.01092529296875, 0.096771240234375, 0.1826171875, 0.268463134765625, 0.35430908203125, 0.440155029296875, 0.5260009765625, 0.611846923828125, 0.69769287109375, 0.783538818359375, 0.869384765625, 0.955230712890625, 1.04107666015625, 1.126922607421875, 1.2127685546875, 1.298614501953125, 1.38446044921875, 1.470306396484375, 1.55615234375, 1.641998291015625, 1.72784423828125, 1.813690185546875, 1.8995361328125, 1.985382080078125, 2.07122802734375, 2.157073974609375, 2.242919921875, 2.328765869140625, 2.41461181640625, 2.500457763671875, 2.5863037109375, 2.672149658203125, 2.75799560546875, 2.843841552734375, 2.9296875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 6.0, 13.0, 15.0, 23.0, 40.0, 49.0, 71.0, 114.0, 177.0, 231.0, 338.0, 480.0, 744.0, 1183.0, 1644.0, 2337.0, 3621.0, 5544.0, 10201.0, 21472.0, 55867.0, 183592.0, 529682.0, 141867.0, 46312.0, 18511.0, 9099.0, 5184.0, 3195.0, 2153.0, 1526.0, 1056.0, 703.0, 504.0, 299.0, 207.0, 182.0, 106.0, 61.0, 38.0, 29.0, 26.0, 18.0, 11.0, 7.0, 2.0, 6.0, 4.0, 2.0, 3.0], "bins": [-4.09765625, -3.985107421875, -3.87255859375, -3.760009765625, -3.6474609375, -3.534912109375, -3.42236328125, -3.309814453125, -3.197265625, -3.084716796875, -2.97216796875, -2.859619140625, -2.7470703125, -2.634521484375, -2.52197265625, -2.409423828125, -2.296875, -2.184326171875, -2.07177734375, -1.959228515625, -1.8466796875, -1.734130859375, -1.62158203125, -1.509033203125, -1.396484375, -1.283935546875, -1.17138671875, -1.058837890625, -0.9462890625, -0.833740234375, -0.72119140625, -0.608642578125, -0.49609375, -0.383544921875, -0.27099609375, -0.158447265625, -0.0458984375, 0.066650390625, 0.17919921875, 0.291748046875, 0.404296875, 0.516845703125, 0.62939453125, 0.741943359375, 0.8544921875, 0.967041015625, 1.07958984375, 1.192138671875, 1.3046875, 1.417236328125, 1.52978515625, 1.642333984375, 1.7548828125, 1.867431640625, 1.97998046875, 2.092529296875, 2.205078125, 2.317626953125, 2.43017578125, 2.542724609375, 2.6552734375, 2.767822265625, 2.88037109375, 2.992919921875, 3.10546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 5.0, 3.0, 6.0, 6.0, 7.0, 9.0, 10.0, 18.0, 13.0, 12.0, 21.0, 24.0, 19.0, 22.0, 33.0, 41.0, 44.0, 53.0, 47.0, 68.0, 87.0, 224.0, 1521.0, 211.0, 102.0, 67.0, 40.0, 51.0, 34.0, 40.0, 31.0, 32.0, 28.0, 21.0, 21.0, 14.0, 14.0, 12.0, 14.0, 7.0, 3.0, 8.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.9375, -8.634521484375, -8.33154296875, -8.028564453125, -7.7255859375, -7.422607421875, -7.11962890625, -6.816650390625, -6.513671875, -6.210693359375, -5.90771484375, -5.604736328125, -5.3017578125, -4.998779296875, -4.69580078125, -4.392822265625, -4.08984375, -3.786865234375, -3.48388671875, -3.180908203125, -2.8779296875, -2.574951171875, -2.27197265625, -1.968994140625, -1.666015625, -1.363037109375, -1.06005859375, -0.757080078125, -0.4541015625, -0.151123046875, 0.15185546875, 0.454833984375, 0.7578125, 1.060791015625, 1.36376953125, 1.666748046875, 1.9697265625, 2.272705078125, 2.57568359375, 2.878662109375, 3.181640625, 3.484619140625, 3.78759765625, 4.090576171875, 4.3935546875, 4.696533203125, 4.99951171875, 5.302490234375, 5.60546875, 5.908447265625, 6.21142578125, 6.514404296875, 6.8173828125, 7.120361328125, 7.42333984375, 7.726318359375, 8.029296875, 8.332275390625, 8.63525390625, 8.938232421875, 9.2412109375, 9.544189453125, 9.84716796875, 10.150146484375, 10.453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 15.0, 20.0, 16.0, 22.0, 28.0, 44.0, 68.0, 63.0, 114.0, 197.0, 372.0, 1004.0, 5578.0, 71125.0, 3000096.0, 59740.0, 5236.0, 946.0, 365.0, 187.0, 135.0, 86.0, 51.0, 37.0, 29.0, 29.0, 23.0, 15.0, 21.0, 8.0, 3.0, 7.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.46533203125, -16.8056640625, -16.14599609375, -15.486328125, -14.82666015625, -14.1669921875, -13.50732421875, -12.84765625, -12.18798828125, -11.5283203125, -10.86865234375, -10.208984375, -9.54931640625, -8.8896484375, -8.22998046875, -7.5703125, -6.91064453125, -6.2509765625, -5.59130859375, -4.931640625, -4.27197265625, -3.6123046875, -2.95263671875, -2.29296875, -1.63330078125, -0.9736328125, -0.31396484375, 0.345703125, 1.00537109375, 1.6650390625, 2.32470703125, 2.984375, 3.64404296875, 4.3037109375, 4.96337890625, 5.623046875, 6.28271484375, 6.9423828125, 7.60205078125, 8.26171875, 8.92138671875, 9.5810546875, 10.24072265625, 10.900390625, 11.56005859375, 12.2197265625, 12.87939453125, 13.5390625, 14.19873046875, 14.8583984375, 15.51806640625, 16.177734375, 16.83740234375, 17.4970703125, 18.15673828125, 18.81640625, 19.47607421875, 20.1357421875, 20.79541015625, 21.455078125, 22.11474609375, 22.7744140625, 23.43408203125, 24.09375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [11.0, 216.0, 627.0, 151.0, 9.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60375452041626, -4.5172119140625, -1.430668830871582, 1.6558737754821777, 4.742416858673096, 7.828959941864014, 10.915502548217773, 14.002046585083008, 17.08858871459961, 20.17513084411621, 23.261674880981445, 26.348217010498047, 29.43476104736328, 32.52130126953125, 35.607845306396484, 38.69438934326172, 41.78092956542969, 44.86747360229492, 47.95401382446289, 51.040557861328125, 54.12710189819336, 57.213645935058594, 60.30018615722656, 63.3867301940918, 66.47327423095703, 69.559814453125, 72.6463623046875, 75.73290252685547, 78.81944274902344, 81.90599060058594, 84.9925308227539, 88.07907104492188, 91.16561126708984, 94.25215148925781, 97.33869934082031, 100.42523956298828, 103.51177978515625, 106.59832763671875, 109.68486785888672, 112.77140808105469, 115.85795593261719, 118.94449615478516, 122.03104400634766, 125.11758422851562, 128.20413208007812, 131.29066467285156, 134.37721252441406, 137.46376037597656, 140.55029296875, 143.6368408203125, 146.72337341308594, 149.80992126464844, 152.89646911621094, 155.98300170898438, 159.06954956054688, 162.15609741210938, 165.24264526367188, 168.32919311523438, 171.4157257080078, 174.5022735595703, 177.5888214111328, 180.67535400390625, 183.76190185546875, 186.84844970703125, 189.9349822998047]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 6.0, 2.0, 6.0, 3.0, 8.0, 10.0, 10.0, 6.0, 10.0, 12.0, 20.0, 20.0, 28.0, 20.0, 26.0, 26.0, 29.0, 35.0, 24.0, 32.0, 47.0, 34.0, 31.0, 44.0, 37.0, 39.0, 30.0, 43.0, 26.0, 42.0, 34.0, 30.0, 23.0, 28.0, 22.0, 30.0, 18.0, 17.0, 22.0, 9.0, 11.0, 3.0, 8.0, 9.0, 8.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-29.087255477905273, -28.213390350341797, -27.339527130126953, -26.465662002563477, -25.591796875, -24.717933654785156, -23.84406852722168, -22.970203399658203, -22.09634017944336, -21.222475051879883, -20.34861183166504, -19.474746704101562, -18.600881576538086, -17.72701644897461, -16.853153228759766, -15.979288101196289, -15.105422973632812, -14.231558799743652, -13.357693672180176, -12.483829498291016, -11.609964370727539, -10.736100196838379, -9.862236022949219, -8.988370895385742, -8.114506721496582, -7.240642070770264, -6.366777420043945, -5.492913246154785, -4.619048595428467, -3.7451839447021484, -2.8713197708129883, -1.99745512008667, -1.1235923767089844, -0.24972784519195557, 0.6241366863250732, 1.4980010986328125, 2.371865749359131, 3.245730400085449, 4.119594573974609, 4.993459224700928, 5.867323875427246, 6.7411885261535645, 7.615053176879883, 8.488917350769043, 9.362781524658203, 10.23664665222168, 11.11051082611084, 11.984375, 12.858240127563477, 13.732104301452637, 14.605969429016113, 15.479833602905273, 16.35369873046875, 17.227561950683594, 18.10142707824707, 18.975292205810547, 19.84915542602539, 20.723020553588867, 21.59688377380371, 22.470748901367188, 23.344614028930664, 24.21847915649414, 25.092342376708984, 25.96620750427246, 26.840072631835938]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 2.0, 5.0, 6.0, 12.0, 5.0, 12.0, 12.0, 19.0, 17.0, 18.0, 14.0, 28.0, 29.0, 29.0, 30.0, 31.0, 36.0, 29.0, 37.0, 38.0, 45.0, 39.0, 44.0, 38.0, 37.0, 42.0, 35.0, 32.0, 38.0, 30.0, 33.0, 26.0, 19.0, 19.0, 18.0, 18.0, 12.0, 15.0, 9.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.818359375, -2.72723388671875, -2.6361083984375, -2.54498291015625, -2.453857421875, -2.36273193359375, -2.2716064453125, -2.18048095703125, -2.08935546875, -1.99822998046875, -1.9071044921875, -1.81597900390625, -1.724853515625, -1.63372802734375, -1.5426025390625, -1.45147705078125, -1.3603515625, -1.26922607421875, -1.1781005859375, -1.08697509765625, -0.995849609375, -0.90472412109375, -0.8135986328125, -0.72247314453125, -0.63134765625, -0.54022216796875, -0.4490966796875, -0.35797119140625, -0.266845703125, -0.17572021484375, -0.0845947265625, 0.00653076171875, 0.09765625, 0.18878173828125, 0.2799072265625, 0.37103271484375, 0.462158203125, 0.55328369140625, 0.6444091796875, 0.73553466796875, 0.82666015625, 0.91778564453125, 1.0089111328125, 1.10003662109375, 1.191162109375, 1.28228759765625, 1.3734130859375, 1.46453857421875, 1.5556640625, 1.64678955078125, 1.7379150390625, 1.82904052734375, 1.920166015625, 2.01129150390625, 2.1024169921875, 2.19354248046875, 2.28466796875, 2.37579345703125, 2.4669189453125, 2.55804443359375, 2.649169921875, 2.74029541015625, 2.8314208984375, 2.92254638671875, 3.013671875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 11.0, 15.0, 17.0, 34.0, 52.0, 65.0, 94.0, 143.0, 218.0, 292.0, 510.0, 839.0, 1467.0, 2590.0, 4704.0, 9118.0, 18467.0, 39413.0, 88912.0, 233232.0, 739475.0, 1584971.0, 964373.0, 302348.0, 110082.0, 47081.0, 22250.0, 10821.0, 5591.0, 2883.0, 1583.0, 909.0, 563.0, 381.0, 242.0, 183.0, 107.0, 71.0, 59.0, 44.0, 17.0, 9.0, 15.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.5234375, -4.384765625, -4.24609375, -4.107421875, -3.96875, -3.830078125, -3.69140625, -3.552734375, -3.4140625, -3.275390625, -3.13671875, -2.998046875, -2.859375, -2.720703125, -2.58203125, -2.443359375, -2.3046875, -2.166015625, -2.02734375, -1.888671875, -1.75, -1.611328125, -1.47265625, -1.333984375, -1.1953125, -1.056640625, -0.91796875, -0.779296875, -0.640625, -0.501953125, -0.36328125, -0.224609375, -0.0859375, 0.052734375, 0.19140625, 0.330078125, 0.46875, 0.607421875, 0.74609375, 0.884765625, 1.0234375, 1.162109375, 1.30078125, 1.439453125, 1.578125, 1.716796875, 1.85546875, 1.994140625, 2.1328125, 2.271484375, 2.41015625, 2.548828125, 2.6875, 2.826171875, 2.96484375, 3.103515625, 3.2421875, 3.380859375, 3.51953125, 3.658203125, 3.796875, 3.935546875, 4.07421875, 4.212890625, 4.3515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 11.0, 16.0, 24.0, 41.0, 84.0, 124.0, 230.0, 294.0, 485.0, 669.0, 727.0, 468.0, 322.0, 212.0, 148.0, 81.0, 50.0, 29.0, 20.0, 9.0, 9.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.8560791015625, -10.438720703125, -10.0213623046875, -9.60400390625, -9.1866455078125, -8.769287109375, -8.3519287109375, -7.9345703125, -7.5172119140625, -7.099853515625, -6.6824951171875, -6.26513671875, -5.8477783203125, -5.430419921875, -5.0130615234375, -4.595703125, -4.1783447265625, -3.760986328125, -3.3436279296875, -2.92626953125, -2.5089111328125, -2.091552734375, -1.6741943359375, -1.2568359375, -0.8394775390625, -0.422119140625, -0.0047607421875, 0.41259765625, 0.8299560546875, 1.247314453125, 1.6646728515625, 2.08203125, 2.4993896484375, 2.916748046875, 3.3341064453125, 3.75146484375, 4.1688232421875, 4.586181640625, 5.0035400390625, 5.4208984375, 5.8382568359375, 6.255615234375, 6.6729736328125, 7.09033203125, 7.5076904296875, 7.925048828125, 8.3424072265625, 8.759765625, 9.1771240234375, 9.594482421875, 10.0118408203125, 10.42919921875, 10.8465576171875, 11.263916015625, 11.6812744140625, 12.0986328125, 12.5159912109375, 12.933349609375, 13.3507080078125, 13.76806640625, 14.1854248046875, 14.602783203125, 15.0201416015625, 15.4375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 13.0, 16.0, 23.0, 32.0, 41.0, 67.0, 117.0, 193.0, 380.0, 932.0, 2356.0, 8261.0, 43941.0, 366791.0, 2934160.0, 741545.0, 76915.0, 12966.0, 3232.0, 1154.0, 527.0, 258.0, 99.0, 83.0, 55.0, 33.0, 30.0, 19.0, 15.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.4375, -16.9033203125, -16.369140625, -15.8349609375, -15.30078125, -14.7666015625, -14.232421875, -13.6982421875, -13.1640625, -12.6298828125, -12.095703125, -11.5615234375, -11.02734375, -10.4931640625, -9.958984375, -9.4248046875, -8.890625, -8.3564453125, -7.822265625, -7.2880859375, -6.75390625, -6.2197265625, -5.685546875, -5.1513671875, -4.6171875, -4.0830078125, -3.548828125, -3.0146484375, -2.48046875, -1.9462890625, -1.412109375, -0.8779296875, -0.34375, 0.1904296875, 0.724609375, 1.2587890625, 1.79296875, 2.3271484375, 2.861328125, 3.3955078125, 3.9296875, 4.4638671875, 4.998046875, 5.5322265625, 6.06640625, 6.6005859375, 7.134765625, 7.6689453125, 8.203125, 8.7373046875, 9.271484375, 9.8056640625, 10.33984375, 10.8740234375, 11.408203125, 11.9423828125, 12.4765625, 13.0107421875, 13.544921875, 14.0791015625, 14.61328125, 15.1474609375, 15.681640625, 16.2158203125, 16.75]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 12.0, 20.0, 37.0, 95.0, 135.0, 208.0, 188.0, 131.0, 95.0, 50.0, 25.0, 11.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-132.37078857421875, -129.71942138671875, -127.06804656982422, -124.41667938232422, -121.76530456542969, -119.11393737792969, -116.46257019042969, -113.81119537353516, -111.15982818603516, -108.50846099853516, -105.85708618164062, -103.20571899414062, -100.5543441772461, -97.9029769897461, -95.25160217285156, -92.60023498535156, -89.94886779785156, -87.29750061035156, -84.64612579345703, -81.99475860595703, -79.3433837890625, -76.6920166015625, -74.0406494140625, -71.38927459716797, -68.73789978027344, -66.08653259277344, -63.435157775878906, -60.783790588378906, -58.13241958618164, -55.481048583984375, -52.82967758178711, -50.178306579589844, -47.526939392089844, -44.87556838989258, -42.22419738769531, -39.57283020019531, -36.92145919799805, -34.27008819580078, -31.618717193603516, -28.967348098754883, -26.315977096557617, -23.66460609436035, -21.01323699951172, -18.361865997314453, -15.710495948791504, -13.059125900268555, -10.407754898071289, -7.756385803222656, -5.105014801025391, -2.4536445140838623, 0.19772577285766602, 2.8490962982177734, 5.500466346740723, 8.151836395263672, 10.803207397460938, 13.45457649230957, 16.105947494506836, 18.7573184967041, 21.408687591552734, 24.06005859375, 26.711429595947266, 29.3627986907959, 32.01416778564453, 34.6655387878418, 37.31690979003906]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 4.0, 3.0, 11.0, 6.0, 6.0, 11.0, 8.0, 16.0, 17.0, 25.0, 23.0, 24.0, 30.0, 22.0, 25.0, 30.0, 30.0, 31.0, 29.0, 33.0, 32.0, 35.0, 39.0, 33.0, 37.0, 37.0, 41.0, 39.0, 38.0, 39.0, 38.0, 22.0, 30.0, 15.0, 14.0, 21.0, 13.0, 13.0, 11.0, 11.0, 11.0, 8.0, 5.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0], "bins": [-25.298538208007812, -24.53382682800293, -23.769115447998047, -23.004404067993164, -22.23969268798828, -21.4749813079834, -20.710269927978516, -19.945560455322266, -19.18084716796875, -18.416135787963867, -17.651424407958984, -16.8867130279541, -16.12200164794922, -15.357290267944336, -14.59257984161377, -13.827868461608887, -13.06315803527832, -12.298446655273438, -11.533735275268555, -10.769023895263672, -10.004312515258789, -9.239601135253906, -8.47489070892334, -7.710179328918457, -6.945467948913574, -6.180756568908691, -5.416045188903809, -4.651334285736084, -3.886622905731201, -3.1219115257263184, -2.3572006225585938, -1.592489242553711, -0.8277778625488281, -0.06306660175323486, 0.7016446590423584, 1.466355800628662, 2.231067180633545, 2.9957785606384277, 3.7604894638061523, 4.525200843811035, 5.289912223815918, 6.054623603820801, 6.819334983825684, 7.584045886993408, 8.348756790161133, 9.113468170166016, 9.878179550170898, 10.642890930175781, 11.407602310180664, 12.172313690185547, 12.93702507019043, 13.701736450195312, 14.466447830200195, 15.231159210205078, 15.995869636535645, 16.760581970214844, 17.525291442871094, 18.290002822875977, 19.05471420288086, 19.819425582885742, 20.584136962890625, 21.348848342895508, 22.11355972290039, 22.87826919555664, 23.642982482910156]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 4.0, 5.0, 12.0, 15.0, 13.0, 10.0, 27.0, 13.0, 25.0, 21.0, 30.0, 24.0, 43.0, 26.0, 38.0, 37.0, 36.0, 47.0, 48.0, 45.0, 52.0, 42.0, 39.0, 43.0, 30.0, 30.0, 41.0, 24.0, 31.0, 18.0, 16.0, 13.0, 16.0, 20.0, 11.0, 2.0, 7.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -3.0028076171875, -2.902099609375, -2.8013916015625, -2.70068359375, -2.5999755859375, -2.499267578125, -2.3985595703125, -2.2978515625, -2.1971435546875, -2.096435546875, -1.9957275390625, -1.89501953125, -1.7943115234375, -1.693603515625, -1.5928955078125, -1.4921875, -1.3914794921875, -1.290771484375, -1.1900634765625, -1.08935546875, -0.9886474609375, -0.887939453125, -0.7872314453125, -0.6865234375, -0.5858154296875, -0.485107421875, -0.3843994140625, -0.28369140625, -0.1829833984375, -0.082275390625, 0.0184326171875, 0.119140625, 0.2198486328125, 0.320556640625, 0.4212646484375, 0.52197265625, 0.6226806640625, 0.723388671875, 0.8240966796875, 0.9248046875, 1.0255126953125, 1.126220703125, 1.2269287109375, 1.32763671875, 1.4283447265625, 1.529052734375, 1.6297607421875, 1.73046875, 1.8311767578125, 1.931884765625, 2.0325927734375, 2.13330078125, 2.2340087890625, 2.334716796875, 2.4354248046875, 2.5361328125, 2.6368408203125, 2.737548828125, 2.8382568359375, 2.93896484375, 3.0396728515625, 3.140380859375, 3.2410888671875, 3.341796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 6.0, 18.0, 19.0, 37.0, 71.0, 124.0, 199.0, 331.0, 550.0, 1015.0, 1633.0, 2772.0, 4713.0, 8052.0, 13573.0, 23122.0, 39066.0, 65175.0, 104511.0, 156533.0, 193495.0, 159760.0, 107306.0, 67516.0, 40533.0, 24023.0, 14157.0, 8403.0, 4840.0, 2870.0, 1730.0, 998.0, 570.0, 346.0, 185.0, 131.0, 72.0, 42.0, 18.0, 11.0, 18.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54443359375, -0.5271682739257812, -0.5099029541015625, -0.49263763427734375, -0.475372314453125, -0.45810699462890625, -0.4408416748046875, -0.42357635498046875, -0.40631103515625, -0.38904571533203125, -0.3717803955078125, -0.35451507568359375, -0.337249755859375, -0.31998443603515625, -0.3027191162109375, -0.28545379638671875, -0.2681884765625, -0.25092315673828125, -0.2336578369140625, -0.21639251708984375, -0.199127197265625, -0.18186187744140625, -0.1645965576171875, -0.14733123779296875, -0.13006591796875, -0.11280059814453125, -0.0955352783203125, -0.07826995849609375, -0.061004638671875, -0.04373931884765625, -0.0264739990234375, -0.00920867919921875, 0.008056640625, 0.02532196044921875, 0.0425872802734375, 0.05985260009765625, 0.077117919921875, 0.09438323974609375, 0.1116485595703125, 0.12891387939453125, 0.14617919921875, 0.16344451904296875, 0.1807098388671875, 0.19797515869140625, 0.215240478515625, 0.23250579833984375, 0.2497711181640625, 0.26703643798828125, 0.2843017578125, 0.30156707763671875, 0.3188323974609375, 0.33609771728515625, 0.353363037109375, 0.37062835693359375, 0.3878936767578125, 0.40515899658203125, 0.42242431640625, 0.43968963623046875, 0.4569549560546875, 0.47422027587890625, 0.491485595703125, 0.5087509155273438, 0.5260162353515625, 0.5432815551757812, 0.560546875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 5.0, 6.0, 14.0, 15.0, 9.0, 12.0, 13.0, 11.0, 14.0, 13.0, 25.0, 20.0, 23.0, 25.0, 25.0, 25.0, 29.0, 36.0, 32.0, 31.0, 39.0, 32.0, 32.0, 1050.0, 29.0, 42.0, 36.0, 37.0, 14.0, 24.0, 32.0, 33.0, 15.0, 31.0, 33.0, 20.0, 23.0, 17.0, 16.0, 13.0, 13.0, 8.0, 6.0, 8.0, 8.0, 9.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.7587890625, -1.7045440673828125, -1.650299072265625, -1.5960540771484375, -1.54180908203125, -1.4875640869140625, -1.433319091796875, -1.3790740966796875, -1.3248291015625, -1.2705841064453125, -1.216339111328125, -1.1620941162109375, -1.10784912109375, -1.0536041259765625, -0.999359130859375, -0.9451141357421875, -0.890869140625, -0.8366241455078125, -0.782379150390625, -0.7281341552734375, -0.67388916015625, -0.6196441650390625, -0.565399169921875, -0.5111541748046875, -0.4569091796875, -0.4026641845703125, -0.348419189453125, -0.2941741943359375, -0.23992919921875, -0.1856842041015625, -0.131439208984375, -0.0771942138671875, -0.02294921875, 0.0312957763671875, 0.085540771484375, 0.1397857666015625, 0.19403076171875, 0.2482757568359375, 0.302520751953125, 0.3567657470703125, 0.4110107421875, 0.4652557373046875, 0.519500732421875, 0.5737457275390625, 0.62799072265625, 0.6822357177734375, 0.736480712890625, 0.7907257080078125, 0.844970703125, 0.8992156982421875, 0.953460693359375, 1.0077056884765625, 1.06195068359375, 1.1161956787109375, 1.170440673828125, 1.2246856689453125, 1.2789306640625, 1.3331756591796875, 1.387420654296875, 1.4416656494140625, 1.49591064453125, 1.5501556396484375, 1.604400634765625, 1.6586456298828125, 1.712890625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 9.0, 27.0, 30.0, 54.0, 79.0, 110.0, 180.0, 277.0, 417.0, 655.0, 1118.0, 1709.0, 2812.0, 4668.0, 7579.0, 12983.0, 21305.0, 35122.0, 57701.0, 90503.0, 136565.0, 1209971.0, 179608.0, 123816.0, 80234.0, 50953.0, 31040.0, 18868.0, 11290.0, 6750.0, 4023.0, 2476.0, 1516.0, 997.0, 621.0, 403.0, 218.0, 160.0, 105.0, 70.0, 40.0, 20.0, 16.0, 16.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.3001518249511719, -0.29073333740234375, -0.2813148498535156, -0.2718963623046875, -0.2624778747558594, -0.25305938720703125, -0.24364089965820312, -0.234222412109375, -0.22480392456054688, -0.21538543701171875, -0.20596694946289062, -0.1965484619140625, -0.18712997436523438, -0.17771148681640625, -0.16829299926757812, -0.15887451171875, -0.14945602416992188, -0.14003753662109375, -0.13061904907226562, -0.1212005615234375, -0.11178207397460938, -0.10236358642578125, -0.09294509887695312, -0.083526611328125, -0.07410812377929688, -0.06468963623046875, -0.055271148681640625, -0.0458526611328125, -0.036434173583984375, -0.02701568603515625, -0.017597198486328125, -0.0081787109375, 0.001239776611328125, 0.01065826416015625, 0.020076751708984375, 0.0294952392578125, 0.038913726806640625, 0.04833221435546875, 0.057750701904296875, 0.067169189453125, 0.07658767700195312, 0.08600616455078125, 0.09542465209960938, 0.1048431396484375, 0.11426162719726562, 0.12368011474609375, 0.13309860229492188, 0.14251708984375, 0.15193557739257812, 0.16135406494140625, 0.17077255249023438, 0.1801910400390625, 0.18960952758789062, 0.19902801513671875, 0.20844650268554688, 0.217864990234375, 0.22728347778320312, 0.23670196533203125, 0.24612045288085938, 0.2555389404296875, 0.2649574279785156, 0.27437591552734375, 0.2837944030761719, 0.293212890625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 7.0, 11.0, 18.0, 40.0, 58.0, 111.0, 214.0, 230.0, 98.0, 49.0, 31.0, 24.0, 18.0, 14.0, 9.0, 11.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01406097412109375, -0.013608694076538086, -0.013156414031982422, -0.012704133987426758, -0.012251853942871094, -0.01179957389831543, -0.011347293853759766, -0.010895013809204102, -0.010442733764648438, -0.009990453720092773, -0.00953817367553711, -0.009085893630981445, -0.008633613586425781, -0.008181333541870117, -0.007729053497314453, -0.007276773452758789, -0.006824493408203125, -0.006372213363647461, -0.005919933319091797, -0.005467653274536133, -0.005015373229980469, -0.004563093185424805, -0.004110813140869141, -0.0036585330963134766, -0.0032062530517578125, -0.0027539730072021484, -0.0023016929626464844, -0.0018494129180908203, -0.0013971328735351562, -0.0009448528289794922, -0.0004925727844238281, -4.029273986816406e-05, 0.0004119873046875, 0.0008642673492431641, 0.0013165473937988281, 0.0017688274383544922, 0.0022211074829101562, 0.0026733875274658203, 0.0031256675720214844, 0.0035779476165771484, 0.0040302276611328125, 0.0044825077056884766, 0.004934787750244141, 0.005387067794799805, 0.005839347839355469, 0.006291627883911133, 0.006743907928466797, 0.007196187973022461, 0.007648468017578125, 0.008100748062133789, 0.008553028106689453, 0.009005308151245117, 0.009457588195800781, 0.009909868240356445, 0.01036214828491211, 0.010814428329467773, 0.011266708374023438, 0.011718988418579102, 0.012171268463134766, 0.01262354850769043, 0.013075828552246094, 0.013528108596801758, 0.013980388641357422, 0.014432668685913086, 0.01488494873046875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 5.0, 6.0, 13.0, 12.0, 24.0, 27.0, 31.0, 43.0, 64.0, 129.0, 262.0, 2202.0, 901692.0, 142167.0, 1281.0, 239.0, 129.0, 63.0, 50.0, 20.0, 21.0, 17.0, 9.0, 7.0, 4.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2391357421875, -0.23186683654785156, -0.22459793090820312, -0.2173290252685547, -0.21006011962890625, -0.2027912139892578, -0.19552230834960938, -0.18825340270996094, -0.1809844970703125, -0.17371559143066406, -0.16644668579101562, -0.1591777801513672, -0.15190887451171875, -0.1446399688720703, -0.13737106323242188, -0.13010215759277344, -0.122833251953125, -0.11556434631347656, -0.10829544067382812, -0.10102653503417969, -0.09375762939453125, -0.08648872375488281, -0.07921981811523438, -0.07195091247558594, -0.0646820068359375, -0.05741310119628906, -0.050144195556640625, -0.04287528991699219, -0.03560638427734375, -0.028337478637695312, -0.021068572998046875, -0.013799667358398438, -0.00653076171875, 0.0007381439208984375, 0.008007049560546875, 0.015275955200195312, 0.02254486083984375, 0.029813766479492188, 0.037082672119140625, 0.04435157775878906, 0.0516204833984375, 0.05888938903808594, 0.06615829467773438, 0.07342720031738281, 0.08069610595703125, 0.08796501159667969, 0.09523391723632812, 0.10250282287597656, 0.109771728515625, 0.11704063415527344, 0.12430953979492188, 0.1315784454345703, 0.13884735107421875, 0.1461162567138672, 0.15338516235351562, 0.16065406799316406, 0.1679229736328125, 0.17519187927246094, 0.18246078491210938, 0.1897296905517578, 0.19699859619140625, 0.2042675018310547, 0.21153640747070312, 0.21880531311035156, 0.22607421875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 11.0, 120.0, 797.0, 82.0, 6.0, 1.0, 0.0, 1.0], "bins": [-0.19585345685482025, -0.19250300526618958, -0.1891525387763977, -0.18580208718776703, -0.18245162069797516, -0.17910116910934448, -0.1757507026195526, -0.17240025103092194, -0.16904978454113007, -0.1656993329524994, -0.16234886646270752, -0.15899841487407684, -0.15564794838428497, -0.1522974967956543, -0.14894703030586243, -0.14559657871723175, -0.14224611222743988, -0.1388956606388092, -0.13554519414901733, -0.13219474256038666, -0.1288442760705948, -0.1254938244819641, -0.12214335799217224, -0.11879289895296097, -0.11544244736433029, -0.11209198832511902, -0.10874152928590775, -0.10539107024669647, -0.1020406112074852, -0.09869015216827393, -0.09533969312906265, -0.09198923408985138, -0.0886387750506401, -0.08528831601142883, -0.08193785697221756, -0.07858739793300629, -0.07523693889379501, -0.07188647985458374, -0.06853602081537247, -0.0651855617761612, -0.06183510273694992, -0.05848464369773865, -0.055134184658527374, -0.0517837256193161, -0.04843326658010483, -0.045082807540893555, -0.04173234850168228, -0.03838188946247101, -0.035031430423259735, -0.03168097138404846, -0.02833051234483719, -0.024980053305625916, -0.021629594266414642, -0.01827913708984852, -0.014928678050637245, -0.011578219011425972, -0.008227761834859848, -0.004877302795648575, -0.001526844222098589, 0.001823614351451397, 0.00517407339066267, 0.008524531498551369, 0.011874990537762642, 0.015225449576973915, 0.01857590861618519]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 8.0, 10.0, 6.0, 13.0, 11.0, 15.0, 12.0, 13.0, 21.0, 29.0, 25.0, 31.0, 37.0, 38.0, 32.0, 38.0, 39.0, 38.0, 43.0, 38.0, 43.0, 39.0, 44.0, 41.0, 34.0, 50.0, 31.0, 32.0, 24.0, 18.0, 22.0, 19.0, 24.0, 11.0, 13.0, 10.0, 11.0, 7.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010565042495727539, -0.010221204720437527, -0.009877366945147514, -0.009533529169857502, -0.00918969139456749, -0.008845853619277477, -0.008502015843987465, -0.008158178068697453, -0.00781434029340744, -0.007470502518117428, -0.0071266647428274155, -0.006782826967537403, -0.006438989192247391, -0.006095151416957378, -0.005751313641667366, -0.005407475866377354, -0.005063638091087341, -0.004719800315797329, -0.004375962540507317, -0.004032124765217304, -0.003688286989927292, -0.0033444492146372795, -0.003000611439347267, -0.002656773664057255, -0.0023129358887672424, -0.00196909811347723, -0.0016252603381872177, -0.0012814225628972054, -0.000937584787607193, -0.0005937470123171806, -0.0002499092370271683, 9.392853826284409e-05, 0.00043776631355285645, 0.0007816040888428688, 0.0011254418641328812, 0.0014692796394228935, 0.0018131174147129059, 0.0021569551900029182, 0.0025007929652929306, 0.002844630740582943, 0.0031884685158729553, 0.0035323062911629677, 0.00387614406645298, 0.004219981841742992, 0.004563819617033005, 0.004907657392323017, 0.0052514951676130295, 0.005595332942903042, 0.005939170718193054, 0.0062830084934830666, 0.006626846268773079, 0.006970684044063091, 0.007314521819353104, 0.007658359594643116, 0.008002197369933128, 0.00834603514522314, 0.008689872920513153, 0.009033710695803165, 0.009377548471093178, 0.00972138624638319, 0.010065224021673203, 0.010409061796963215, 0.010752899572253227, 0.01109673734754324, 0.011440575122833252]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 4.0, 5.0, 12.0, 15.0, 13.0, 10.0, 27.0, 13.0, 25.0, 21.0, 30.0, 24.0, 43.0, 26.0, 38.0, 37.0, 36.0, 47.0, 48.0, 45.0, 52.0, 42.0, 39.0, 43.0, 30.0, 30.0, 41.0, 24.0, 31.0, 18.0, 16.0, 13.0, 16.0, 20.0, 11.0, 2.0, 6.0, 8.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.103515625, -3.0028076171875, -2.902099609375, -2.8013916015625, -2.70068359375, -2.5999755859375, -2.499267578125, -2.3985595703125, -2.2978515625, -2.1971435546875, -2.096435546875, -1.9957275390625, -1.89501953125, -1.7943115234375, -1.693603515625, -1.5928955078125, -1.4921875, -1.3914794921875, -1.290771484375, -1.1900634765625, -1.08935546875, -0.9886474609375, -0.887939453125, -0.7872314453125, -0.6865234375, -0.5858154296875, -0.485107421875, -0.3843994140625, -0.28369140625, -0.1829833984375, -0.082275390625, 0.0184326171875, 0.119140625, 0.2198486328125, 0.320556640625, 0.4212646484375, 0.52197265625, 0.6226806640625, 0.723388671875, 0.8240966796875, 0.9248046875, 1.0255126953125, 1.126220703125, 1.2269287109375, 1.32763671875, 1.4283447265625, 1.529052734375, 1.6297607421875, 1.73046875, 1.8311767578125, 1.931884765625, 2.0325927734375, 2.13330078125, 2.2340087890625, 2.334716796875, 2.4354248046875, 2.5361328125, 2.6368408203125, 2.737548828125, 2.8382568359375, 2.93896484375, 3.0396728515625, 3.140380859375, 3.2410888671875, 3.341796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 3.0, 4.0, 6.0, 11.0, 18.0, 11.0, 26.0, 44.0, 45.0, 80.0, 98.0, 164.0, 236.0, 365.0, 569.0, 861.0, 1458.0, 2434.0, 4129.0, 7065.0, 12946.0, 26462.0, 70406.0, 308530.0, 445927.0, 97991.0, 33174.0, 15307.0, 8190.0, 4717.0, 2774.0, 1626.0, 1023.0, 597.0, 409.0, 280.0, 171.0, 120.0, 77.0, 55.0, 51.0, 28.0, 26.0, 15.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.382965087890625, -3.24835205078125, -3.113739013671875, -2.9791259765625, -2.844512939453125, -2.70989990234375, -2.575286865234375, -2.440673828125, -2.306060791015625, -2.17144775390625, -2.036834716796875, -1.9022216796875, -1.767608642578125, -1.63299560546875, -1.498382568359375, -1.36376953125, -1.229156494140625, -1.09454345703125, -0.959930419921875, -0.8253173828125, -0.690704345703125, -0.55609130859375, -0.421478271484375, -0.286865234375, -0.152252197265625, -0.01763916015625, 0.116973876953125, 0.2515869140625, 0.386199951171875, 0.52081298828125, 0.655426025390625, 0.7900390625, 0.924652099609375, 1.05926513671875, 1.193878173828125, 1.3284912109375, 1.463104248046875, 1.59771728515625, 1.732330322265625, 1.866943359375, 2.001556396484375, 2.13616943359375, 2.270782470703125, 2.4053955078125, 2.540008544921875, 2.67462158203125, 2.809234619140625, 2.94384765625, 3.078460693359375, 3.21307373046875, 3.347686767578125, 3.4822998046875, 3.616912841796875, 3.75152587890625, 3.886138916015625, 4.020751953125, 4.155364990234375, 4.28997802734375, 4.424591064453125, 4.5592041015625, 4.693817138671875, 4.82843017578125, 4.963043212890625, 5.09765625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 3.0, 9.0, 7.0, 10.0, 9.0, 18.0, 24.0, 16.0, 18.0, 27.0, 34.0, 29.0, 38.0, 43.0, 42.0, 63.0, 90.0, 159.0, 1562.0, 282.0, 112.0, 69.0, 62.0, 51.0, 38.0, 37.0, 29.0, 29.0, 32.0, 22.0, 25.0, 11.0, 14.0, 8.0, 4.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.8792724609375, -11.492919921875, -11.1065673828125, -10.72021484375, -10.3338623046875, -9.947509765625, -9.5611572265625, -9.1748046875, -8.7884521484375, -8.402099609375, -8.0157470703125, -7.62939453125, -7.2430419921875, -6.856689453125, -6.4703369140625, -6.083984375, -5.6976318359375, -5.311279296875, -4.9249267578125, -4.53857421875, -4.1522216796875, -3.765869140625, -3.3795166015625, -2.9931640625, -2.6068115234375, -2.220458984375, -1.8341064453125, -1.44775390625, -1.0614013671875, -0.675048828125, -0.2886962890625, 0.09765625, 0.4840087890625, 0.870361328125, 1.2567138671875, 1.64306640625, 2.0294189453125, 2.415771484375, 2.8021240234375, 3.1884765625, 3.5748291015625, 3.961181640625, 4.3475341796875, 4.73388671875, 5.1202392578125, 5.506591796875, 5.8929443359375, 6.279296875, 6.6656494140625, 7.052001953125, 7.4383544921875, 7.82470703125, 8.2110595703125, 8.597412109375, 8.9837646484375, 9.3701171875, 9.7564697265625, 10.142822265625, 10.5291748046875, 10.91552734375, 11.3018798828125, 11.688232421875, 12.0745849609375, 12.4609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 12.0, 14.0, 16.0, 30.0, 33.0, 34.0, 54.0, 72.0, 125.0, 188.0, 316.0, 632.0, 2438.0, 25613.0, 2936493.0, 171123.0, 6297.0, 1072.0, 401.0, 208.0, 125.0, 97.0, 67.0, 45.0, 38.0, 26.0, 26.0, 20.0, 5.0, 18.0, 7.0, 12.0, 6.0, 5.0, 4.0, 4.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.32861328125, -22.5166015625, -21.70458984375, -20.892578125, -20.08056640625, -19.2685546875, -18.45654296875, -17.64453125, -16.83251953125, -16.0205078125, -15.20849609375, -14.396484375, -13.58447265625, -12.7724609375, -11.96044921875, -11.1484375, -10.33642578125, -9.5244140625, -8.71240234375, -7.900390625, -7.08837890625, -6.2763671875, -5.46435546875, -4.65234375, -3.84033203125, -3.0283203125, -2.21630859375, -1.404296875, -0.59228515625, 0.2197265625, 1.03173828125, 1.84375, 2.65576171875, 3.4677734375, 4.27978515625, 5.091796875, 5.90380859375, 6.7158203125, 7.52783203125, 8.33984375, 9.15185546875, 9.9638671875, 10.77587890625, 11.587890625, 12.39990234375, 13.2119140625, 14.02392578125, 14.8359375, 15.64794921875, 16.4599609375, 17.27197265625, 18.083984375, 18.89599609375, 19.7080078125, 20.52001953125, 21.33203125, 22.14404296875, 22.9560546875, 23.76806640625, 24.580078125, 25.39208984375, 26.2041015625, 27.01611328125, 27.828125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 9.0, 73.0, 231.0, 397.0, 245.0, 47.0, 11.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.897819519042969, -8.89847183227539, -6.8991241455078125, -4.899775981903076, -2.900428295135498, -0.9010801315307617, 1.0982675552368164, 3.0976152420043945, 5.096962928771973, 7.096310615539551, 9.095658302307129, 11.095006942749023, 13.094354629516602, 15.09370231628418, 17.093050003051758, 19.092397689819336, 21.091745376586914, 23.091093063354492, 25.09044075012207, 27.08978843688965, 29.089136123657227, 31.088485717773438, 33.087833404541016, 35.087181091308594, 37.08652877807617, 39.08587646484375, 41.08522415161133, 43.084571838378906, 45.083919525146484, 47.08326721191406, 49.08261489868164, 51.08196258544922, 53.0813102722168, 55.080657958984375, 57.08000564575195, 59.07935333251953, 61.07870101928711, 63.07804870605469, 65.07740020751953, 67.07674407958984, 69.07609558105469, 71.07544708251953, 73.07479095458984, 75.07414245605469, 77.073486328125, 79.07283782958984, 81.07218170166016, 83.071533203125, 85.07087707519531, 87.07022857666016, 89.06957244873047, 91.06892395019531, 93.06826782226562, 95.06761932373047, 97.06696319580078, 99.06631469726562, 101.06565856933594, 103.06501007080078, 105.0643539428711, 107.06370544433594, 109.06304931640625, 111.0624008178711, 113.0617446899414, 115.06109619140625, 117.06044006347656]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 10.0, 9.0, 6.0, 9.0, 12.0, 10.0, 13.0, 14.0, 16.0, 30.0, 20.0, 32.0, 26.0, 25.0, 34.0, 35.0, 28.0, 41.0, 25.0, 36.0, 34.0, 34.0, 47.0, 35.0, 41.0, 38.0, 41.0, 39.0, 29.0, 34.0, 29.0, 19.0, 19.0, 17.0, 14.0, 18.0, 21.0, 12.0, 8.0, 10.0, 7.0, 5.0, 5.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.471710205078125, -25.62822151184082, -24.784732818603516, -23.94124412536621, -23.097755432128906, -22.2542667388916, -21.410778045654297, -20.567291259765625, -19.723800659179688, -18.880311965942383, -18.036823272705078, -17.193334579467773, -16.34984588623047, -15.506357192993164, -14.662869453430176, -13.819380760192871, -12.975893020629883, -12.132404327392578, -11.288915634155273, -10.445426940917969, -9.601938247680664, -8.75844955444336, -7.914961814880371, -7.071473121643066, -6.227984428405762, -5.384495735168457, -4.541007041931152, -3.697518825531006, -2.854030132293701, -2.0105414390563965, -1.16705322265625, -0.3235645294189453, 0.5199241638183594, 1.3634127378463745, 2.2069013118743896, 3.0503897666931152, 3.89387845993042, 4.737367153167725, 5.580855369567871, 6.424344062805176, 7.2678327560424805, 8.111321449279785, 8.95481014251709, 9.798297882080078, 10.641786575317383, 11.485275268554688, 12.328763961791992, 13.172252655029297, 14.015741348266602, 14.859230041503906, 15.702718734741211, 16.546207427978516, 17.38969612121582, 18.233184814453125, 19.076671600341797, 19.920162200927734, 20.763648986816406, 21.60713768005371, 22.450626373291016, 23.29411506652832, 24.137603759765625, 24.98109245300293, 25.824581146240234, 26.668067932128906, 27.511558532714844]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 3.0, 5.0, 8.0, 7.0, 9.0, 6.0, 16.0, 11.0, 23.0, 22.0, 22.0, 26.0, 25.0, 19.0, 36.0, 44.0, 27.0, 39.0, 36.0, 39.0, 38.0, 51.0, 47.0, 39.0, 49.0, 38.0, 33.0, 34.0, 37.0, 34.0, 22.0, 22.0, 20.0, 12.0, 17.0, 15.0, 21.0, 5.0, 5.0, 7.0, 5.0, 5.0, 9.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.24951171875, -3.1455078125, -3.04150390625, -2.9375, -2.83349609375, -2.7294921875, -2.62548828125, -2.521484375, -2.41748046875, -2.3134765625, -2.20947265625, -2.10546875, -2.00146484375, -1.8974609375, -1.79345703125, -1.689453125, -1.58544921875, -1.4814453125, -1.37744140625, -1.2734375, -1.16943359375, -1.0654296875, -0.96142578125, -0.857421875, -0.75341796875, -0.6494140625, -0.54541015625, -0.44140625, -0.33740234375, -0.2333984375, -0.12939453125, -0.025390625, 0.07861328125, 0.1826171875, 0.28662109375, 0.390625, 0.49462890625, 0.5986328125, 0.70263671875, 0.806640625, 0.91064453125, 1.0146484375, 1.11865234375, 1.22265625, 1.32666015625, 1.4306640625, 1.53466796875, 1.638671875, 1.74267578125, 1.8466796875, 1.95068359375, 2.0546875, 2.15869140625, 2.2626953125, 2.36669921875, 2.470703125, 2.57470703125, 2.6787109375, 2.78271484375, 2.88671875, 2.99072265625, 3.0947265625, 3.19873046875, 3.302734375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 7.0, 8.0, 10.0, 8.0, 11.0, 16.0, 12.0, 16.0, 27.0, 26.0, 26.0, 42.0, 62.0, 88.0, 164.0, 383.0, 1023.0, 3410.0, 14436.0, 93929.0, 1304520.0, 2554909.0, 188205.0, 24744.0, 5437.0, 1563.0, 517.0, 230.0, 129.0, 78.0, 51.0, 31.0, 36.0, 32.0, 19.0, 17.0, 14.0, 11.0, 6.0, 10.0, 2.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.9140625, -12.512451171875, -12.11083984375, -11.709228515625, -11.3076171875, -10.906005859375, -10.50439453125, -10.102783203125, -9.701171875, -9.299560546875, -8.89794921875, -8.496337890625, -8.0947265625, -7.693115234375, -7.29150390625, -6.889892578125, -6.48828125, -6.086669921875, -5.68505859375, -5.283447265625, -4.8818359375, -4.480224609375, -4.07861328125, -3.677001953125, -3.275390625, -2.873779296875, -2.47216796875, -2.070556640625, -1.6689453125, -1.267333984375, -0.86572265625, -0.464111328125, -0.0625, 0.339111328125, 0.74072265625, 1.142333984375, 1.5439453125, 1.945556640625, 2.34716796875, 2.748779296875, 3.150390625, 3.552001953125, 3.95361328125, 4.355224609375, 4.7568359375, 5.158447265625, 5.56005859375, 5.961669921875, 6.36328125, 6.764892578125, 7.16650390625, 7.568115234375, 7.9697265625, 8.371337890625, 8.77294921875, 9.174560546875, 9.576171875, 9.977783203125, 10.37939453125, 10.781005859375, 11.1826171875, 11.584228515625, 11.98583984375, 12.387451171875, 12.7890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 2.0, 5.0, 13.0, 19.0, 28.0, 43.0, 73.0, 102.0, 148.0, 238.0, 393.0, 538.0, 681.0, 613.0, 435.0, 280.0, 161.0, 111.0, 65.0, 48.0, 35.0, 10.0, 7.0, 9.0, 3.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.515625, -16.0877685546875, -15.659912109375, -15.2320556640625, -14.80419921875, -14.3763427734375, -13.948486328125, -13.5206298828125, -13.0927734375, -12.6649169921875, -12.237060546875, -11.8092041015625, -11.38134765625, -10.9534912109375, -10.525634765625, -10.0977783203125, -9.669921875, -9.2420654296875, -8.814208984375, -8.3863525390625, -7.95849609375, -7.5306396484375, -7.102783203125, -6.6749267578125, -6.2470703125, -5.8192138671875, -5.391357421875, -4.9635009765625, -4.53564453125, -4.1077880859375, -3.679931640625, -3.2520751953125, -2.82421875, -2.3963623046875, -1.968505859375, -1.5406494140625, -1.11279296875, -0.6849365234375, -0.257080078125, 0.1707763671875, 0.5986328125, 1.0264892578125, 1.454345703125, 1.8822021484375, 2.31005859375, 2.7379150390625, 3.165771484375, 3.5936279296875, 4.021484375, 4.4493408203125, 4.877197265625, 5.3050537109375, 5.73291015625, 6.1607666015625, 6.588623046875, 7.0164794921875, 7.4443359375, 7.8721923828125, 8.300048828125, 8.7279052734375, 9.15576171875, 9.5836181640625, 10.011474609375, 10.4393310546875, 10.8671875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 8.0, 18.0, 36.0, 64.0, 81.0, 160.0, 281.0, 666.0, 2285.0, 24112.0, 1833337.0, 2300891.0, 28511.0, 2383.0, 710.0, 315.0, 171.0, 88.0, 53.0, 33.0, 26.0, 13.0, 5.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.125, -28.005859375, -26.88671875, -25.767578125, -24.6484375, -23.529296875, -22.41015625, -21.291015625, -20.171875, -19.052734375, -17.93359375, -16.814453125, -15.6953125, -14.576171875, -13.45703125, -12.337890625, -11.21875, -10.099609375, -8.98046875, -7.861328125, -6.7421875, -5.623046875, -4.50390625, -3.384765625, -2.265625, -1.146484375, -0.02734375, 1.091796875, 2.2109375, 3.330078125, 4.44921875, 5.568359375, 6.6875, 7.806640625, 8.92578125, 10.044921875, 11.1640625, 12.283203125, 13.40234375, 14.521484375, 15.640625, 16.759765625, 17.87890625, 18.998046875, 20.1171875, 21.236328125, 22.35546875, 23.474609375, 24.59375, 25.712890625, 26.83203125, 27.951171875, 29.0703125, 30.189453125, 31.30859375, 32.427734375, 33.546875, 34.666015625, 35.78515625, 36.904296875, 38.0234375, 39.142578125, 40.26171875, 41.380859375, 42.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 14.0, 12.0, 26.0, 32.0, 55.0, 66.0, 69.0, 88.0, 96.0, 121.0, 102.0, 111.0, 59.0, 45.0, 35.0, 19.0, 22.0, 11.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.02934646606445, -49.54859161376953, -48.06783676147461, -46.58708190917969, -45.1063232421875, -43.62556838989258, -42.144813537597656, -40.664058685302734, -39.18330383300781, -37.70254898071289, -36.22179412841797, -34.74103546142578, -33.26028060913086, -31.779525756835938, -30.298770904541016, -28.818016052246094, -27.33725929260254, -25.856504440307617, -24.375747680664062, -22.89499282836914, -21.41423797607422, -19.933483123779297, -18.452726364135742, -16.97197151184082, -15.491215705871582, -14.010459899902344, -12.529705047607422, -11.048949241638184, -9.568193435668945, -8.087438583374023, -6.606682777404785, -5.125927925109863, -3.645172119140625, -2.164416790008545, -0.6836612224578857, 0.7970943450927734, 2.2778496742248535, 3.7586050033569336, 5.239360809326172, 6.720115661621094, 8.200871467590332, 9.68162727355957, 11.162382125854492, 12.64313793182373, 14.123893737792969, 15.60464859008789, 17.085403442382812, 18.566158294677734, 20.04691505432129, 21.52766990661621, 23.008426666259766, 24.489181518554688, 25.96993637084961, 27.45069122314453, 28.931447982788086, 30.412202835083008, 31.892959594726562, 33.373714447021484, 34.854469299316406, 36.335227966308594, 37.815982818603516, 39.29673767089844, 40.77749252319336, 42.25824737548828, 43.7390022277832]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 5.0, 10.0, 7.0, 8.0, 13.0, 12.0, 14.0, 18.0, 24.0, 20.0, 30.0, 29.0, 26.0, 27.0, 27.0, 36.0, 36.0, 46.0, 42.0, 46.0, 39.0, 39.0, 45.0, 39.0, 30.0, 26.0, 37.0, 39.0, 29.0, 27.0, 27.0, 14.0, 17.0, 15.0, 21.0, 12.0, 9.0, 16.0, 9.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-29.0323486328125, -28.081628799438477, -27.130910873413086, -26.180191040039062, -25.229473114013672, -24.27875328063965, -23.328035354614258, -22.377315521240234, -21.426597595214844, -20.47587776184082, -19.52515983581543, -18.574440002441406, -17.623722076416016, -16.673002243041992, -15.722284317016602, -14.771564483642578, -13.820845603942871, -12.870126724243164, -11.919407844543457, -10.96868896484375, -10.017970085144043, -9.067251205444336, -8.116531372070312, -7.165812969207764, -6.215094089508057, -5.26437520980835, -4.313656330108643, -3.3629372119903564, -2.4122183322906494, -1.4614992141723633, -0.5107803344726562, 0.4399385452270508, 1.3906574249267578, 2.341376304626465, 3.292095184326172, 4.242814064025879, 5.193532943725586, 6.144252300262451, 7.094971179962158, 8.045690536499023, 8.996408462524414, 9.947127342224121, 10.897846221923828, 11.848565101623535, 12.799283981323242, 13.750003814697266, 14.700721740722656, 15.65144157409668, 16.602161407470703, 17.552881240844727, 18.503599166870117, 19.45431900024414, 20.40503692626953, 21.355756759643555, 22.306474685668945, 23.25719451904297, 24.20791244506836, 25.158632278442383, 26.109350204467773, 27.060070037841797, 28.010787963867188, 28.96150779724121, 29.9122257232666, 30.862945556640625, 31.813663482666016]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 8.0, 8.0, 7.0, 10.0, 4.0, 12.0, 16.0, 20.0, 24.0, 22.0, 20.0, 30.0, 31.0, 25.0, 33.0, 36.0, 37.0, 35.0, 54.0, 28.0, 52.0, 36.0, 43.0, 45.0, 26.0, 35.0, 37.0, 27.0, 36.0, 28.0, 27.0, 30.0, 15.0, 15.0, 15.0, 10.0, 9.0, 8.0, 11.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.4765625, -3.372222900390625, -3.26788330078125, -3.163543701171875, -3.0592041015625, -2.954864501953125, -2.85052490234375, -2.746185302734375, -2.641845703125, -2.537506103515625, -2.43316650390625, -2.328826904296875, -2.2244873046875, -2.120147705078125, -2.01580810546875, -1.911468505859375, -1.80712890625, -1.702789306640625, -1.59844970703125, -1.494110107421875, -1.3897705078125, -1.285430908203125, -1.18109130859375, -1.076751708984375, -0.972412109375, -0.868072509765625, -0.76373291015625, -0.659393310546875, -0.5550537109375, -0.450714111328125, -0.34637451171875, -0.242034912109375, -0.1376953125, -0.033355712890625, 0.07098388671875, 0.175323486328125, 0.2796630859375, 0.384002685546875, 0.48834228515625, 0.592681884765625, 0.697021484375, 0.801361083984375, 0.90570068359375, 1.010040283203125, 1.1143798828125, 1.218719482421875, 1.32305908203125, 1.427398681640625, 1.53173828125, 1.636077880859375, 1.74041748046875, 1.844757080078125, 1.9490966796875, 2.053436279296875, 2.15777587890625, 2.262115478515625, 2.366455078125, 2.470794677734375, 2.57513427734375, 2.679473876953125, 2.7838134765625, 2.888153076171875, 2.99249267578125, 3.096832275390625, 3.201171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 13.0, 24.0, 31.0, 55.0, 79.0, 140.0, 173.0, 303.0, 442.0, 638.0, 870.0, 1238.0, 1874.0, 2851.0, 4189.0, 6059.0, 8811.0, 12751.0, 18988.0, 27255.0, 39222.0, 56953.0, 80299.0, 109375.0, 138696.0, 142973.0, 114567.0, 85108.0, 59971.0, 42067.0, 29005.0, 20235.0, 13835.0, 9402.0, 6366.0, 4291.0, 3002.0, 2041.0, 1378.0, 998.0, 671.0, 433.0, 300.0, 204.0, 128.0, 81.0, 56.0, 40.0, 20.0, 18.0, 14.0, 10.0, 4.0, 3.0, 3.0], "bins": [-0.5009765625, -0.4862785339355469, -0.47158050537109375, -0.4568824768066406, -0.4421844482421875, -0.4274864196777344, -0.41278839111328125, -0.3980903625488281, -0.383392333984375, -0.3686943054199219, -0.35399627685546875, -0.3392982482910156, -0.3246002197265625, -0.3099021911621094, -0.29520416259765625, -0.2805061340332031, -0.26580810546875, -0.2511100769042969, -0.23641204833984375, -0.22171401977539062, -0.2070159912109375, -0.19231796264648438, -0.17761993408203125, -0.16292190551757812, -0.148223876953125, -0.13352584838867188, -0.11882781982421875, -0.10412979125976562, -0.0894317626953125, -0.07473373413085938, -0.06003570556640625, -0.045337677001953125, -0.0306396484375, -0.015941619873046875, -0.00124359130859375, 0.013454437255859375, 0.0281524658203125, 0.042850494384765625, 0.05754852294921875, 0.07224655151367188, 0.086944580078125, 0.10164260864257812, 0.11634063720703125, 0.13103866577148438, 0.1457366943359375, 0.16043472290039062, 0.17513275146484375, 0.18983078002929688, 0.20452880859375, 0.21922683715820312, 0.23392486572265625, 0.24862289428710938, 0.2633209228515625, 0.2780189514160156, 0.29271697998046875, 0.3074150085449219, 0.322113037109375, 0.3368110656738281, 0.35150909423828125, 0.3662071228027344, 0.3809051513671875, 0.3956031799316406, 0.41030120849609375, 0.4249992370605469, 0.439697265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 11.0, 12.0, 11.0, 11.0, 10.0, 7.0, 14.0, 22.0, 20.0, 28.0, 19.0, 29.0, 34.0, 25.0, 37.0, 32.0, 27.0, 34.0, 28.0, 28.0, 38.0, 1061.0, 35.0, 37.0, 30.0, 29.0, 41.0, 29.0, 29.0, 28.0, 28.0, 18.0, 22.0, 21.0, 19.0, 16.0, 14.0, 11.0, 11.0, 10.0, 6.0, 11.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.029296875, -1.9670867919921875, -1.904876708984375, -1.8426666259765625, -1.78045654296875, -1.7182464599609375, -1.656036376953125, -1.5938262939453125, -1.5316162109375, -1.4694061279296875, -1.407196044921875, -1.3449859619140625, -1.28277587890625, -1.2205657958984375, -1.158355712890625, -1.0961456298828125, -1.033935546875, -0.9717254638671875, -0.909515380859375, -0.8473052978515625, -0.78509521484375, -0.7228851318359375, -0.660675048828125, -0.5984649658203125, -0.5362548828125, -0.4740447998046875, -0.411834716796875, -0.3496246337890625, -0.28741455078125, -0.2252044677734375, -0.162994384765625, -0.1007843017578125, -0.03857421875, 0.0236358642578125, 0.085845947265625, 0.1480560302734375, 0.21026611328125, 0.2724761962890625, 0.334686279296875, 0.3968963623046875, 0.4591064453125, 0.5213165283203125, 0.583526611328125, 0.6457366943359375, 0.70794677734375, 0.7701568603515625, 0.832366943359375, 0.8945770263671875, 0.956787109375, 1.0189971923828125, 1.081207275390625, 1.1434173583984375, 1.20562744140625, 1.2678375244140625, 1.330047607421875, 1.3922576904296875, 1.4544677734375, 1.5166778564453125, 1.578887939453125, 1.6410980224609375, 1.70330810546875, 1.7655181884765625, 1.827728271484375, 1.8899383544921875, 1.9521484375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 11.0, 26.0, 29.0, 47.0, 72.0, 98.0, 138.0, 218.0, 334.0, 444.0, 703.0, 1013.0, 1639.0, 2380.0, 3700.0, 5586.0, 8408.0, 13222.0, 19976.0, 30263.0, 45343.0, 66834.0, 95414.0, 127034.0, 1193546.0, 137593.0, 108255.0, 77417.0, 53623.0, 35907.0, 23374.0, 15326.0, 9860.0, 6609.0, 4216.0, 2816.0, 1794.0, 1261.0, 883.0, 554.0, 358.0, 269.0, 192.0, 112.0, 74.0, 51.0, 46.0, 29.0, 17.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.2802734375, -0.2717018127441406, -0.26313018798828125, -0.2545585632324219, -0.2459869384765625, -0.23741531372070312, -0.22884368896484375, -0.22027206420898438, -0.211700439453125, -0.20312881469726562, -0.19455718994140625, -0.18598556518554688, -0.1774139404296875, -0.16884231567382812, -0.16027069091796875, -0.15169906616210938, -0.14312744140625, -0.13455581665039062, -0.12598419189453125, -0.11741256713867188, -0.1088409423828125, -0.10026931762695312, -0.09169769287109375, -0.08312606811523438, -0.074554443359375, -0.06598281860351562, -0.05741119384765625, -0.048839569091796875, -0.0402679443359375, -0.031696319580078125, -0.02312469482421875, -0.014553070068359375, -0.0059814453125, 0.002590179443359375, 0.01116180419921875, 0.019733428955078125, 0.0283050537109375, 0.036876678466796875, 0.04544830322265625, 0.054019927978515625, 0.062591552734375, 0.07116317749023438, 0.07973480224609375, 0.08830642700195312, 0.0968780517578125, 0.10544967651367188, 0.11402130126953125, 0.12259292602539062, 0.13116455078125, 0.13973617553710938, 0.14830780029296875, 0.15687942504882812, 0.1654510498046875, 0.17402267456054688, 0.18259429931640625, 0.19116592407226562, 0.199737548828125, 0.20830917358398438, 0.21688079833984375, 0.22545242309570312, 0.2340240478515625, 0.24259567260742188, 0.25116729736328125, 0.2597389221191406, 0.268310546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 10.0, 6.0, 9.0, 9.0, 22.0, 28.0, 31.0, 47.0, 77.0, 147.0, 202.0, 137.0, 73.0, 36.0, 31.0, 23.0, 18.0, 14.0, 11.0, 8.0, 8.0, 8.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006473541259765625, -0.006228506565093994, -0.005983471870422363, -0.005738437175750732, -0.0054934024810791016, -0.005248367786407471, -0.00500333309173584, -0.004758298397064209, -0.004513263702392578, -0.004268229007720947, -0.004023194313049316, -0.0037781596183776855, -0.0035331249237060547, -0.003288090229034424, -0.003043055534362793, -0.002798020839691162, -0.0025529861450195312, -0.0023079514503479004, -0.0020629167556762695, -0.0018178820610046387, -0.0015728473663330078, -0.001327812671661377, -0.001082777976989746, -0.0008377432823181152, -0.0005927085876464844, -0.0003476738929748535, -0.00010263919830322266, 0.0001423954963684082, 0.00038743019104003906, 0.0006324648857116699, 0.0008774995803833008, 0.0011225342750549316, 0.0013675689697265625, 0.0016126036643981934, 0.0018576383590698242, 0.002102673053741455, 0.002347707748413086, 0.002592742443084717, 0.0028377771377563477, 0.0030828118324279785, 0.0033278465270996094, 0.0035728812217712402, 0.003817915916442871, 0.004062950611114502, 0.004307985305786133, 0.004553020000457764, 0.0047980546951293945, 0.005043089389801025, 0.005288124084472656, 0.005533158779144287, 0.005778193473815918, 0.006023228168487549, 0.00626826286315918, 0.0065132975578308105, 0.006758332252502441, 0.007003366947174072, 0.007248401641845703, 0.007493436336517334, 0.007738471031188965, 0.007983505725860596, 0.008228540420532227, 0.008473575115203857, 0.008718609809875488, 0.00896364450454712, 0.00920867919921875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 9.0, 8.0, 10.0, 20.0, 30.0, 35.0, 51.0, 97.0, 197.0, 428.0, 1385.0, 5529.0, 96567.0, 923368.0, 16741.0, 2649.0, 773.0, 286.0, 126.0, 76.0, 39.0, 24.0, 18.0, 6.0, 12.0, 7.0, 9.0, 7.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12772464752197266, -0.12410163879394531, -0.12047863006591797, -0.11685562133789062, -0.11323261260986328, -0.10960960388183594, -0.1059865951538086, -0.10236358642578125, -0.0987405776977539, -0.09511756896972656, -0.09149456024169922, -0.08787155151367188, -0.08424854278564453, -0.08062553405761719, -0.07700252532958984, -0.0733795166015625, -0.06975650787353516, -0.06613349914550781, -0.06251049041748047, -0.058887481689453125, -0.05526447296142578, -0.05164146423339844, -0.048018455505371094, -0.04439544677734375, -0.040772438049316406, -0.03714942932128906, -0.03352642059326172, -0.029903411865234375, -0.02628040313720703, -0.022657394409179688, -0.019034385681152344, -0.015411376953125, -0.011788368225097656, -0.008165359497070312, -0.004542350769042969, -0.000919342041015625, 0.0027036666870117188, 0.0063266754150390625, 0.009949684143066406, 0.01357269287109375, 0.017195701599121094, 0.020818710327148438, 0.02444171905517578, 0.028064727783203125, 0.03168773651123047, 0.03531074523925781, 0.038933753967285156, 0.0425567626953125, 0.046179771423339844, 0.04980278015136719, 0.05342578887939453, 0.057048797607421875, 0.06067180633544922, 0.06429481506347656, 0.0679178237915039, 0.07154083251953125, 0.0751638412475586, 0.07878684997558594, 0.08240985870361328, 0.08603286743164062, 0.08965587615966797, 0.09327888488769531, 0.09690189361572266, 0.10052490234375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 18.0, 39.0, 58.0, 143.0, 235.0, 249.0, 126.0, 61.0, 25.0, 22.0, 9.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.039618588984012604, -0.038856588304042816, -0.03809459134936333, -0.03733259066939354, -0.03657058998942375, -0.03580859303474426, -0.035046592354774475, -0.03428459167480469, -0.0335225909948349, -0.03276059031486511, -0.03199859336018562, -0.031236592680215836, -0.030474592000246048, -0.02971259318292141, -0.02895059436559677, -0.028188593685626984, -0.027426596730947495, -0.026664597913622856, -0.02590259723365307, -0.02514059841632843, -0.024378597736358643, -0.023616598919034004, -0.022854600101709366, -0.022092599421739578, -0.02133060060441494, -0.0205686017870903, -0.019806601107120514, -0.019044602289795876, -0.018282603472471237, -0.01752060279250145, -0.01675860397517681, -0.015996605157852173, -0.015234602615237236, -0.014472602866590023, -0.01371060311794281, -0.012948604300618172, -0.012186604551970959, -0.011424604803323746, -0.010662605985999107, -0.009900606237351894, -0.009138606488704681, -0.008376606740057468, -0.007614607457071543, -0.006852608174085617, -0.006090608425438404, -0.005328608676791191, -0.004566609393805265, -0.0038046101108193398, -0.0030426103621721268, -0.0022806108463555574, -0.0015186113305389881, -0.0007566118147224188, 5.387701094150543e-06, 0.0007673872169107199, 0.0015293867327272892, 0.002291386015713215, 0.003053385764360428, 0.003815385280176997, 0.0045773847959935665, 0.005339384078979492, 0.006101383827626705, 0.006863383576273918, 0.007625382859259844, 0.00838738214224577, 0.009149381890892982]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 7.0, 5.0, 5.0, 4.0, 6.0, 8.0, 8.0, 7.0, 13.0, 19.0, 25.0, 19.0, 27.0, 21.0, 21.0, 26.0, 31.0, 33.0, 31.0, 51.0, 44.0, 37.0, 35.0, 35.0, 31.0, 44.0, 36.0, 42.0, 30.0, 37.0, 33.0, 23.0, 25.0, 38.0, 17.0, 18.0, 22.0, 18.0, 14.0, 15.0, 4.0, 11.0, 5.0, 6.0, 3.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0], "bins": [-0.003855407238006592, -0.0037495968863368034, -0.003643786534667015, -0.0035379761829972267, -0.0034321658313274384, -0.00332635547965765, -0.0032205451279878616, -0.0031147347763180733, -0.003008924424648285, -0.0029031140729784966, -0.002797303721308708, -0.00269149336963892, -0.0025856830179691315, -0.002479872666299343, -0.0023740623146295547, -0.0022682519629597664, -0.002162441611289978, -0.0020566312596201897, -0.0019508209079504013, -0.001845010556280613, -0.0017392002046108246, -0.0016333898529410362, -0.0015275795012712479, -0.0014217691496014595, -0.0013159587979316711, -0.0012101484462618828, -0.0011043380945920944, -0.000998527742922306, -0.0008927173912525177, -0.0007869070395827293, -0.000681096687912941, -0.0005752863362431526, -0.00046947598457336426, -0.0003636656329035759, -0.00025785528123378754, -0.00015204492956399918, -4.6234577894210815e-05, 5.9575773775577545e-05, 0.0001653861254453659, 0.00027119647711515427, 0.0003770068287849426, 0.000482817180454731, 0.0005886275321245193, 0.0006944378837943077, 0.0008002482354640961, 0.0009060585871338844, 0.0010118689388036728, 0.0011176792904734612, 0.0012234896421432495, 0.0013292999938130379, 0.0014351103454828262, 0.0015409206971526146, 0.001646731048822403, 0.0017525414004921913, 0.0018583517521619797, 0.001964162103831768, 0.0020699724555015564, 0.0021757828071713448, 0.002281593158841133, 0.0023874035105109215, 0.00249321386218071, 0.002599024213850498, 0.0027048345655202866, 0.002810644917190075, 0.0029164552688598633]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 5.0, 8.0, 8.0, 8.0, 9.0, 4.0, 12.0, 16.0, 20.0, 24.0, 22.0, 20.0, 30.0, 30.0, 26.0, 33.0, 36.0, 37.0, 35.0, 55.0, 27.0, 52.0, 36.0, 43.0, 44.0, 27.0, 35.0, 37.0, 27.0, 37.0, 27.0, 27.0, 30.0, 15.0, 15.0, 15.0, 10.0, 9.0, 8.0, 11.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.4765625, -3.372222900390625, -3.26788330078125, -3.163543701171875, -3.0592041015625, -2.954864501953125, -2.85052490234375, -2.746185302734375, -2.641845703125, -2.537506103515625, -2.43316650390625, -2.328826904296875, -2.2244873046875, -2.120147705078125, -2.01580810546875, -1.911468505859375, -1.80712890625, -1.702789306640625, -1.59844970703125, -1.494110107421875, -1.3897705078125, -1.285430908203125, -1.18109130859375, -1.076751708984375, -0.972412109375, -0.868072509765625, -0.76373291015625, -0.659393310546875, -0.5550537109375, -0.450714111328125, -0.34637451171875, -0.242034912109375, -0.1376953125, -0.033355712890625, 0.07098388671875, 0.175323486328125, 0.2796630859375, 0.384002685546875, 0.48834228515625, 0.592681884765625, 0.697021484375, 0.801361083984375, 0.90570068359375, 1.010040283203125, 1.1143798828125, 1.218719482421875, 1.32305908203125, 1.427398681640625, 1.53173828125, 1.636077880859375, 1.74041748046875, 1.844757080078125, 1.9490966796875, 2.053436279296875, 2.15777587890625, 2.262115478515625, 2.366455078125, 2.470794677734375, 2.57513427734375, 2.679473876953125, 2.7838134765625, 2.888153076171875, 2.99249267578125, 3.096832275390625, 3.201171875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 11.0, 11.0, 11.0, 26.0, 32.0, 41.0, 80.0, 126.0, 185.0, 311.0, 506.0, 887.0, 1502.0, 2696.0, 4730.0, 8265.0, 14471.0, 26224.0, 48138.0, 99825.0, 269949.0, 326563.0, 120559.0, 55628.0, 29361.0, 16349.0, 9364.0, 5377.0, 3054.0, 1736.0, 1043.0, 563.0, 371.0, 221.0, 129.0, 88.0, 50.0, 20.0, 19.0, 14.0, 10.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.94140625, -2.84979248046875, -2.7581787109375, -2.66656494140625, -2.574951171875, -2.48333740234375, -2.3917236328125, -2.30010986328125, -2.20849609375, -2.11688232421875, -2.0252685546875, -1.93365478515625, -1.842041015625, -1.75042724609375, -1.6588134765625, -1.56719970703125, -1.4755859375, -1.38397216796875, -1.2923583984375, -1.20074462890625, -1.109130859375, -1.01751708984375, -0.9259033203125, -0.83428955078125, -0.74267578125, -0.65106201171875, -0.5594482421875, -0.46783447265625, -0.376220703125, -0.28460693359375, -0.1929931640625, -0.10137939453125, -0.009765625, 0.08184814453125, 0.1734619140625, 0.26507568359375, 0.356689453125, 0.44830322265625, 0.5399169921875, 0.63153076171875, 0.72314453125, 0.81475830078125, 0.9063720703125, 0.99798583984375, 1.089599609375, 1.18121337890625, 1.2728271484375, 1.36444091796875, 1.4560546875, 1.54766845703125, 1.6392822265625, 1.73089599609375, 1.822509765625, 1.91412353515625, 2.0057373046875, 2.09735107421875, 2.18896484375, 2.28057861328125, 2.3721923828125, 2.46380615234375, 2.555419921875, 2.64703369140625, 2.7386474609375, 2.83026123046875, 2.921875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 1.0, 2.0, 5.0, 8.0, 11.0, 11.0, 14.0, 20.0, 21.0, 23.0, 33.0, 32.0, 42.0, 45.0, 56.0, 60.0, 93.0, 145.0, 1472.0, 376.0, 118.0, 70.0, 68.0, 62.0, 46.0, 34.0, 30.0, 31.0, 27.0, 24.0, 16.0, 11.0, 13.0, 8.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.453125, -15.99462890625, -15.5361328125, -15.07763671875, -14.619140625, -14.16064453125, -13.7021484375, -13.24365234375, -12.78515625, -12.32666015625, -11.8681640625, -11.40966796875, -10.951171875, -10.49267578125, -10.0341796875, -9.57568359375, -9.1171875, -8.65869140625, -8.2001953125, -7.74169921875, -7.283203125, -6.82470703125, -6.3662109375, -5.90771484375, -5.44921875, -4.99072265625, -4.5322265625, -4.07373046875, -3.615234375, -3.15673828125, -2.6982421875, -2.23974609375, -1.78125, -1.32275390625, -0.8642578125, -0.40576171875, 0.052734375, 0.51123046875, 0.9697265625, 1.42822265625, 1.88671875, 2.34521484375, 2.8037109375, 3.26220703125, 3.720703125, 4.17919921875, 4.6376953125, 5.09619140625, 5.5546875, 6.01318359375, 6.4716796875, 6.93017578125, 7.388671875, 7.84716796875, 8.3056640625, 8.76416015625, 9.22265625, 9.68115234375, 10.1396484375, 10.59814453125, 11.056640625, 11.51513671875, 11.9736328125, 12.43212890625, 12.890625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 15.0, 33.0, 33.0, 58.0, 86.0, 146.0, 230.0, 559.0, 2300.0, 221779.0, 2913845.0, 5093.0, 724.0, 304.0, 165.0, 113.0, 71.0, 46.0, 27.0, 14.0, 11.0, 5.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.36669921875, -34.9208984375, -33.47509765625, -32.029296875, -30.58349609375, -29.1376953125, -27.69189453125, -26.24609375, -24.80029296875, -23.3544921875, -21.90869140625, -20.462890625, -19.01708984375, -17.5712890625, -16.12548828125, -14.6796875, -13.23388671875, -11.7880859375, -10.34228515625, -8.896484375, -7.45068359375, -6.0048828125, -4.55908203125, -3.11328125, -1.66748046875, -0.2216796875, 1.22412109375, 2.669921875, 4.11572265625, 5.5615234375, 7.00732421875, 8.453125, 9.89892578125, 11.3447265625, 12.79052734375, 14.236328125, 15.68212890625, 17.1279296875, 18.57373046875, 20.01953125, 21.46533203125, 22.9111328125, 24.35693359375, 25.802734375, 27.24853515625, 28.6943359375, 30.14013671875, 31.5859375, 33.03173828125, 34.4775390625, 35.92333984375, 37.369140625, 38.81494140625, 40.2607421875, 41.70654296875, 43.15234375, 44.59814453125, 46.0439453125, 47.48974609375, 48.935546875, 50.38134765625, 51.8271484375, 53.27294921875, 54.71875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 16.0, 23.0, 50.0, 75.0, 117.0, 123.0, 137.0, 135.0, 117.0, 95.0, 58.0, 30.0, 13.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.66596031188965, -25.77388572692871, -24.881811141967773, -23.989736557006836, -23.0976619720459, -22.20558738708496, -21.313512802124023, -20.421438217163086, -19.52936363220215, -18.63728904724121, -17.745214462280273, -16.853139877319336, -15.961065292358398, -15.068990707397461, -14.176916122436523, -13.284841537475586, -12.392767906188965, -11.500693321228027, -10.60861873626709, -9.716544151306152, -8.824469566345215, -7.9323954582214355, -7.040320873260498, -6.1482462882995605, -5.256171703338623, -4.3640971183776855, -3.472022533416748, -2.5799481868743896, -1.6878736019134521, -0.7957992553710938, 0.09627532958984375, 0.9883499145507812, 1.8804244995117188, 2.7724990844726562, 3.6645736694335938, 4.556648254394531, 5.448722839355469, 6.340796947479248, 7.2328715324401855, 8.124946594238281, 9.017021179199219, 9.909095764160156, 10.801170349121094, 11.693244934082031, 12.585319519042969, 13.477394104003906, 14.369468688964844, 15.261543273925781, 16.15361785888672, 17.045692443847656, 17.937767028808594, 18.82984161376953, 19.72191619873047, 20.613990783691406, 21.506065368652344, 22.39813995361328, 23.290212631225586, 24.182287216186523, 25.07436180114746, 25.9664363861084, 26.858510971069336, 27.750585556030273, 28.64266014099121, 29.53473472595215, 30.426809310913086]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 11.0, 23.0, 22.0, 25.0, 27.0, 27.0, 24.0, 24.0, 31.0, 38.0, 55.0, 44.0, 51.0, 48.0, 52.0, 44.0, 53.0, 41.0, 38.0, 35.0, 51.0, 21.0, 27.0, 28.0, 27.0, 23.0, 22.0, 16.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.16105651855469, -30.962444305419922, -29.763832092285156, -28.56521987915039, -27.366607666015625, -26.16799545288086, -24.969383239746094, -23.770771026611328, -22.572158813476562, -21.373546600341797, -20.17493438720703, -18.976322174072266, -17.7777099609375, -16.579097747802734, -15.380486488342285, -14.18187427520752, -12.98326301574707, -11.784650802612305, -10.586038589477539, -9.387426376342773, -8.188814163208008, -6.9902024269104, -5.791590690612793, -4.592978477478027, -3.3943662643432617, -2.195754051208496, -0.9971420764923096, 0.20146989822387695, 1.4000821113586426, 2.598694324493408, 3.7973060607910156, 4.995918273925781, 6.194530487060547, 7.3931427001953125, 8.591754913330078, 9.790367126464844, 10.98897933959961, 12.187591552734375, 13.386202812194824, 14.58481502532959, 15.783427238464355, 16.982038497924805, 18.18065071105957, 19.379262924194336, 20.5778751373291, 21.776487350463867, 22.975099563598633, 24.1737117767334, 25.372323989868164, 26.57093620300293, 27.769548416137695, 28.96816062927246, 30.166772842407227, 31.365385055541992, 32.563995361328125, 33.76260757446289, 34.961219787597656, 36.15983200073242, 37.35844421386719, 38.55705642700195, 39.75566864013672, 40.954280853271484, 42.15289306640625, 43.351505279541016, 44.55011749267578]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 3.0, 7.0, 6.0, 6.0, 10.0, 9.0, 8.0, 8.0, 14.0, 23.0, 21.0, 24.0, 32.0, 23.0, 23.0, 20.0, 30.0, 30.0, 37.0, 45.0, 39.0, 36.0, 38.0, 47.0, 37.0, 39.0, 46.0, 27.0, 37.0, 36.0, 31.0, 28.0, 22.0, 23.0, 23.0, 29.0, 17.0, 11.0, 4.0, 11.0, 10.0, 10.0, 6.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.69921875, -3.58953857421875, -3.4798583984375, -3.37017822265625, -3.260498046875, -3.15081787109375, -3.0411376953125, -2.93145751953125, -2.82177734375, -2.71209716796875, -2.6024169921875, -2.49273681640625, -2.383056640625, -2.27337646484375, -2.1636962890625, -2.05401611328125, -1.9443359375, -1.83465576171875, -1.7249755859375, -1.61529541015625, -1.505615234375, -1.39593505859375, -1.2862548828125, -1.17657470703125, -1.06689453125, -0.95721435546875, -0.8475341796875, -0.73785400390625, -0.628173828125, -0.51849365234375, -0.4088134765625, -0.29913330078125, -0.189453125, -0.07977294921875, 0.0299072265625, 0.13958740234375, 0.249267578125, 0.35894775390625, 0.4686279296875, 0.57830810546875, 0.68798828125, 0.79766845703125, 0.9073486328125, 1.01702880859375, 1.126708984375, 1.23638916015625, 1.3460693359375, 1.45574951171875, 1.5654296875, 1.67510986328125, 1.7847900390625, 1.89447021484375, 2.004150390625, 2.11383056640625, 2.2235107421875, 2.33319091796875, 2.44287109375, 2.55255126953125, 2.6622314453125, 2.77191162109375, 2.881591796875, 2.99127197265625, 3.1009521484375, 3.21063232421875, 3.3203125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 3.0, 5.0, 6.0, 16.0, 21.0, 16.0, 34.0, 42.0, 63.0, 65.0, 112.0, 161.0, 243.0, 470.0, 798.0, 1705.0, 3749.0, 8939.0, 22968.0, 66661.0, 226912.0, 935825.0, 1868261.0, 777475.0, 186929.0, 56947.0, 20645.0, 8158.0, 3394.0, 1634.0, 773.0, 451.0, 243.0, 165.0, 103.0, 75.0, 57.0, 55.0, 29.0, 15.0, 12.0, 15.0, 11.0, 11.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6796875, -5.47991943359375, -5.2801513671875, -5.08038330078125, -4.880615234375, -4.68084716796875, -4.4810791015625, -4.28131103515625, -4.08154296875, -3.88177490234375, -3.6820068359375, -3.48223876953125, -3.282470703125, -3.08270263671875, -2.8829345703125, -2.68316650390625, -2.4833984375, -2.28363037109375, -2.0838623046875, -1.88409423828125, -1.684326171875, -1.48455810546875, -1.2847900390625, -1.08502197265625, -0.88525390625, -0.68548583984375, -0.4857177734375, -0.28594970703125, -0.086181640625, 0.11358642578125, 0.3133544921875, 0.51312255859375, 0.712890625, 0.91265869140625, 1.1124267578125, 1.31219482421875, 1.511962890625, 1.71173095703125, 1.9114990234375, 2.11126708984375, 2.31103515625, 2.51080322265625, 2.7105712890625, 2.91033935546875, 3.110107421875, 3.30987548828125, 3.5096435546875, 3.70941162109375, 3.9091796875, 4.10894775390625, 4.3087158203125, 4.50848388671875, 4.708251953125, 4.90802001953125, 5.1077880859375, 5.30755615234375, 5.50732421875, 5.70709228515625, 5.9068603515625, 6.10662841796875, 6.306396484375, 6.50616455078125, 6.7059326171875, 6.90570068359375, 7.10546875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 11.0, 17.0, 25.0, 44.0, 76.0, 144.0, 208.0, 310.0, 548.0, 767.0, 690.0, 466.0, 286.0, 203.0, 105.0, 60.0, 44.0, 23.0, 19.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.875, -22.3863525390625, -21.897705078125, -21.4090576171875, -20.92041015625, -20.4317626953125, -19.943115234375, -19.4544677734375, -18.9658203125, -18.4771728515625, -17.988525390625, -17.4998779296875, -17.01123046875, -16.5225830078125, -16.033935546875, -15.5452880859375, -15.056640625, -14.5679931640625, -14.079345703125, -13.5906982421875, -13.10205078125, -12.6134033203125, -12.124755859375, -11.6361083984375, -11.1474609375, -10.6588134765625, -10.170166015625, -9.6815185546875, -9.19287109375, -8.7042236328125, -8.215576171875, -7.7269287109375, -7.23828125, -6.7496337890625, -6.260986328125, -5.7723388671875, -5.28369140625, -4.7950439453125, -4.306396484375, -3.8177490234375, -3.3291015625, -2.8404541015625, -2.351806640625, -1.8631591796875, -1.37451171875, -0.8858642578125, -0.397216796875, 0.0914306640625, 0.580078125, 1.0687255859375, 1.557373046875, 2.0460205078125, 2.53466796875, 3.0233154296875, 3.511962890625, 4.0006103515625, 4.4892578125, 4.9779052734375, 5.466552734375, 5.9552001953125, 6.44384765625, 6.9324951171875, 7.421142578125, 7.9097900390625, 8.3984375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 20.0, 15.0, 24.0, 49.0, 87.0, 159.0, 245.0, 512.0, 1770.0, 13934.0, 415126.0, 3604877.0, 148354.0, 7079.0, 1118.0, 387.0, 219.0, 115.0, 85.0, 45.0, 23.0, 16.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.609375, -15.653076171875, -14.69677734375, -13.740478515625, -12.7841796875, -11.827880859375, -10.87158203125, -9.915283203125, -8.958984375, -8.002685546875, -7.04638671875, -6.090087890625, -5.1337890625, -4.177490234375, -3.22119140625, -2.264892578125, -1.30859375, -0.352294921875, 0.60400390625, 1.560302734375, 2.5166015625, 3.472900390625, 4.42919921875, 5.385498046875, 6.341796875, 7.298095703125, 8.25439453125, 9.210693359375, 10.1669921875, 11.123291015625, 12.07958984375, 13.035888671875, 13.9921875, 14.948486328125, 15.90478515625, 16.861083984375, 17.8173828125, 18.773681640625, 19.72998046875, 20.686279296875, 21.642578125, 22.598876953125, 23.55517578125, 24.511474609375, 25.4677734375, 26.424072265625, 27.38037109375, 28.336669921875, 29.29296875, 30.249267578125, 31.20556640625, 32.161865234375, 33.1181640625, 34.074462890625, 35.03076171875, 35.987060546875, 36.943359375, 37.899658203125, 38.85595703125, 39.812255859375, 40.7685546875, 41.724853515625, 42.68115234375, 43.637451171875, 44.59375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 19.0, 34.0, 59.0, 93.0, 128.0, 146.0, 152.0, 132.0, 100.0, 71.0, 33.0, 23.0, 9.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.00104522705078, -116.72124481201172, -114.44144439697266, -112.1616439819336, -109.88184356689453, -107.60203552246094, -105.32223510742188, -103.04243469238281, -100.76263427734375, -98.48283386230469, -96.20303344726562, -93.92323303222656, -91.6434326171875, -89.36363220214844, -87.08383178710938, -84.80402374267578, -82.52423095703125, -80.24443054199219, -77.96463012695312, -75.68482971191406, -73.405029296875, -71.12522888183594, -68.84542846679688, -66.56562042236328, -64.28582000732422, -62.006019592285156, -59.726219177246094, -57.44641876220703, -55.1666145324707, -52.88681411743164, -50.60701370239258, -48.327213287353516, -46.04740524291992, -43.76760482788086, -41.4878044128418, -39.20800018310547, -36.928199768066406, -34.648399353027344, -32.36859893798828, -30.08879852294922, -27.808996200561523, -25.52919578552246, -23.249393463134766, -20.969593048095703, -18.68979263305664, -16.409990310668945, -14.130189895629883, -11.850388526916504, -9.570587158203125, -7.290785789489746, -5.010984897613525, -2.7311840057373047, -0.4513826370239258, 1.8284187316894531, 4.108219146728516, 6.3880205154418945, 8.667821884155273, 10.947623252868652, 13.227424621582031, 15.507225036621094, 17.787025451660156, 20.06682777404785, 22.346628189086914, 24.62643051147461, 26.906230926513672]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 4.0, 9.0, 6.0, 3.0, 8.0, 13.0, 13.0, 12.0, 22.0, 24.0, 36.0, 23.0, 35.0, 29.0, 42.0, 28.0, 36.0, 42.0, 45.0, 38.0, 39.0, 37.0, 45.0, 46.0, 28.0, 44.0, 38.0, 31.0, 23.0, 28.0, 22.0, 26.0, 22.0, 14.0, 12.0, 10.0, 16.0, 9.0, 7.0, 8.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.35723876953125, -28.36712074279785, -27.377004623413086, -26.386886596679688, -25.39676856994629, -24.40665054321289, -23.416534423828125, -22.426416397094727, -21.436298370361328, -20.44618034362793, -19.456064224243164, -18.465946197509766, -17.475828170776367, -16.48571014404297, -15.495594024658203, -14.505475997924805, -13.515359878540039, -12.525242805480957, -11.535124778747559, -10.545007705688477, -9.554889678955078, -8.564772605895996, -7.574655532836914, -6.584537982940674, -5.594420433044434, -4.604302883148193, -3.6141855716705322, -2.624068260192871, -1.6339507102966309, -0.6438331604003906, 0.3462839126586914, 1.3364014625549316, 2.326519012451172, 3.316636562347412, 4.306754112243652, 5.296871185302734, 6.286988735198975, 7.277106285095215, 8.267223358154297, 9.257341384887695, 10.247458457946777, 11.23757553100586, 12.227693557739258, 13.21781063079834, 14.207927703857422, 15.19804573059082, 16.18816375732422, 17.178279876708984, 18.168397903442383, 19.15851593017578, 20.148632049560547, 21.138750076293945, 22.128868103027344, 23.11898422241211, 24.109102249145508, 25.099220275878906, 26.089336395263672, 27.07945442199707, 28.069570541381836, 29.059688568115234, 30.049806594848633, 31.03992462158203, 32.0300407409668, 33.02015686035156, 34.010276794433594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 4.0, 12.0, 12.0, 16.0, 16.0, 15.0, 14.0, 24.0, 21.0, 29.0, 38.0, 27.0, 35.0, 26.0, 44.0, 44.0, 41.0, 45.0, 47.0, 41.0, 33.0, 44.0, 31.0, 49.0, 39.0, 21.0, 25.0, 32.0, 17.0, 29.0, 19.0, 16.0, 16.0, 15.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.2421875, -4.122314453125, -4.00244140625, -3.882568359375, -3.7626953125, -3.642822265625, -3.52294921875, -3.403076171875, -3.283203125, -3.163330078125, -3.04345703125, -2.923583984375, -2.8037109375, -2.683837890625, -2.56396484375, -2.444091796875, -2.32421875, -2.204345703125, -2.08447265625, -1.964599609375, -1.8447265625, -1.724853515625, -1.60498046875, -1.485107421875, -1.365234375, -1.245361328125, -1.12548828125, -1.005615234375, -0.8857421875, -0.765869140625, -0.64599609375, -0.526123046875, -0.40625, -0.286376953125, -0.16650390625, -0.046630859375, 0.0732421875, 0.193115234375, 0.31298828125, 0.432861328125, 0.552734375, 0.672607421875, 0.79248046875, 0.912353515625, 1.0322265625, 1.152099609375, 1.27197265625, 1.391845703125, 1.51171875, 1.631591796875, 1.75146484375, 1.871337890625, 1.9912109375, 2.111083984375, 2.23095703125, 2.350830078125, 2.470703125, 2.590576171875, 2.71044921875, 2.830322265625, 2.9501953125, 3.070068359375, 3.18994140625, 3.309814453125, 3.4296875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 6.0, 14.0, 14.0, 34.0, 32.0, 66.0, 85.0, 149.0, 241.0, 424.0, 697.0, 1111.0, 2004.0, 3583.0, 6117.0, 10632.0, 18427.0, 31117.0, 52396.0, 86477.0, 135163.0, 185645.0, 181689.0, 129730.0, 81973.0, 49918.0, 29813.0, 17379.0, 9928.0, 5794.0, 3174.0, 1887.0, 1120.0, 638.0, 396.0, 230.0, 162.0, 108.0, 64.0, 40.0, 31.0, 18.0, 7.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.7900390625, -0.7674331665039062, -0.7448272705078125, -0.7222213745117188, -0.699615478515625, -0.6770095825195312, -0.6544036865234375, -0.6317977905273438, -0.60919189453125, -0.5865859985351562, -0.5639801025390625, -0.5413742065429688, -0.518768310546875, -0.49616241455078125, -0.4735565185546875, -0.45095062255859375, -0.4283447265625, -0.40573883056640625, -0.3831329345703125, -0.36052703857421875, -0.337921142578125, -0.31531524658203125, -0.2927093505859375, -0.27010345458984375, -0.24749755859375, -0.22489166259765625, -0.2022857666015625, -0.17967987060546875, -0.157073974609375, -0.13446807861328125, -0.1118621826171875, -0.08925628662109375, -0.066650390625, -0.04404449462890625, -0.0214385986328125, 0.00116729736328125, 0.023773193359375, 0.04637908935546875, 0.0689849853515625, 0.09159088134765625, 0.11419677734375, 0.13680267333984375, 0.1594085693359375, 0.18201446533203125, 0.204620361328125, 0.22722625732421875, 0.2498321533203125, 0.27243804931640625, 0.2950439453125, 0.31764984130859375, 0.3402557373046875, 0.36286163330078125, 0.385467529296875, 0.40807342529296875, 0.4306793212890625, 0.45328521728515625, 0.47589111328125, 0.49849700927734375, 0.5211029052734375, 0.5437088012695312, 0.566314697265625, 0.5889205932617188, 0.6115264892578125, 0.6341323852539062, 0.65673828125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 9.0, 6.0, 14.0, 15.0, 12.0, 11.0, 11.0, 16.0, 22.0, 25.0, 23.0, 27.0, 30.0, 33.0, 51.0, 13.0, 32.0, 37.0, 42.0, 1062.0, 33.0, 43.0, 40.0, 33.0, 45.0, 27.0, 29.0, 29.0, 32.0, 33.0, 31.0, 26.0, 35.0, 15.0, 20.0, 6.0, 13.0, 10.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.266845703125, -2.18798828125, -2.109130859375, -2.0302734375, -1.951416015625, -1.87255859375, -1.793701171875, -1.71484375, -1.635986328125, -1.55712890625, -1.478271484375, -1.3994140625, -1.320556640625, -1.24169921875, -1.162841796875, -1.083984375, -1.005126953125, -0.92626953125, -0.847412109375, -0.7685546875, -0.689697265625, -0.61083984375, -0.531982421875, -0.453125, -0.374267578125, -0.29541015625, -0.216552734375, -0.1376953125, -0.058837890625, 0.02001953125, 0.098876953125, 0.177734375, 0.256591796875, 0.33544921875, 0.414306640625, 0.4931640625, 0.572021484375, 0.65087890625, 0.729736328125, 0.80859375, 0.887451171875, 0.96630859375, 1.045166015625, 1.1240234375, 1.202880859375, 1.28173828125, 1.360595703125, 1.439453125, 1.518310546875, 1.59716796875, 1.676025390625, 1.7548828125, 1.833740234375, 1.91259765625, 1.991455078125, 2.0703125, 2.149169921875, 2.22802734375, 2.306884765625, 2.3857421875, 2.464599609375, 2.54345703125, 2.622314453125, 2.701171875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 9.0, 21.0, 26.0, 29.0, 45.0, 67.0, 109.0, 153.0, 247.0, 383.0, 529.0, 885.0, 1307.0, 2064.0, 3169.0, 5142.0, 8410.0, 13718.0, 21741.0, 34974.0, 54834.0, 84115.0, 122299.0, 250013.0, 1115494.0, 128683.0, 89935.0, 59077.0, 37424.0, 23415.0, 14586.0, 8877.0, 5564.0, 3505.0, 2177.0, 1441.0, 870.0, 608.0, 397.0, 257.0, 176.0, 121.0, 82.0, 56.0, 36.0, 17.0, 19.0, 13.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33935546875, -0.3287773132324219, -0.31819915771484375, -0.3076210021972656, -0.2970428466796875, -0.2864646911621094, -0.27588653564453125, -0.2653083801269531, -0.254730224609375, -0.24415206909179688, -0.23357391357421875, -0.22299575805664062, -0.2124176025390625, -0.20183944702148438, -0.19126129150390625, -0.18068313598632812, -0.17010498046875, -0.15952682495117188, -0.14894866943359375, -0.13837051391601562, -0.1277923583984375, -0.11721420288085938, -0.10663604736328125, -0.09605789184570312, -0.085479736328125, -0.07490158081054688, -0.06432342529296875, -0.053745269775390625, -0.0431671142578125, -0.032588958740234375, -0.02201080322265625, -0.011432647705078125, -0.0008544921875, 0.009723663330078125, 0.02030181884765625, 0.030879974365234375, 0.0414581298828125, 0.052036285400390625, 0.06261444091796875, 0.07319259643554688, 0.083770751953125, 0.09434890747070312, 0.10492706298828125, 0.11550521850585938, 0.1260833740234375, 0.13666152954101562, 0.14723968505859375, 0.15781784057617188, 0.16839599609375, 0.17897415161132812, 0.18955230712890625, 0.20013046264648438, 0.2107086181640625, 0.22128677368164062, 0.23186492919921875, 0.24244308471679688, 0.253021240234375, 0.2635993957519531, 0.27417755126953125, 0.2847557067871094, 0.2953338623046875, 0.3059120178222656, 0.31649017333984375, 0.3270683288574219, 0.337646484375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 3.0, 6.0, 15.0, 13.0, 13.0, 15.0, 24.0, 17.0, 37.0, 38.0, 38.0, 41.0, 34.0, 51.0, 102.0, 139.0, 55.0, 38.0, 41.0, 33.0, 35.0, 29.0, 27.0, 18.0, 11.0, 24.0, 20.0, 19.0, 6.0, 5.0, 5.0, 5.0, 1.0, 5.0, 4.0, 1.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0193023681640625, -0.01864004135131836, -0.01797771453857422, -0.017315387725830078, -0.016653060913085938, -0.015990734100341797, -0.015328407287597656, -0.014666080474853516, -0.014003753662109375, -0.013341426849365234, -0.012679100036621094, -0.012016773223876953, -0.011354446411132812, -0.010692119598388672, -0.010029792785644531, -0.00936746597290039, -0.00870513916015625, -0.00804281234741211, -0.007380485534667969, -0.006718158721923828, -0.0060558319091796875, -0.005393505096435547, -0.004731178283691406, -0.004068851470947266, -0.003406524658203125, -0.0027441978454589844, -0.0020818710327148438, -0.0014195442199707031, -0.0007572174072265625, -9.489059448242188e-05, 0.0005674362182617188, 0.0012297630310058594, 0.00189208984375, 0.0025544166564941406, 0.0032167434692382812, 0.003879070281982422, 0.0045413970947265625, 0.005203723907470703, 0.005866050720214844, 0.006528377532958984, 0.007190704345703125, 0.007853031158447266, 0.008515357971191406, 0.009177684783935547, 0.009840011596679688, 0.010502338409423828, 0.011164665222167969, 0.01182699203491211, 0.01248931884765625, 0.01315164566040039, 0.013813972473144531, 0.014476299285888672, 0.015138626098632812, 0.015800952911376953, 0.016463279724121094, 0.017125606536865234, 0.017787933349609375, 0.018450260162353516, 0.019112586975097656, 0.019774913787841797, 0.020437240600585938, 0.021099567413330078, 0.02176189422607422, 0.02242422103881836, 0.0230865478515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 6.0, 4.0, 5.0, 10.0, 16.0, 21.0, 26.0, 22.0, 28.0, 46.0, 54.0, 98.0, 147.0, 226.0, 429.0, 1479.0, 146466.0, 895532.0, 2570.0, 544.0, 294.0, 150.0, 103.0, 55.0, 45.0, 40.0, 25.0, 22.0, 15.0, 14.0, 13.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.44580078125, -0.43310546875, -0.42041015625, -0.40771484375, -0.39501953125, -0.38232421875, -0.36962890625, -0.35693359375, -0.34423828125, -0.33154296875, -0.31884765625, -0.30615234375, -0.29345703125, -0.28076171875, -0.26806640625, -0.25537109375, -0.24267578125, -0.22998046875, -0.21728515625, -0.20458984375, -0.19189453125, -0.17919921875, -0.16650390625, -0.15380859375, -0.14111328125, -0.12841796875, -0.11572265625, -0.10302734375, -0.09033203125, -0.07763671875, -0.06494140625, -0.05224609375, -0.03955078125, -0.02685546875, -0.01416015625, -0.00146484375, 0.01123046875, 0.02392578125, 0.03662109375, 0.04931640625, 0.06201171875, 0.07470703125, 0.08740234375, 0.10009765625, 0.11279296875, 0.12548828125, 0.13818359375, 0.15087890625, 0.16357421875, 0.17626953125, 0.18896484375, 0.20166015625, 0.21435546875, 0.22705078125, 0.23974609375, 0.25244140625, 0.26513671875, 0.27783203125, 0.29052734375, 0.30322265625, 0.31591796875, 0.32861328125, 0.34130859375, 0.35400390625, 0.36669921875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 136.0, 847.0, 26.0, 3.0, 0.0, 1.0], "bins": [-0.7807208299636841, -0.7675497531890869, -0.7543787360191345, -0.7412076592445374, -0.728036642074585, -0.7148655652999878, -0.7016944885253906, -0.6885234713554382, -0.6753523945808411, -0.6621813178062439, -0.6490103006362915, -0.6358392238616943, -0.6226682066917419, -0.6094971299171448, -0.5963261127471924, -0.5831550359725952, -0.5699840188026428, -0.5568129420280457, -0.5436419248580933, -0.5304708480834961, -0.5172998309135437, -0.5041287541389465, -0.49095770716667175, -0.477786660194397, -0.4646155834197998, -0.451444536447525, -0.43827348947525024, -0.4251024127006531, -0.4119313657283783, -0.3987603187561035, -0.38558927178382874, -0.37241822481155396, -0.3592471480369568, -0.346076101064682, -0.3329050540924072, -0.31973397731781006, -0.3065629303455353, -0.2933918833732605, -0.2802208364009857, -0.26704978942871094, -0.25387874245643616, -0.24070769548416138, -0.2275366336107254, -0.21436558663845062, -0.20119453966617584, -0.18802347779273987, -0.1748524308204651, -0.1616813838481903, -0.14851033687591553, -0.13533928990364075, -0.12216823548078537, -0.10899718105792999, -0.09582613408565521, -0.08265507966279984, -0.06948402523994446, -0.05631297826766968, -0.043141916394233704, -0.029970865696668625, -0.016799813136458397, -0.003628760576248169, 0.00954229012131691, 0.02271334081888199, 0.035884395241737366, 0.049055442214012146, 0.06222649663686752]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 2.0, 11.0, 9.0, 10.0, 27.0, 18.0, 20.0, 18.0, 46.0, 24.0, 33.0, 31.0, 29.0, 36.0, 30.0, 48.0, 55.0, 48.0, 41.0, 37.0, 39.0, 33.0, 42.0, 45.0, 39.0, 23.0, 34.0, 32.0, 20.0, 19.0, 15.0, 15.0, 8.0, 7.0, 11.0, 13.0, 3.0, 6.0, 4.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04860180616378784, -0.04721115157008171, -0.04582049697637558, -0.04442983865737915, -0.04303918406367302, -0.04164852946996689, -0.04025787115097046, -0.03886721655726433, -0.0374765619635582, -0.036085907369852066, -0.034695252776145935, -0.033304594457149506, -0.031913939863443375, -0.030523285269737244, -0.029132628813385963, -0.027741972357034683, -0.026351317763328552, -0.02496066316962242, -0.02357000671327114, -0.02217935025691986, -0.02078869566321373, -0.0193980410695076, -0.01800738461315632, -0.01661672815680504, -0.015226073563098907, -0.013835418038070202, -0.012444762513041496, -0.01105410698801279, -0.009663451462984085, -0.00827279593795538, -0.006882140412926674, -0.005491484887897968, -0.004100829362869263, -0.002710173837840557, -0.0013195183128118515, 7.11372122168541e-05, 0.0014617927372455597, 0.0028524482622742653, 0.004243103787302971, 0.0056337593123316765, 0.007024414837360382, 0.008415070362389088, 0.009805725887417793, 0.011196381412446499, 0.012587036937475204, 0.01397769246250391, 0.015368347987532616, 0.016759004443883896, 0.018149659037590027, 0.019540313631296158, 0.020930970087647438, 0.022321626543998718, 0.02371228113770485, 0.02510293573141098, 0.02649359218776226, 0.02788424864411354, 0.02927490323781967, 0.030665557831525803, 0.032056212425231934, 0.03344687074422836, 0.034837525337934494, 0.036228179931640625, 0.037618838250637054, 0.039009492844343185, 0.040400147438049316]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 11.0, 4.0, 12.0, 12.0, 16.0, 16.0, 15.0, 15.0, 23.0, 22.0, 28.0, 38.0, 27.0, 35.0, 26.0, 44.0, 45.0, 40.0, 46.0, 46.0, 43.0, 31.0, 44.0, 30.0, 50.0, 39.0, 21.0, 26.0, 31.0, 16.0, 30.0, 19.0, 15.0, 17.0, 15.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.2421875, -4.122314453125, -4.00244140625, -3.882568359375, -3.7626953125, -3.642822265625, -3.52294921875, -3.403076171875, -3.283203125, -3.163330078125, -3.04345703125, -2.923583984375, -2.8037109375, -2.683837890625, -2.56396484375, -2.444091796875, -2.32421875, -2.204345703125, -2.08447265625, -1.964599609375, -1.8447265625, -1.724853515625, -1.60498046875, -1.485107421875, -1.365234375, -1.245361328125, -1.12548828125, -1.005615234375, -0.8857421875, -0.765869140625, -0.64599609375, -0.526123046875, -0.40625, -0.286376953125, -0.16650390625, -0.046630859375, 0.0732421875, 0.193115234375, 0.31298828125, 0.432861328125, 0.552734375, 0.672607421875, 0.79248046875, 0.912353515625, 1.0322265625, 1.152099609375, 1.27197265625, 1.391845703125, 1.51171875, 1.631591796875, 1.75146484375, 1.871337890625, 1.9912109375, 2.111083984375, 2.23095703125, 2.350830078125, 2.470703125, 2.590576171875, 2.71044921875, 2.830322265625, 2.9501953125, 3.070068359375, 3.18994140625, 3.309814453125, 3.4296875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 21.0, 24.0, 33.0, 56.0, 97.0, 114.0, 211.0, 349.0, 535.0, 944.0, 1532.0, 2549.0, 4462.0, 7931.0, 14200.0, 24847.0, 45034.0, 84832.0, 178943.0, 301586.0, 186402.0, 88208.0, 46016.0, 25670.0, 14550.0, 8165.0, 4672.0, 2562.0, 1553.0, 904.0, 559.0, 376.0, 222.0, 154.0, 71.0, 70.0, 40.0, 19.0, 12.0, 11.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.05078125, -2.950836181640625, -2.85089111328125, -2.750946044921875, -2.6510009765625, -2.551055908203125, -2.45111083984375, -2.351165771484375, -2.251220703125, -2.151275634765625, -2.05133056640625, -1.951385498046875, -1.8514404296875, -1.751495361328125, -1.65155029296875, -1.551605224609375, -1.45166015625, -1.351715087890625, -1.25177001953125, -1.151824951171875, -1.0518798828125, -0.951934814453125, -0.85198974609375, -0.752044677734375, -0.652099609375, -0.552154541015625, -0.45220947265625, -0.352264404296875, -0.2523193359375, -0.152374267578125, -0.05242919921875, 0.047515869140625, 0.1474609375, 0.247406005859375, 0.34735107421875, 0.447296142578125, 0.5472412109375, 0.647186279296875, 0.74713134765625, 0.847076416015625, 0.947021484375, 1.046966552734375, 1.14691162109375, 1.246856689453125, 1.3468017578125, 1.446746826171875, 1.54669189453125, 1.646636962890625, 1.74658203125, 1.846527099609375, 1.94647216796875, 2.046417236328125, 2.1463623046875, 2.246307373046875, 2.34625244140625, 2.446197509765625, 2.546142578125, 2.646087646484375, 2.74603271484375, 2.845977783203125, 2.9459228515625, 3.045867919921875, 3.14581298828125, 3.245758056640625, 3.345703125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 6.0, 4.0, 10.0, 8.0, 16.0, 17.0, 10.0, 14.0, 21.0, 27.0, 24.0, 32.0, 36.0, 41.0, 47.0, 53.0, 97.0, 162.0, 339.0, 1390.0, 182.0, 96.0, 61.0, 51.0, 37.0, 27.0, 31.0, 37.0, 26.0, 19.0, 21.0, 14.0, 11.0, 10.0, 8.0, 6.0, 11.0, 6.0, 7.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5859375, -13.149658203125, -12.71337890625, -12.277099609375, -11.8408203125, -11.404541015625, -10.96826171875, -10.531982421875, -10.095703125, -9.659423828125, -9.22314453125, -8.786865234375, -8.3505859375, -7.914306640625, -7.47802734375, -7.041748046875, -6.60546875, -6.169189453125, -5.73291015625, -5.296630859375, -4.8603515625, -4.424072265625, -3.98779296875, -3.551513671875, -3.115234375, -2.678955078125, -2.24267578125, -1.806396484375, -1.3701171875, -0.933837890625, -0.49755859375, -0.061279296875, 0.375, 0.811279296875, 1.24755859375, 1.683837890625, 2.1201171875, 2.556396484375, 2.99267578125, 3.428955078125, 3.865234375, 4.301513671875, 4.73779296875, 5.174072265625, 5.6103515625, 6.046630859375, 6.48291015625, 6.919189453125, 7.35546875, 7.791748046875, 8.22802734375, 8.664306640625, 9.1005859375, 9.536865234375, 9.97314453125, 10.409423828125, 10.845703125, 11.281982421875, 11.71826171875, 12.154541015625, 12.5908203125, 13.027099609375, 13.46337890625, 13.899658203125, 14.3359375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 8.0, 5.0, 5.0, 5.0, 15.0, 17.0, 13.0, 15.0, 22.0, 19.0, 39.0, 39.0, 69.0, 77.0, 95.0, 140.0, 210.0, 306.0, 574.0, 2230.0, 23157.0, 2828467.0, 281566.0, 6056.0, 1139.0, 412.0, 265.0, 197.0, 142.0, 82.0, 54.0, 51.0, 43.0, 39.0, 39.0, 23.0, 13.0, 15.0, 7.0, 6.0, 7.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-30.09375, -29.17529296875, -28.2568359375, -27.33837890625, -26.419921875, -25.50146484375, -24.5830078125, -23.66455078125, -22.74609375, -21.82763671875, -20.9091796875, -19.99072265625, -19.072265625, -18.15380859375, -17.2353515625, -16.31689453125, -15.3984375, -14.47998046875, -13.5615234375, -12.64306640625, -11.724609375, -10.80615234375, -9.8876953125, -8.96923828125, -8.05078125, -7.13232421875, -6.2138671875, -5.29541015625, -4.376953125, -3.45849609375, -2.5400390625, -1.62158203125, -0.703125, 0.21533203125, 1.1337890625, 2.05224609375, 2.970703125, 3.88916015625, 4.8076171875, 5.72607421875, 6.64453125, 7.56298828125, 8.4814453125, 9.39990234375, 10.318359375, 11.23681640625, 12.1552734375, 13.07373046875, 13.9921875, 14.91064453125, 15.8291015625, 16.74755859375, 17.666015625, 18.58447265625, 19.5029296875, 20.42138671875, 21.33984375, 22.25830078125, 23.1767578125, 24.09521484375, 25.013671875, 25.93212890625, 26.8505859375, 27.76904296875, 28.6875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 10.0, 775.0, 234.0], "bins": [-565.662841796875, -556.6517333984375, -547.640625, -538.6295776367188, -529.6184692382812, -520.6073608398438, -511.59625244140625, -502.5851745605469, -493.5740661621094, -484.5629577636719, -475.5518798828125, -466.540771484375, -457.5296936035156, -448.5185852050781, -439.50750732421875, -430.49639892578125, -421.48529052734375, -412.47418212890625, -403.4631042480469, -394.4519958496094, -385.44091796875, -376.4298095703125, -367.418701171875, -358.4076232910156, -349.39654541015625, -340.38543701171875, -331.3743591308594, -322.3632507324219, -313.3521728515625, -304.341064453125, -295.3299560546875, -286.3188781738281, -277.3077392578125, -268.296630859375, -259.2855529785156, -250.27444458007812, -241.2633514404297, -232.25225830078125, -223.2411651611328, -214.23007202148438, -205.21897888183594, -196.2078857421875, -187.19679260253906, -178.18569946289062, -169.17459106445312, -160.1634979248047, -151.15240478515625, -142.1413116455078, -133.1302032470703, -124.11911010742188, -115.1080093383789, -106.09691619873047, -97.0858154296875, -88.07472229003906, -79.06362915039062, -70.05253601074219, -61.04144287109375, -52.03034591674805, -43.019248962402344, -34.008155822753906, -24.997058868408203, -15.9859619140625, -6.9748687744140625, 2.0362281799316406, 11.04732608795166]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 13.0, 3.0, 8.0, 10.0, 10.0, 15.0, 13.0, 20.0, 20.0, 23.0, 20.0, 23.0, 33.0, 34.0, 31.0, 32.0, 34.0, 37.0, 44.0, 55.0, 43.0, 49.0, 30.0, 38.0, 39.0, 30.0, 36.0, 29.0, 33.0, 30.0, 28.0, 21.0, 21.0, 15.0, 19.0, 14.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-33.69690704345703, -32.65312957763672, -31.60934829711914, -30.565570831298828, -29.521791458129883, -28.478012084960938, -27.434232711791992, -26.390453338623047, -25.346675872802734, -24.30289649963379, -23.259117126464844, -22.21533966064453, -21.171560287475586, -20.12778091430664, -19.084001541137695, -18.04022216796875, -16.996442794799805, -15.95266342163086, -14.90888500213623, -13.865105628967285, -12.821327209472656, -11.777547836303711, -10.733768463134766, -9.68998908996582, -8.646210670471191, -7.602431774139404, -6.558652877807617, -5.514873504638672, -4.471094608306885, -3.4273157119750977, -2.3835363388061523, -1.3397574424743652, -0.2959785461425781, 0.7478004693984985, 1.7915794849395752, 2.8353586196899414, 3.8791375160217285, 4.922916412353516, 5.966695785522461, 7.010474681854248, 8.054253578186035, 9.09803295135498, 10.14181137084961, 11.185590744018555, 12.2293701171875, 13.273148536682129, 14.316927909851074, 15.360706329345703, 16.40448570251465, 17.448265075683594, 18.49204444885254, 19.535823822021484, 20.579601287841797, 21.623380661010742, 22.667160034179688, 23.710939407348633, 24.754718780517578, 25.798498153686523, 26.84227752685547, 27.88605499267578, 28.929834365844727, 29.973613739013672, 31.017393112182617, 32.06117248535156, 33.104949951171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 10.0, 9.0, 11.0, 11.0, 13.0, 12.0, 18.0, 14.0, 21.0, 24.0, 22.0, 28.0, 28.0, 41.0, 36.0, 51.0, 42.0, 34.0, 39.0, 44.0, 39.0, 36.0, 42.0, 27.0, 37.0, 30.0, 27.0, 24.0, 23.0, 25.0, 24.0, 28.0, 16.0, 19.0, 15.0, 10.0, 18.0, 6.0, 6.0, 6.0, 7.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.23828125, -4.118896484375, -3.99951171875, -3.880126953125, -3.7607421875, -3.641357421875, -3.52197265625, -3.402587890625, -3.283203125, -3.163818359375, -3.04443359375, -2.925048828125, -2.8056640625, -2.686279296875, -2.56689453125, -2.447509765625, -2.328125, -2.208740234375, -2.08935546875, -1.969970703125, -1.8505859375, -1.731201171875, -1.61181640625, -1.492431640625, -1.373046875, -1.253662109375, -1.13427734375, -1.014892578125, -0.8955078125, -0.776123046875, -0.65673828125, -0.537353515625, -0.41796875, -0.298583984375, -0.17919921875, -0.059814453125, 0.0595703125, 0.178955078125, 0.29833984375, 0.417724609375, 0.537109375, 0.656494140625, 0.77587890625, 0.895263671875, 1.0146484375, 1.134033203125, 1.25341796875, 1.372802734375, 1.4921875, 1.611572265625, 1.73095703125, 1.850341796875, 1.9697265625, 2.089111328125, 2.20849609375, 2.327880859375, 2.447265625, 2.566650390625, 2.68603515625, 2.805419921875, 2.9248046875, 3.044189453125, 3.16357421875, 3.282958984375, 3.40234375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 9.0, 19.0, 14.0, 21.0, 14.0, 32.0, 30.0, 60.0, 75.0, 155.0, 307.0, 849.0, 3206.0, 17713.0, 166785.0, 2420441.0, 1478721.0, 90995.0, 11256.0, 2274.0, 655.0, 203.0, 133.0, 62.0, 52.0, 28.0, 27.0, 25.0, 16.0, 15.0, 19.0, 9.0, 9.0, 8.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.625, -16.1741943359375, -15.723388671875, -15.2725830078125, -14.82177734375, -14.3709716796875, -13.920166015625, -13.4693603515625, -13.0185546875, -12.5677490234375, -12.116943359375, -11.6661376953125, -11.21533203125, -10.7645263671875, -10.313720703125, -9.8629150390625, -9.412109375, -8.9613037109375, -8.510498046875, -8.0596923828125, -7.60888671875, -7.1580810546875, -6.707275390625, -6.2564697265625, -5.8056640625, -5.3548583984375, -4.904052734375, -4.4532470703125, -4.00244140625, -3.5516357421875, -3.100830078125, -2.6500244140625, -2.19921875, -1.7484130859375, -1.297607421875, -0.8468017578125, -0.39599609375, 0.0548095703125, 0.505615234375, 0.9564208984375, 1.4072265625, 1.8580322265625, 2.308837890625, 2.7596435546875, 3.21044921875, 3.6612548828125, 4.112060546875, 4.5628662109375, 5.013671875, 5.4644775390625, 5.915283203125, 6.3660888671875, 6.81689453125, 7.2677001953125, 7.718505859375, 8.1693115234375, 8.6201171875, 9.0709228515625, 9.521728515625, 9.9725341796875, 10.42333984375, 10.8741455078125, 11.324951171875, 11.7757568359375, 12.2265625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 16.0, 29.0, 29.0, 40.0, 49.0, 84.0, 95.0, 137.0, 187.0, 287.0, 330.0, 450.0, 467.0, 461.0, 357.0, 284.0, 191.0, 146.0, 108.0, 70.0, 59.0, 44.0, 34.0, 27.0, 21.0, 9.0, 14.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.4222412109375, -11.110107421875, -10.7979736328125, -10.48583984375, -10.1737060546875, -9.861572265625, -9.5494384765625, -9.2373046875, -8.9251708984375, -8.613037109375, -8.3009033203125, -7.98876953125, -7.6766357421875, -7.364501953125, -7.0523681640625, -6.740234375, -6.4281005859375, -6.115966796875, -5.8038330078125, -5.49169921875, -5.1795654296875, -4.867431640625, -4.5552978515625, -4.2431640625, -3.9310302734375, -3.618896484375, -3.3067626953125, -2.99462890625, -2.6824951171875, -2.370361328125, -2.0582275390625, -1.74609375, -1.4339599609375, -1.121826171875, -0.8096923828125, -0.49755859375, -0.1854248046875, 0.126708984375, 0.4388427734375, 0.7509765625, 1.0631103515625, 1.375244140625, 1.6873779296875, 1.99951171875, 2.3116455078125, 2.623779296875, 2.9359130859375, 3.248046875, 3.5601806640625, 3.872314453125, 4.1844482421875, 4.49658203125, 4.8087158203125, 5.120849609375, 5.4329833984375, 5.7451171875, 6.0572509765625, 6.369384765625, 6.6815185546875, 6.99365234375, 7.3057861328125, 7.617919921875, 7.9300537109375, 8.2421875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 23.0, 25.0, 39.0, 53.0, 78.0, 109.0, 151.0, 269.0, 623.0, 2125.0, 18092.0, 394207.0, 3522775.0, 240025.0, 12601.0, 1796.0, 475.0, 297.0, 161.0, 107.0, 67.0, 64.0, 36.0, 19.0, 16.0, 16.0, 10.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.1708984375, -22.326171875, -21.4814453125, -20.63671875, -19.7919921875, -18.947265625, -18.1025390625, -17.2578125, -16.4130859375, -15.568359375, -14.7236328125, -13.87890625, -13.0341796875, -12.189453125, -11.3447265625, -10.5, -9.6552734375, -8.810546875, -7.9658203125, -7.12109375, -6.2763671875, -5.431640625, -4.5869140625, -3.7421875, -2.8974609375, -2.052734375, -1.2080078125, -0.36328125, 0.4814453125, 1.326171875, 2.1708984375, 3.015625, 3.8603515625, 4.705078125, 5.5498046875, 6.39453125, 7.2392578125, 8.083984375, 8.9287109375, 9.7734375, 10.6181640625, 11.462890625, 12.3076171875, 13.15234375, 13.9970703125, 14.841796875, 15.6865234375, 16.53125, 17.3759765625, 18.220703125, 19.0654296875, 19.91015625, 20.7548828125, 21.599609375, 22.4443359375, 23.2890625, 24.1337890625, 24.978515625, 25.8232421875, 26.66796875, 27.5126953125, 28.357421875, 29.2021484375, 30.046875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 14.0, 45.0, 94.0, 168.0, 205.0, 193.0, 140.0, 88.0, 43.0, 11.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.27609634399414, -30.27997589111328, -27.283857345581055, -24.287738800048828, -21.29161834716797, -18.29549789428711, -15.299379348754883, -12.303260803222656, -9.307140350341797, -6.311020851135254, -3.314901351928711, -0.31878185272216797, 2.677337646484375, 5.673457145690918, 8.669576644897461, 11.665695190429688, 14.661815643310547, 17.657936096191406, 20.654054641723633, 23.65017318725586, 26.64629364013672, 29.642414093017578, 32.63853454589844, 35.63465118408203, 38.63077163696289, 41.62689208984375, 44.623008728027344, 47.6191291809082, 50.61524963378906, 53.61137008666992, 56.60749053955078, 59.603607177734375, 62.5997314453125, 65.5958480834961, 68.59197235107422, 71.58808898925781, 74.58421325683594, 77.58032989501953, 80.57644653320312, 83.57257080078125, 86.56868743896484, 89.56480407714844, 92.56092834472656, 95.55704498291016, 98.55316162109375, 101.54928588867188, 104.54540252685547, 107.54151916503906, 110.53764343261719, 113.53376007080078, 116.5298843383789, 119.5260009765625, 122.52212524414062, 125.51824188232422, 128.5143585205078, 131.51048278808594, 134.506591796875, 137.50271606445312, 140.4988250732422, 143.4949493408203, 146.49107360839844, 149.4871826171875, 152.48330688476562, 155.47943115234375, 158.47555541992188]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 5.0, 10.0, 6.0, 10.0, 9.0, 19.0, 21.0, 18.0, 26.0, 20.0, 26.0, 26.0, 29.0, 38.0, 29.0, 44.0, 42.0, 30.0, 41.0, 36.0, 26.0, 38.0, 39.0, 43.0, 29.0, 39.0, 33.0, 29.0, 26.0, 23.0, 24.0, 14.0, 13.0, 21.0, 18.0, 13.0, 13.0, 10.0, 12.0, 10.0, 6.0, 1.0, 3.0, 7.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0], "bins": [-30.022262573242188, -29.117998123168945, -28.213733673095703, -27.30946922302246, -26.40520477294922, -25.500938415527344, -24.5966739654541, -23.69240951538086, -22.788145065307617, -21.883880615234375, -20.979616165161133, -20.07535171508789, -19.171085357666016, -18.266822814941406, -17.36255645751953, -16.45829200744629, -15.554027557373047, -14.649763107299805, -13.745498657226562, -12.841233253479004, -11.936968803405762, -11.03270435333252, -10.128438949584961, -9.224174499511719, -8.319910049438477, -7.415645599365234, -6.511380672454834, -5.607115745544434, -4.702851295471191, -3.798586845397949, -2.894321918487549, -1.9900569915771484, -1.0857925415039062, -0.18152785301208496, 0.7227368354797363, 1.6270015239715576, 2.531266212463379, 3.435530662536621, 4.3397955894470215, 5.244060516357422, 6.148324966430664, 7.052589416503906, 7.956854343414307, 8.861119270324707, 9.76538372039795, 10.669648170471191, 11.57391357421875, 12.478178024291992, 13.382442474365234, 14.286706924438477, 15.190971374511719, 16.09523582458496, 16.999500274658203, 17.903766632080078, 18.80803108215332, 19.712295532226562, 20.616559982299805, 21.520824432373047, 22.42508888244629, 23.32935333251953, 24.233619689941406, 25.137882232666016, 26.04214859008789, 26.946413040161133, 27.850677490234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 10.0, 13.0, 6.0, 12.0, 15.0, 22.0, 20.0, 23.0, 16.0, 23.0, 33.0, 29.0, 33.0, 40.0, 35.0, 45.0, 41.0, 40.0, 43.0, 42.0, 48.0, 35.0, 39.0, 32.0, 38.0, 40.0, 27.0, 21.0, 28.0, 22.0, 15.0, 20.0, 16.0, 14.0, 16.0, 10.0, 6.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.75421142578125, -3.6314697265625, -3.50872802734375, -3.385986328125, -3.26324462890625, -3.1405029296875, -3.01776123046875, -2.89501953125, -2.77227783203125, -2.6495361328125, -2.52679443359375, -2.404052734375, -2.28131103515625, -2.1585693359375, -2.03582763671875, -1.9130859375, -1.79034423828125, -1.6676025390625, -1.54486083984375, -1.422119140625, -1.29937744140625, -1.1766357421875, -1.05389404296875, -0.93115234375, -0.80841064453125, -0.6856689453125, -0.56292724609375, -0.440185546875, -0.31744384765625, -0.1947021484375, -0.07196044921875, 0.05078125, 0.17352294921875, 0.2962646484375, 0.41900634765625, 0.541748046875, 0.66448974609375, 0.7872314453125, 0.90997314453125, 1.03271484375, 1.15545654296875, 1.2781982421875, 1.40093994140625, 1.523681640625, 1.64642333984375, 1.7691650390625, 1.89190673828125, 2.0146484375, 2.13739013671875, 2.2601318359375, 2.38287353515625, 2.505615234375, 2.62835693359375, 2.7510986328125, 2.87384033203125, 2.99658203125, 3.11932373046875, 3.2420654296875, 3.36480712890625, 3.487548828125, 3.61029052734375, 3.7330322265625, 3.85577392578125, 3.978515625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 7.0, 7.0, 7.0, 21.0, 21.0, 35.0, 44.0, 64.0, 103.0, 140.0, 216.0, 333.0, 471.0, 705.0, 1086.0, 1552.0, 2190.0, 3200.0, 4800.0, 6959.0, 10207.0, 15140.0, 21857.0, 32099.0, 46145.0, 66792.0, 91407.0, 119621.0, 139805.0, 129974.0, 103810.0, 76666.0, 54182.0, 37641.0, 25531.0, 17760.0, 12211.0, 8176.0, 5376.0, 3931.0, 2588.0, 1873.0, 1268.0, 776.0, 533.0, 425.0, 282.0, 174.0, 120.0, 63.0, 55.0, 43.0, 22.0, 21.0, 8.0, 11.0, 7.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.53955078125, -0.5225372314453125, -0.505523681640625, -0.4885101318359375, -0.47149658203125, -0.4544830322265625, -0.437469482421875, -0.4204559326171875, -0.4034423828125, -0.3864288330078125, -0.369415283203125, -0.3524017333984375, -0.33538818359375, -0.3183746337890625, -0.301361083984375, -0.2843475341796875, -0.267333984375, -0.2503204345703125, -0.233306884765625, -0.2162933349609375, -0.19927978515625, -0.1822662353515625, -0.165252685546875, -0.1482391357421875, -0.1312255859375, -0.1142120361328125, -0.097198486328125, -0.0801849365234375, -0.06317138671875, -0.0461578369140625, -0.029144287109375, -0.0121307373046875, 0.0048828125, 0.0218963623046875, 0.038909912109375, 0.0559234619140625, 0.07293701171875, 0.0899505615234375, 0.106964111328125, 0.1239776611328125, 0.1409912109375, 0.1580047607421875, 0.175018310546875, 0.1920318603515625, 0.20904541015625, 0.2260589599609375, 0.243072509765625, 0.2600860595703125, 0.277099609375, 0.2941131591796875, 0.311126708984375, 0.3281402587890625, 0.34515380859375, 0.3621673583984375, 0.379180908203125, 0.3961944580078125, 0.4132080078125, 0.4302215576171875, 0.447235107421875, 0.4642486572265625, 0.48126220703125, 0.4982757568359375, 0.515289306640625, 0.5323028564453125, 0.54931640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 13.0, 9.0, 10.0, 22.0, 14.0, 21.0, 22.0, 26.0, 31.0, 49.0, 38.0, 28.0, 38.0, 26.0, 31.0, 40.0, 41.0, 34.0, 1066.0, 37.0, 28.0, 35.0, 35.0, 39.0, 30.0, 30.0, 16.0, 28.0, 28.0, 19.0, 20.0, 13.0, 18.0, 19.0, 12.0, 7.0, 12.0, 4.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-2.63671875, -2.559906005859375, -2.48309326171875, -2.406280517578125, -2.3294677734375, -2.252655029296875, -2.17584228515625, -2.099029541015625, -2.022216796875, -1.945404052734375, -1.86859130859375, -1.791778564453125, -1.7149658203125, -1.638153076171875, -1.56134033203125, -1.484527587890625, -1.40771484375, -1.330902099609375, -1.25408935546875, -1.177276611328125, -1.1004638671875, -1.023651123046875, -0.94683837890625, -0.870025634765625, -0.793212890625, -0.716400146484375, -0.63958740234375, -0.562774658203125, -0.4859619140625, -0.409149169921875, -0.33233642578125, -0.255523681640625, -0.1787109375, -0.101898193359375, -0.02508544921875, 0.051727294921875, 0.1285400390625, 0.205352783203125, 0.28216552734375, 0.358978271484375, 0.435791015625, 0.512603759765625, 0.58941650390625, 0.666229248046875, 0.7430419921875, 0.819854736328125, 0.89666748046875, 0.973480224609375, 1.05029296875, 1.127105712890625, 1.20391845703125, 1.280731201171875, 1.3575439453125, 1.434356689453125, 1.51116943359375, 1.587982177734375, 1.664794921875, 1.741607666015625, 1.81842041015625, 1.895233154296875, 1.9720458984375, 2.048858642578125, 2.12567138671875, 2.202484130859375, 2.279296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 11.0, 8.0, 9.0, 17.0, 13.0, 31.0, 44.0, 76.0, 98.0, 124.0, 213.0, 272.0, 452.0, 661.0, 919.0, 1356.0, 2052.0, 3017.0, 4554.0, 6890.0, 10464.0, 15726.0, 23046.0, 34293.0, 49241.0, 70694.0, 97072.0, 125100.0, 1185706.0, 129451.0, 100631.0, 73958.0, 51585.0, 35796.0, 24239.0, 16347.0, 10729.0, 7321.0, 4902.0, 3224.0, 2173.0, 1490.0, 987.0, 672.0, 499.0, 305.0, 201.0, 166.0, 97.0, 71.0, 44.0, 35.0, 26.0, 17.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.297119140625, -0.2877044677734375, -0.278289794921875, -0.2688751220703125, -0.25946044921875, -0.2500457763671875, -0.240631103515625, -0.2312164306640625, -0.2218017578125, -0.2123870849609375, -0.202972412109375, -0.1935577392578125, -0.18414306640625, -0.1747283935546875, -0.165313720703125, -0.1558990478515625, -0.146484375, -0.1370697021484375, -0.127655029296875, -0.1182403564453125, -0.10882568359375, -0.0994110107421875, -0.089996337890625, -0.0805816650390625, -0.0711669921875, -0.0617523193359375, -0.052337646484375, -0.0429229736328125, -0.03350830078125, -0.0240936279296875, -0.014678955078125, -0.0052642822265625, 0.004150390625, 0.0135650634765625, 0.022979736328125, 0.0323944091796875, 0.04180908203125, 0.0512237548828125, 0.060638427734375, 0.0700531005859375, 0.0794677734375, 0.0888824462890625, 0.098297119140625, 0.1077117919921875, 0.11712646484375, 0.1265411376953125, 0.135955810546875, 0.1453704833984375, 0.15478515625, 0.1641998291015625, 0.173614501953125, 0.1830291748046875, 0.19244384765625, 0.2018585205078125, 0.211273193359375, 0.2206878662109375, 0.2301025390625, 0.2395172119140625, 0.248931884765625, 0.2583465576171875, 0.26776123046875, 0.2771759033203125, 0.286590576171875, 0.2960052490234375, 0.305419921875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 8.0, 6.0, 10.0, 15.0, 15.0, 27.0, 20.0, 30.0, 33.0, 29.0, 42.0, 60.0, 75.0, 89.0, 106.0, 67.0, 60.0, 45.0, 44.0, 34.0, 27.0, 21.0, 22.0, 14.0, 14.0, 8.0, 6.0, 8.0, 10.0, 2.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.019683837890625, -0.019071340560913086, -0.018458843231201172, -0.017846345901489258, -0.017233848571777344, -0.01662135124206543, -0.016008853912353516, -0.015396356582641602, -0.014783859252929688, -0.014171361923217773, -0.01355886459350586, -0.012946367263793945, -0.012333869934082031, -0.011721372604370117, -0.011108875274658203, -0.010496377944946289, -0.009883880615234375, -0.009271383285522461, -0.008658885955810547, -0.008046388626098633, -0.007433891296386719, -0.006821393966674805, -0.006208896636962891, -0.0055963993072509766, -0.0049839019775390625, -0.0043714046478271484, -0.0037589073181152344, -0.0031464099884033203, -0.0025339126586914062, -0.0019214153289794922, -0.0013089179992675781, -0.0006964206695556641, -8.392333984375e-05, 0.0005285739898681641, 0.0011410713195800781, 0.0017535686492919922, 0.0023660659790039062, 0.0029785633087158203, 0.0035910606384277344, 0.0042035579681396484, 0.0048160552978515625, 0.0054285526275634766, 0.006041049957275391, 0.006653547286987305, 0.007266044616699219, 0.007878541946411133, 0.008491039276123047, 0.009103536605834961, 0.009716033935546875, 0.010328531265258789, 0.010941028594970703, 0.011553525924682617, 0.012166023254394531, 0.012778520584106445, 0.01339101791381836, 0.014003515243530273, 0.014616012573242188, 0.015228509902954102, 0.015841007232666016, 0.01645350456237793, 0.017066001892089844, 0.017678499221801758, 0.018290996551513672, 0.018903493881225586, 0.0195159912109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 6.0, 17.0, 13.0, 12.0, 20.0, 29.0, 30.0, 41.0, 70.0, 109.0, 138.0, 274.0, 509.0, 2624.0, 718084.0, 323189.0, 2149.0, 477.0, 234.0, 155.0, 72.0, 64.0, 40.0, 45.0, 31.0, 20.0, 14.0, 11.0, 13.0, 8.0, 5.0, 12.0, 1.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36279296875, -0.35068511962890625, -0.3385772705078125, -0.32646942138671875, -0.314361572265625, -0.30225372314453125, -0.2901458740234375, -0.27803802490234375, -0.26593017578125, -0.25382232666015625, -0.2417144775390625, -0.22960662841796875, -0.217498779296875, -0.20539093017578125, -0.1932830810546875, -0.18117523193359375, -0.1690673828125, -0.15695953369140625, -0.1448516845703125, -0.13274383544921875, -0.120635986328125, -0.10852813720703125, -0.0964202880859375, -0.08431243896484375, -0.07220458984375, -0.06009674072265625, -0.0479888916015625, -0.03588104248046875, -0.023773193359375, -0.01166534423828125, 0.0004425048828125, 0.01255035400390625, 0.024658203125, 0.03676605224609375, 0.0488739013671875, 0.06098175048828125, 0.073089599609375, 0.08519744873046875, 0.0973052978515625, 0.10941314697265625, 0.12152099609375, 0.13362884521484375, 0.1457366943359375, 0.15784454345703125, 0.169952392578125, 0.18206024169921875, 0.1941680908203125, 0.20627593994140625, 0.2183837890625, 0.23049163818359375, 0.2425994873046875, 0.25470733642578125, 0.266815185546875, 0.27892303466796875, 0.2910308837890625, 0.30313873291015625, 0.31524658203125, 0.32735443115234375, 0.3394622802734375, 0.35157012939453125, 0.363677978515625, 0.37578582763671875, 0.3878936767578125, 0.40000152587890625, 0.412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 126.0, 803.0, 74.0, 3.0, 0.0, 1.0], "bins": [-0.6436715722084045, -0.6328349113464355, -0.6219981908798218, -0.6111615300178528, -0.6003248691558838, -0.5894882082939148, -0.578651487827301, -0.567814826965332, -0.556978166103363, -0.546141505241394, -0.5353047847747803, -0.5244681239128113, -0.5136314630508423, -0.5027948021888733, -0.4919581115245819, -0.4811214208602905, -0.47028475999832153, -0.45944806933403015, -0.44861140847206116, -0.4377747178077698, -0.4269380569458008, -0.4161013662815094, -0.4052647054195404, -0.394428014755249, -0.38359132409095764, -0.37275463342666626, -0.36191797256469727, -0.3510812819004059, -0.3402446210384369, -0.3294079303741455, -0.3185712695121765, -0.30773457884788513, -0.2968979477882385, -0.28606125712394714, -0.27522459626197815, -0.26438790559768677, -0.2535512447357178, -0.24271456897258759, -0.2318778932094574, -0.22104120254516602, -0.21020452678203583, -0.19936785101890564, -0.18853117525577545, -0.17769449949264526, -0.16685782372951508, -0.1560211479663849, -0.1451844573020935, -0.1343477964401245, -0.12351111322641373, -0.11267443746328354, -0.10183776170015335, -0.09100107848644257, -0.08016440272331238, -0.06932772696018219, -0.058491051197052, -0.047654375433921814, -0.036817699670791626, -0.025981023907661438, -0.0151443462818861, -0.0043076686561107635, 0.0065290071070194244, 0.017365682870149612, 0.0282023623585701, 0.03903903812170029, 0.049875713884830475]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 9.0, 9.0, 8.0, 14.0, 11.0, 18.0, 14.0, 26.0, 26.0, 23.0, 22.0, 31.0, 31.0, 40.0, 40.0, 36.0, 30.0, 36.0, 32.0, 41.0, 42.0, 28.0, 34.0, 38.0, 47.0, 31.0, 39.0, 34.0, 26.0, 28.0, 20.0, 18.0, 13.0, 14.0, 14.0, 15.0, 7.0, 12.0, 4.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0465584397315979, -0.045241862535476685, -0.04392528161406517, -0.042608700692653656, -0.04129212349653244, -0.039975546300411224, -0.03865896537899971, -0.037342384457588196, -0.03602580726146698, -0.034709230065345764, -0.03339264914393425, -0.032076068222522736, -0.03075949102640152, -0.029442911967635155, -0.02812633290886879, -0.026809753850102425, -0.02549317479133606, -0.024176595732569695, -0.02286001667380333, -0.021543437615036964, -0.0202268585562706, -0.018910279497504234, -0.01759370043873787, -0.016277121379971504, -0.01496054232120514, -0.013643963262438774, -0.012327384203672409, -0.011010805144906044, -0.009694226086139679, -0.008377647027373314, -0.007061067968606949, -0.005744488909840584, -0.004427909851074219, -0.0031113307923078537, -0.0017947517335414886, -0.0004781726747751236, 0.0008384063839912415, 0.0021549854427576065, 0.0034715645015239716, 0.004788143560290337, 0.006104722619056702, 0.007421301677823067, 0.008737880736589432, 0.010054459795355797, 0.011371038854122162, 0.012687617912888527, 0.014004196971654892, 0.015320776030421257, 0.016637355089187622, 0.017953934147953987, 0.019270513206720352, 0.020587092265486717, 0.021903671324253082, 0.023220250383019447, 0.024536829441785812, 0.025853408500552177, 0.027169987559318542, 0.028486566618084908, 0.029803145676851273, 0.031119724735617638, 0.032436303794384, 0.03375288099050522, 0.03506946191191673, 0.03638604283332825, 0.03770262002944946]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 3.0, 10.0, 13.0, 6.0, 12.0, 15.0, 22.0, 20.0, 23.0, 16.0, 23.0, 31.0, 31.0, 33.0, 39.0, 36.0, 45.0, 41.0, 39.0, 41.0, 45.0, 47.0, 33.0, 42.0, 31.0, 39.0, 39.0, 28.0, 21.0, 27.0, 22.0, 15.0, 21.0, 15.0, 15.0, 16.0, 10.0, 6.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.7542724609375, -3.631591796875, -3.5089111328125, -3.38623046875, -3.2635498046875, -3.140869140625, -3.0181884765625, -2.8955078125, -2.7728271484375, -2.650146484375, -2.5274658203125, -2.40478515625, -2.2821044921875, -2.159423828125, -2.0367431640625, -1.9140625, -1.7913818359375, -1.668701171875, -1.5460205078125, -1.42333984375, -1.3006591796875, -1.177978515625, -1.0552978515625, -0.9326171875, -0.8099365234375, -0.687255859375, -0.5645751953125, -0.44189453125, -0.3192138671875, -0.196533203125, -0.0738525390625, 0.048828125, 0.1715087890625, 0.294189453125, 0.4168701171875, 0.53955078125, 0.6622314453125, 0.784912109375, 0.9075927734375, 1.0302734375, 1.1529541015625, 1.275634765625, 1.3983154296875, 1.52099609375, 1.6436767578125, 1.766357421875, 1.8890380859375, 2.01171875, 2.1343994140625, 2.257080078125, 2.3797607421875, 2.50244140625, 2.6251220703125, 2.747802734375, 2.8704833984375, 2.9931640625, 3.1158447265625, 3.238525390625, 3.3612060546875, 3.48388671875, 3.6065673828125, 3.729248046875, 3.8519287109375, 3.974609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 3.0, 13.0, 7.0, 18.0, 26.0, 43.0, 51.0, 64.0, 88.0, 152.0, 230.0, 351.0, 555.0, 929.0, 1555.0, 2729.0, 4903.0, 8831.0, 17458.0, 35152.0, 79258.0, 198160.0, 397357.0, 166742.0, 68757.0, 31191.0, 15369.0, 7940.0, 4428.0, 2339.0, 1402.0, 877.0, 552.0, 340.0, 221.0, 152.0, 104.0, 64.0, 48.0, 37.0, 22.0, 12.0, 11.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.722503662109375, -3.59149169921875, -3.460479736328125, -3.3294677734375, -3.198455810546875, -3.06744384765625, -2.936431884765625, -2.805419921875, -2.674407958984375, -2.54339599609375, -2.412384033203125, -2.2813720703125, -2.150360107421875, -2.01934814453125, -1.888336181640625, -1.75732421875, -1.626312255859375, -1.49530029296875, -1.364288330078125, -1.2332763671875, -1.102264404296875, -0.97125244140625, -0.840240478515625, -0.709228515625, -0.578216552734375, -0.44720458984375, -0.316192626953125, -0.1851806640625, -0.054168701171875, 0.07684326171875, 0.207855224609375, 0.3388671875, 0.469879150390625, 0.60089111328125, 0.731903076171875, 0.8629150390625, 0.993927001953125, 1.12493896484375, 1.255950927734375, 1.386962890625, 1.517974853515625, 1.64898681640625, 1.779998779296875, 1.9110107421875, 2.042022705078125, 2.17303466796875, 2.304046630859375, 2.43505859375, 2.566070556640625, 2.69708251953125, 2.828094482421875, 2.9591064453125, 3.090118408203125, 3.22113037109375, 3.352142333984375, 3.483154296875, 3.614166259765625, 3.74517822265625, 3.876190185546875, 4.0072021484375, 4.138214111328125, 4.26922607421875, 4.400238037109375, 4.53125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 8.0, 16.0, 17.0, 14.0, 21.0, 16.0, 22.0, 22.0, 33.0, 38.0, 46.0, 34.0, 28.0, 40.0, 57.0, 93.0, 220.0, 1419.0, 265.0, 122.0, 82.0, 45.0, 52.0, 44.0, 44.0, 34.0, 19.0, 31.0, 21.0, 23.0, 22.0, 15.0, 12.0, 10.0, 6.0, 10.0, 5.0, 4.0, 4.0, 7.0, 7.0, 1.0, 3.0, 2.0, 2.0], "bins": [-14.515625, -14.1195068359375, -13.723388671875, -13.3272705078125, -12.93115234375, -12.5350341796875, -12.138916015625, -11.7427978515625, -11.3466796875, -10.9505615234375, -10.554443359375, -10.1583251953125, -9.76220703125, -9.3660888671875, -8.969970703125, -8.5738525390625, -8.177734375, -7.7816162109375, -7.385498046875, -6.9893798828125, -6.59326171875, -6.1971435546875, -5.801025390625, -5.4049072265625, -5.0087890625, -4.6126708984375, -4.216552734375, -3.8204345703125, -3.42431640625, -3.0281982421875, -2.632080078125, -2.2359619140625, -1.83984375, -1.4437255859375, -1.047607421875, -0.6514892578125, -0.25537109375, 0.1407470703125, 0.536865234375, 0.9329833984375, 1.3291015625, 1.7252197265625, 2.121337890625, 2.5174560546875, 2.91357421875, 3.3096923828125, 3.705810546875, 4.1019287109375, 4.498046875, 4.8941650390625, 5.290283203125, 5.6864013671875, 6.08251953125, 6.4786376953125, 6.874755859375, 7.2708740234375, 7.6669921875, 8.0631103515625, 8.459228515625, 8.8553466796875, 9.25146484375, 9.6475830078125, 10.043701171875, 10.4398193359375, 10.8359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 9.0, 14.0, 18.0, 22.0, 50.0, 72.0, 76.0, 159.0, 327.0, 767.0, 7218.0, 3093836.0, 41057.0, 1172.0, 377.0, 221.0, 119.0, 67.0, 54.0, 30.0, 15.0, 11.0, 3.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.875, -53.08544921875, -51.2958984375, -49.50634765625, -47.716796875, -45.92724609375, -44.1376953125, -42.34814453125, -40.55859375, -38.76904296875, -36.9794921875, -35.18994140625, -33.400390625, -31.61083984375, -29.8212890625, -28.03173828125, -26.2421875, -24.45263671875, -22.6630859375, -20.87353515625, -19.083984375, -17.29443359375, -15.5048828125, -13.71533203125, -11.92578125, -10.13623046875, -8.3466796875, -6.55712890625, -4.767578125, -2.97802734375, -1.1884765625, 0.60107421875, 2.390625, 4.18017578125, 5.9697265625, 7.75927734375, 9.548828125, 11.33837890625, 13.1279296875, 14.91748046875, 16.70703125, 18.49658203125, 20.2861328125, 22.07568359375, 23.865234375, 25.65478515625, 27.4443359375, 29.23388671875, 31.0234375, 32.81298828125, 34.6025390625, 36.39208984375, 38.181640625, 39.97119140625, 41.7607421875, 43.55029296875, 45.33984375, 47.12939453125, 48.9189453125, 50.70849609375, 52.498046875, 54.28759765625, 56.0771484375, 57.86669921875, 59.65625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 134.0, 690.0, 185.0, 8.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-276.05120849609375, -271.1698303222656, -266.2884521484375, -261.4070739746094, -256.52569580078125, -251.64431762695312, -246.762939453125, -241.88156127929688, -237.00018310546875, -232.11880493164062, -227.2374267578125, -222.35604858398438, -217.47467041015625, -212.59329223632812, -207.7119140625, -202.83053588867188, -197.9491424560547, -193.06776428222656, -188.18638610839844, -183.3050079345703, -178.4236297607422, -173.54225158691406, -168.66087341308594, -163.77947998046875, -158.89810180664062, -154.0167236328125, -149.13534545898438, -144.25396728515625, -139.37258911132812, -134.4912109375, -129.60983276367188, -124.72844696044922, -119.84708404541016, -114.96570587158203, -110.0843276977539, -105.20294952392578, -100.32156372070312, -95.440185546875, -90.55880737304688, -85.67742919921875, -80.79605102539062, -75.9146728515625, -71.03329467773438, -66.15191650390625, -61.27053451538086, -56.389156341552734, -51.507774353027344, -46.62639617919922, -41.745018005371094, -36.86363983154297, -31.98225975036621, -27.100879669189453, -22.219501495361328, -17.338123321533203, -12.456743240356445, -7.5753631591796875, -2.6939849853515625, 2.187394142150879, 7.06877326965332, 11.950152397155762, 16.831531524658203, 21.712909698486328, 26.594289779663086, 31.475669860839844, 36.35704803466797]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 3.0, 6.0, 15.0, 13.0, 14.0, 12.0, 17.0, 22.0, 31.0, 23.0, 27.0, 36.0, 32.0, 33.0, 49.0, 31.0, 36.0, 36.0, 39.0, 63.0, 55.0, 48.0, 38.0, 44.0, 44.0, 30.0, 24.0, 34.0, 14.0, 18.0, 20.0, 16.0, 24.0, 10.0, 9.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.00629425048828, -32.72724533081055, -31.448196411132812, -30.169147491455078, -28.890098571777344, -27.61104965209961, -26.332000732421875, -25.05295181274414, -23.773902893066406, -22.494853973388672, -21.215805053710938, -19.936756134033203, -18.65770721435547, -17.378658294677734, -16.099609375, -14.820560455322266, -13.541511535644531, -12.262462615966797, -10.983413696289062, -9.704364776611328, -8.425315856933594, -7.146266937255859, -5.867218017578125, -4.588169097900391, -3.3091201782226562, -2.030071258544922, -0.7510223388671875, 0.5280265808105469, 1.8070755004882812, 3.0861244201660156, 4.36517333984375, 5.644222259521484, 6.923271179199219, 8.202320098876953, 9.481369018554688, 10.760417938232422, 12.039466857910156, 13.31851577758789, 14.597564697265625, 15.87661361694336, 17.155662536621094, 18.434711456298828, 19.713760375976562, 20.992809295654297, 22.27185821533203, 23.550907135009766, 24.8299560546875, 26.109004974365234, 27.38805389404297, 28.667102813720703, 29.946151733398438, 31.225200653076172, 32.504249572753906, 33.78329849243164, 35.062347412109375, 36.34139633178711, 37.620445251464844, 38.89949417114258, 40.17854309082031, 41.45759201049805, 42.73664093017578, 44.015689849853516, 45.29473876953125, 46.573787689208984, 47.85283660888672]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 1.0, 5.0, 6.0, 7.0, 10.0, 10.0, 14.0, 18.0, 16.0, 25.0, 18.0, 15.0, 29.0, 22.0, 27.0, 41.0, 32.0, 34.0, 46.0, 47.0, 42.0, 34.0, 41.0, 32.0, 43.0, 40.0, 43.0, 34.0, 29.0, 28.0, 28.0, 25.0, 24.0, 21.0, 18.0, 13.0, 18.0, 13.0, 12.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.08984375, -3.96075439453125, -3.8316650390625, -3.70257568359375, -3.573486328125, -3.44439697265625, -3.3153076171875, -3.18621826171875, -3.05712890625, -2.92803955078125, -2.7989501953125, -2.66986083984375, -2.540771484375, -2.41168212890625, -2.2825927734375, -2.15350341796875, -2.0244140625, -1.89532470703125, -1.7662353515625, -1.63714599609375, -1.508056640625, -1.37896728515625, -1.2498779296875, -1.12078857421875, -0.99169921875, -0.86260986328125, -0.7335205078125, -0.60443115234375, -0.475341796875, -0.34625244140625, -0.2171630859375, -0.08807373046875, 0.041015625, 0.17010498046875, 0.2991943359375, 0.42828369140625, 0.557373046875, 0.68646240234375, 0.8155517578125, 0.94464111328125, 1.07373046875, 1.20281982421875, 1.3319091796875, 1.46099853515625, 1.590087890625, 1.71917724609375, 1.8482666015625, 1.97735595703125, 2.1064453125, 2.23553466796875, 2.3646240234375, 2.49371337890625, 2.622802734375, 2.75189208984375, 2.8809814453125, 3.01007080078125, 3.13916015625, 3.26824951171875, 3.3973388671875, 3.52642822265625, 3.655517578125, 3.78460693359375, 3.9136962890625, 4.04278564453125, 4.171875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 5.0, 1.0, 11.0, 8.0, 11.0, 10.0, 16.0, 12.0, 18.0, 28.0, 28.0, 35.0, 61.0, 121.0, 201.0, 410.0, 1089.0, 3955.0, 21248.0, 182478.0, 2203575.0, 1635789.0, 124471.0, 15813.0, 3102.0, 948.0, 325.0, 169.0, 98.0, 66.0, 40.0, 33.0, 28.0, 17.0, 17.0, 18.0, 1.0, 8.0, 6.0, 9.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.5, -14.072509765625, -13.64501953125, -13.217529296875, -12.7900390625, -12.362548828125, -11.93505859375, -11.507568359375, -11.080078125, -10.652587890625, -10.22509765625, -9.797607421875, -9.3701171875, -8.942626953125, -8.51513671875, -8.087646484375, -7.66015625, -7.232666015625, -6.80517578125, -6.377685546875, -5.9501953125, -5.522705078125, -5.09521484375, -4.667724609375, -4.240234375, -3.812744140625, -3.38525390625, -2.957763671875, -2.5302734375, -2.102783203125, -1.67529296875, -1.247802734375, -0.8203125, -0.392822265625, 0.03466796875, 0.462158203125, 0.8896484375, 1.317138671875, 1.74462890625, 2.172119140625, 2.599609375, 3.027099609375, 3.45458984375, 3.882080078125, 4.3095703125, 4.737060546875, 5.16455078125, 5.592041015625, 6.01953125, 6.447021484375, 6.87451171875, 7.302001953125, 7.7294921875, 8.156982421875, 8.58447265625, 9.011962890625, 9.439453125, 9.866943359375, 10.29443359375, 10.721923828125, 11.1494140625, 11.576904296875, 12.00439453125, 12.431884765625, 12.859375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 10.0, 11.0, 9.0, 7.0, 23.0, 22.0, 37.0, 30.0, 45.0, 53.0, 77.0, 86.0, 103.0, 112.0, 165.0, 208.0, 228.0, 303.0, 353.0, 363.0, 334.0, 283.0, 225.0, 183.0, 168.0, 118.0, 104.0, 94.0, 57.0, 47.0, 38.0, 41.0, 30.0, 22.0, 20.0, 9.0, 14.0, 6.0, 7.0, 5.0, 5.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-8.5390625, -8.2979736328125, -8.056884765625, -7.8157958984375, -7.57470703125, -7.3336181640625, -7.092529296875, -6.8514404296875, -6.6103515625, -6.3692626953125, -6.128173828125, -5.8870849609375, -5.64599609375, -5.4049072265625, -5.163818359375, -4.9227294921875, -4.681640625, -4.4405517578125, -4.199462890625, -3.9583740234375, -3.71728515625, -3.4761962890625, -3.235107421875, -2.9940185546875, -2.7529296875, -2.5118408203125, -2.270751953125, -2.0296630859375, -1.78857421875, -1.5474853515625, -1.306396484375, -1.0653076171875, -0.82421875, -0.5831298828125, -0.342041015625, -0.1009521484375, 0.14013671875, 0.3812255859375, 0.622314453125, 0.8634033203125, 1.1044921875, 1.3455810546875, 1.586669921875, 1.8277587890625, 2.06884765625, 2.3099365234375, 2.551025390625, 2.7921142578125, 3.033203125, 3.2742919921875, 3.515380859375, 3.7564697265625, 3.99755859375, 4.2386474609375, 4.479736328125, 4.7208251953125, 4.9619140625, 5.2030029296875, 5.444091796875, 5.6851806640625, 5.92626953125, 6.1673583984375, 6.408447265625, 6.6495361328125, 6.890625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 13.0, 10.0, 10.0, 14.0, 21.0, 31.0, 35.0, 43.0, 54.0, 65.0, 91.0, 117.0, 148.0, 220.0, 274.0, 543.0, 1699.0, 12236.0, 204699.0, 3394011.0, 549721.0, 25408.0, 2810.0, 721.0, 331.0, 197.0, 162.0, 131.0, 100.0, 91.0, 54.0, 43.0, 44.0, 28.0, 21.0, 22.0, 6.0, 12.0, 13.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.701171875, -20.88671875, -20.072265625, -19.2578125, -18.443359375, -17.62890625, -16.814453125, -16.0, -15.185546875, -14.37109375, -13.556640625, -12.7421875, -11.927734375, -11.11328125, -10.298828125, -9.484375, -8.669921875, -7.85546875, -7.041015625, -6.2265625, -5.412109375, -4.59765625, -3.783203125, -2.96875, -2.154296875, -1.33984375, -0.525390625, 0.2890625, 1.103515625, 1.91796875, 2.732421875, 3.546875, 4.361328125, 5.17578125, 5.990234375, 6.8046875, 7.619140625, 8.43359375, 9.248046875, 10.0625, 10.876953125, 11.69140625, 12.505859375, 13.3203125, 14.134765625, 14.94921875, 15.763671875, 16.578125, 17.392578125, 18.20703125, 19.021484375, 19.8359375, 20.650390625, 21.46484375, 22.279296875, 23.09375, 23.908203125, 24.72265625, 25.537109375, 26.3515625, 27.166015625, 27.98046875, 28.794921875, 29.609375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 21.0, 92.0, 185.0, 319.0, 258.0, 108.0, 27.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.4193115234375, -144.7062530517578, -139.99319458007812, -135.2801513671875, -130.5670928955078, -125.85403442382812, -121.14098358154297, -116.42793273925781, -111.71487426757812, -107.00181579589844, -102.28876495361328, -97.57571411132812, -92.86265563964844, -88.14959716796875, -83.4365463256836, -78.72349548339844, -74.01043701171875, -69.29737854003906, -64.5843276977539, -59.871273040771484, -55.15821838378906, -50.44516372680664, -45.73210906982422, -41.0190544128418, -36.305999755859375, -31.592945098876953, -26.87989044189453, -22.16683578491211, -17.453781127929688, -12.740726470947266, -8.027671813964844, -3.314617156982422, 1.3984222412109375, 6.111476898193359, 10.824531555175781, 15.537586212158203, 20.250640869140625, 24.963695526123047, 29.67675018310547, 34.38980484008789, 39.10285949707031, 43.815914154052734, 48.528968811035156, 53.24202346801758, 57.955078125, 62.66813278198242, 67.38118743896484, 72.09423828125, 76.80729675292969, 81.52035522460938, 86.23340606689453, 90.94645690917969, 95.65951538085938, 100.37257385253906, 105.08562469482422, 109.79867553710938, 114.51173400878906, 119.22479248046875, 123.9378433227539, 128.65089416503906, 133.36395263671875, 138.07701110839844, 142.79006958007812, 147.50311279296875, 152.21617126464844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 8.0, 8.0, 7.0, 19.0, 23.0, 24.0, 15.0, 18.0, 28.0, 23.0, 29.0, 35.0, 35.0, 37.0, 43.0, 57.0, 47.0, 42.0, 40.0, 38.0, 44.0, 38.0, 51.0, 38.0, 26.0, 22.0, 37.0, 23.0, 25.0, 8.0, 18.0, 12.0, 14.0, 11.0, 8.0, 15.0, 8.0, 1.0, 3.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.82273864746094, -31.79857635498047, -30.774415969848633, -29.750253677368164, -28.726093292236328, -27.70193099975586, -26.67776870727539, -25.653606414794922, -24.629446029663086, -23.605283737182617, -22.58112335205078, -21.556961059570312, -20.532798767089844, -19.508638381958008, -18.48447608947754, -17.460315704345703, -16.436153411865234, -15.411992073059082, -14.38783073425293, -13.363668441772461, -12.339507102966309, -11.315345764160156, -10.291183471679688, -9.267022132873535, -8.242860794067383, -7.2186994552612305, -6.19453763961792, -5.170375823974609, -4.146214485168457, -3.1220531463623047, -2.097891330718994, -1.0737295150756836, -0.04956817626953125, 0.9745934009552002, 1.9987549781799316, 3.022916555404663, 4.0470781326293945, 5.071239471435547, 6.095401287078857, 7.119563102722168, 8.14372444152832, 9.167885780334473, 10.192047119140625, 11.216209411621094, 12.240370750427246, 13.264532089233398, 14.288694381713867, 15.31285572052002, 16.337017059326172, 17.36117935180664, 18.385339736938477, 19.409502029418945, 20.43366241455078, 21.45782470703125, 22.48198699951172, 23.506149291992188, 24.530309677124023, 25.554471969604492, 26.578632354736328, 27.602794647216797, 28.626956939697266, 29.6511173248291, 30.67527961730957, 31.699440002441406, 32.723602294921875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 11.0, 11.0, 15.0, 15.0, 19.0, 21.0, 29.0, 28.0, 32.0, 33.0, 20.0, 44.0, 43.0, 40.0, 41.0, 48.0, 45.0, 48.0, 33.0, 47.0, 45.0, 41.0, 31.0, 28.0, 35.0, 28.0, 29.0, 15.0, 13.0, 15.0, 11.0, 11.0, 10.0, 9.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.58203125, -4.44378662109375, -4.3055419921875, -4.16729736328125, -4.029052734375, -3.89080810546875, -3.7525634765625, -3.61431884765625, -3.47607421875, -3.33782958984375, -3.1995849609375, -3.06134033203125, -2.923095703125, -2.78485107421875, -2.6466064453125, -2.50836181640625, -2.3701171875, -2.23187255859375, -2.0936279296875, -1.95538330078125, -1.817138671875, -1.67889404296875, -1.5406494140625, -1.40240478515625, -1.26416015625, -1.12591552734375, -0.9876708984375, -0.84942626953125, -0.711181640625, -0.57293701171875, -0.4346923828125, -0.29644775390625, -0.158203125, -0.01995849609375, 0.1182861328125, 0.25653076171875, 0.394775390625, 0.53302001953125, 0.6712646484375, 0.80950927734375, 0.94775390625, 1.08599853515625, 1.2242431640625, 1.36248779296875, 1.500732421875, 1.63897705078125, 1.7772216796875, 1.91546630859375, 2.0537109375, 2.19195556640625, 2.3302001953125, 2.46844482421875, 2.606689453125, 2.74493408203125, 2.8831787109375, 3.02142333984375, 3.15966796875, 3.29791259765625, 3.4361572265625, 3.57440185546875, 3.712646484375, 3.85089111328125, 3.9891357421875, 4.12738037109375, 4.265625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 13.0, 12.0, 24.0, 38.0, 58.0, 117.0, 160.0, 222.0, 369.0, 537.0, 824.0, 1231.0, 1864.0, 2795.0, 4320.0, 6894.0, 10378.0, 16156.0, 24650.0, 37337.0, 56019.0, 81351.0, 112633.0, 142878.0, 148704.0, 122610.0, 90323.0, 62882.0, 42566.0, 27925.0, 18351.0, 12062.0, 7819.0, 5075.0, 3266.0, 2100.0, 1347.0, 946.0, 584.0, 363.0, 255.0, 187.0, 108.0, 67.0, 42.0, 31.0, 27.0, 18.0, 6.0, 5.0, 9.0, 6.0], "bins": [-0.70556640625, -0.6860504150390625, -0.666534423828125, -0.6470184326171875, -0.62750244140625, -0.6079864501953125, -0.588470458984375, -0.5689544677734375, -0.5494384765625, -0.5299224853515625, -0.510406494140625, -0.4908905029296875, -0.47137451171875, -0.4518585205078125, -0.432342529296875, -0.4128265380859375, -0.393310546875, -0.3737945556640625, -0.354278564453125, -0.3347625732421875, -0.31524658203125, -0.2957305908203125, -0.276214599609375, -0.2566986083984375, -0.2371826171875, -0.2176666259765625, -0.198150634765625, -0.1786346435546875, -0.15911865234375, -0.1396026611328125, -0.120086669921875, -0.1005706787109375, -0.0810546875, -0.0615386962890625, -0.042022705078125, -0.0225067138671875, -0.00299072265625, 0.0165252685546875, 0.036041259765625, 0.0555572509765625, 0.0750732421875, 0.0945892333984375, 0.114105224609375, 0.1336212158203125, 0.15313720703125, 0.1726531982421875, 0.192169189453125, 0.2116851806640625, 0.231201171875, 0.2507171630859375, 0.270233154296875, 0.2897491455078125, 0.30926513671875, 0.3287811279296875, 0.348297119140625, 0.3678131103515625, 0.3873291015625, 0.4068450927734375, 0.426361083984375, 0.4458770751953125, 0.46539306640625, 0.4849090576171875, 0.504425048828125, 0.5239410400390625, 0.54345703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 9.0, 8.0, 6.0, 4.0, 11.0, 12.0, 13.0, 16.0, 21.0, 35.0, 27.0, 34.0, 34.0, 36.0, 33.0, 30.0, 39.0, 49.0, 49.0, 1059.0, 54.0, 38.0, 41.0, 42.0, 34.0, 31.0, 35.0, 39.0, 21.0, 24.0, 21.0, 25.0, 14.0, 17.0, 14.0, 13.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.75, -2.654754638671875, -2.55950927734375, -2.464263916015625, -2.3690185546875, -2.273773193359375, -2.17852783203125, -2.083282470703125, -1.988037109375, -1.892791748046875, -1.79754638671875, -1.702301025390625, -1.6070556640625, -1.511810302734375, -1.41656494140625, -1.321319580078125, -1.22607421875, -1.130828857421875, -1.03558349609375, -0.940338134765625, -0.8450927734375, -0.749847412109375, -0.65460205078125, -0.559356689453125, -0.464111328125, -0.368865966796875, -0.27362060546875, -0.178375244140625, -0.0831298828125, 0.012115478515625, 0.10736083984375, 0.202606201171875, 0.2978515625, 0.393096923828125, 0.48834228515625, 0.583587646484375, 0.6788330078125, 0.774078369140625, 0.86932373046875, 0.964569091796875, 1.059814453125, 1.155059814453125, 1.25030517578125, 1.345550537109375, 1.4407958984375, 1.536041259765625, 1.63128662109375, 1.726531982421875, 1.82177734375, 1.917022705078125, 2.01226806640625, 2.107513427734375, 2.2027587890625, 2.298004150390625, 2.39324951171875, 2.488494873046875, 2.583740234375, 2.678985595703125, 2.77423095703125, 2.869476318359375, 2.9647216796875, 3.059967041015625, 3.15521240234375, 3.250457763671875, 3.345703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 9.0, 7.0, 14.0, 20.0, 40.0, 49.0, 80.0, 121.0, 174.0, 274.0, 436.0, 631.0, 996.0, 1580.0, 2481.0, 3874.0, 6158.0, 10017.0, 15832.0, 25772.0, 40850.0, 63969.0, 96219.0, 134214.0, 1202370.0, 157394.0, 115489.0, 79198.0, 51706.0, 32525.0, 20461.0, 12698.0, 7924.0, 5011.0, 3074.0, 1949.0, 1253.0, 774.0, 486.0, 334.0, 224.0, 138.0, 104.0, 82.0, 45.0, 28.0, 17.0, 14.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.374755859375, -0.36295318603515625, -0.3511505126953125, -0.33934783935546875, -0.327545166015625, -0.31574249267578125, -0.3039398193359375, -0.29213714599609375, -0.28033447265625, -0.26853179931640625, -0.2567291259765625, -0.24492645263671875, -0.233123779296875, -0.22132110595703125, -0.2095184326171875, -0.19771575927734375, -0.1859130859375, -0.17411041259765625, -0.1623077392578125, -0.15050506591796875, -0.138702392578125, -0.12689971923828125, -0.1150970458984375, -0.10329437255859375, -0.09149169921875, -0.07968902587890625, -0.0678863525390625, -0.05608367919921875, -0.044281005859375, -0.03247833251953125, -0.0206756591796875, -0.00887298583984375, 0.0029296875, 0.01473236083984375, 0.0265350341796875, 0.03833770751953125, 0.050140380859375, 0.06194305419921875, 0.0737457275390625, 0.08554840087890625, 0.09735107421875, 0.10915374755859375, 0.1209564208984375, 0.13275909423828125, 0.144561767578125, 0.15636444091796875, 0.1681671142578125, 0.17996978759765625, 0.1917724609375, 0.20357513427734375, 0.2153778076171875, 0.22718048095703125, 0.238983154296875, 0.25078582763671875, 0.2625885009765625, 0.27439117431640625, 0.28619384765625, 0.29799652099609375, 0.3097991943359375, 0.32160186767578125, 0.333404541015625, 0.34520721435546875, 0.3570098876953125, 0.36881256103515625, 0.380615234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 4.0, 7.0, 8.0, 4.0, 9.0, 8.0, 8.0, 8.0, 11.0, 12.0, 11.0, 12.0, 25.0, 27.0, 31.0, 33.0, 43.0, 70.0, 88.0, 107.0, 93.0, 73.0, 61.0, 49.0, 36.0, 26.0, 20.0, 13.0, 12.0, 8.0, 11.0, 14.0, 8.0, 9.0, 10.0, 5.0, 3.0, 4.0, 1.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01462554931640625, -0.014130234718322754, -0.013634920120239258, -0.013139605522155762, -0.012644290924072266, -0.01214897632598877, -0.011653661727905273, -0.011158347129821777, -0.010663032531738281, -0.010167717933654785, -0.009672403335571289, -0.009177088737487793, -0.008681774139404297, -0.0081864595413208, -0.007691144943237305, -0.007195830345153809, -0.0067005157470703125, -0.006205201148986816, -0.00570988655090332, -0.005214571952819824, -0.004719257354736328, -0.004223942756652832, -0.003728628158569336, -0.00323331356048584, -0.0027379989624023438, -0.0022426843643188477, -0.0017473697662353516, -0.0012520551681518555, -0.0007567405700683594, -0.0002614259719848633, 0.0002338886260986328, 0.0007292032241821289, 0.001224517822265625, 0.001719832420349121, 0.002215147018432617, 0.0027104616165161133, 0.0032057762145996094, 0.0037010908126831055, 0.0041964054107666016, 0.004691720008850098, 0.005187034606933594, 0.00568234920501709, 0.006177663803100586, 0.006672978401184082, 0.007168292999267578, 0.007663607597351074, 0.00815892219543457, 0.008654236793518066, 0.009149551391601562, 0.009644865989685059, 0.010140180587768555, 0.01063549518585205, 0.011130809783935547, 0.011626124382019043, 0.012121438980102539, 0.012616753578186035, 0.013112068176269531, 0.013607382774353027, 0.014102697372436523, 0.01459801197052002, 0.015093326568603516, 0.015588641166687012, 0.016083955764770508, 0.016579270362854004, 0.0170745849609375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 4.0, 3.0, 4.0, 9.0, 7.0, 11.0, 14.0, 18.0, 14.0, 13.0, 23.0, 25.0, 41.0, 69.0, 107.0, 191.0, 308.0, 721.0, 5286.0, 668918.0, 366959.0, 4338.0, 641.0, 289.0, 166.0, 90.0, 66.0, 42.0, 25.0, 26.0, 23.0, 15.0, 9.0, 17.0, 8.0, 8.0, 9.0, 5.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3037109375, -0.2944984436035156, -0.28528594970703125, -0.2760734558105469, -0.2668609619140625, -0.2576484680175781, -0.24843597412109375, -0.23922348022460938, -0.230010986328125, -0.22079849243164062, -0.21158599853515625, -0.20237350463867188, -0.1931610107421875, -0.18394851684570312, -0.17473602294921875, -0.16552352905273438, -0.15631103515625, -0.14709854125976562, -0.13788604736328125, -0.12867355346679688, -0.1194610595703125, -0.11024856567382812, -0.10103607177734375, -0.09182357788085938, -0.082611083984375, -0.07339859008789062, -0.06418609619140625, -0.054973602294921875, -0.0457611083984375, -0.036548614501953125, -0.02733612060546875, -0.018123626708984375, -0.0089111328125, 0.000301361083984375, 0.00951385498046875, 0.018726348876953125, 0.0279388427734375, 0.037151336669921875, 0.04636383056640625, 0.055576324462890625, 0.064788818359375, 0.07400131225585938, 0.08321380615234375, 0.09242630004882812, 0.1016387939453125, 0.11085128784179688, 0.12006378173828125, 0.12927627563476562, 0.13848876953125, 0.14770126342773438, 0.15691375732421875, 0.16612625122070312, 0.1753387451171875, 0.18455123901367188, 0.19376373291015625, 0.20297622680664062, 0.212188720703125, 0.22140121459960938, 0.23061370849609375, 0.23982620239257812, 0.2490386962890625, 0.2582511901855469, 0.26746368408203125, 0.2766761779785156, 0.285888671875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 155.0, 797.0, 52.0, 3.0, 1.0], "bins": [-0.6201372742652893, -0.6098561882972717, -0.5995751023292542, -0.5892940163612366, -0.5790128707885742, -0.5687317848205566, -0.5584506988525391, -0.5481696128845215, -0.5378885269165039, -0.5276074409484863, -0.5173263549804688, -0.5070452690124512, -0.4967641532421112, -0.48648303747177124, -0.47620195150375366, -0.4659208655357361, -0.4556397497653961, -0.44535866379737854, -0.4350775480270386, -0.424796462059021, -0.4145153760910034, -0.40423429012298584, -0.3939531743526459, -0.3836720883846283, -0.37339097261428833, -0.36310988664627075, -0.3528287708759308, -0.3425476849079132, -0.33226659893989563, -0.32198548316955566, -0.3117043972015381, -0.3014233112335205, -0.29114219546318054, -0.28086110949516296, -0.270579993724823, -0.2602989077568054, -0.25001782178878784, -0.23973672091960907, -0.2294556200504303, -0.21917453408241272, -0.20889343321323395, -0.19861233234405518, -0.1883312463760376, -0.17805014550685883, -0.16776904463768005, -0.15748795866966248, -0.1472068578004837, -0.13692575693130493, -0.12664467096328735, -0.11636357754468918, -0.106082484126091, -0.09580138325691223, -0.08552028983831406, -0.07523919641971588, -0.06495809555053711, -0.054677002131938934, -0.04439591243863106, -0.034114815294742584, -0.02383372187614441, -0.013552626594901085, -0.0032715313136577606, 0.007009562104940414, 0.017290659248828888, 0.02757175639271736, 0.037852849811315536]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 6.0, 6.0, 8.0, 14.0, 19.0, 18.0, 18.0, 26.0, 34.0, 41.0, 31.0, 36.0, 37.0, 45.0, 49.0, 36.0, 51.0, 48.0, 38.0, 46.0, 41.0, 40.0, 42.0, 38.0, 39.0, 29.0, 27.0, 29.0, 19.0, 17.0, 6.0, 11.0, 11.0, 10.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03899747133255005, -0.037849538028240204, -0.03670160844922066, -0.03555367887020111, -0.034405745565891266, -0.03325781226158142, -0.032109882682561874, -0.03096195124089718, -0.029814019799232483, -0.028666088357567787, -0.02751815691590309, -0.026370225474238396, -0.0252222940325737, -0.024074362590909004, -0.02292643114924431, -0.021778499707579613, -0.020630568265914917, -0.01948263682425022, -0.018334705382585526, -0.01718677394092083, -0.016038842499256134, -0.014890911057591438, -0.013742979615926743, -0.012595048174262047, -0.011447116732597351, -0.010299185290932655, -0.00915125384926796, -0.008003322407603264, -0.006855390965938568, -0.005707459524273872, -0.004559528082609177, -0.003411596640944481, -0.002263665199279785, -0.0011157337576150894, 3.219768404960632e-05, 0.001180129125714302, 0.002328060567378998, 0.0034759920090436935, 0.004623923450708389, 0.005771854892373085, 0.006919786334037781, 0.008067717775702477, 0.009215649217367172, 0.010363580659031868, 0.011511512100696564, 0.01265944354236126, 0.013807374984025955, 0.014955306425690651, 0.016103237867355347, 0.017251169309020042, 0.018399100750684738, 0.019547032192349434, 0.02069496363401413, 0.021842895075678825, 0.02299082651734352, 0.024138757959008217, 0.025286689400672913, 0.02643462084233761, 0.027582552284002304, 0.028730483725667, 0.029878415167331696, 0.03102634660899639, 0.03217427805066109, 0.033322207629680634, 0.03447014093399048]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 2.0, 4.0, 6.0, 8.0, 7.0, 11.0, 11.0, 15.0, 15.0, 19.0, 21.0, 29.0, 28.0, 32.0, 33.0, 20.0, 44.0, 44.0, 39.0, 41.0, 47.0, 45.0, 49.0, 33.0, 46.0, 46.0, 41.0, 31.0, 28.0, 35.0, 28.0, 31.0, 13.0, 13.0, 15.0, 11.0, 11.0, 10.0, 9.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.58203125, -4.44378662109375, -4.3055419921875, -4.16729736328125, -4.029052734375, -3.89080810546875, -3.7525634765625, -3.61431884765625, -3.47607421875, -3.33782958984375, -3.1995849609375, -3.06134033203125, -2.923095703125, -2.78485107421875, -2.6466064453125, -2.50836181640625, -2.3701171875, -2.23187255859375, -2.0936279296875, -1.95538330078125, -1.817138671875, -1.67889404296875, -1.5406494140625, -1.40240478515625, -1.26416015625, -1.12591552734375, -0.9876708984375, -0.84942626953125, -0.711181640625, -0.57293701171875, -0.4346923828125, -0.29644775390625, -0.158203125, -0.01995849609375, 0.1182861328125, 0.25653076171875, 0.394775390625, 0.53302001953125, 0.6712646484375, 0.80950927734375, 0.94775390625, 1.08599853515625, 1.2242431640625, 1.36248779296875, 1.500732421875, 1.63897705078125, 1.7772216796875, 1.91546630859375, 2.0537109375, 2.19195556640625, 2.3302001953125, 2.46844482421875, 2.606689453125, 2.74493408203125, 2.8831787109375, 3.02142333984375, 3.15966796875, 3.29791259765625, 3.4361572265625, 3.57440185546875, 3.712646484375, 3.85089111328125, 3.9891357421875, 4.12738037109375, 4.265625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 7.0, 10.0, 2.0, 10.0, 17.0, 21.0, 40.0, 66.0, 85.0, 139.0, 198.0, 320.0, 495.0, 907.0, 1629.0, 2617.0, 4490.0, 8089.0, 14523.0, 29031.0, 67405.0, 200633.0, 437189.0, 165915.0, 57979.0, 25762.0, 13426.0, 7347.0, 4225.0, 2440.0, 1385.0, 834.0, 505.0, 302.0, 182.0, 133.0, 77.0, 48.0, 30.0, 19.0, 10.0, 6.0, 2.0, 1.0, 1.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.08203125, -4.93438720703125, -4.7867431640625, -4.63909912109375, -4.491455078125, -4.34381103515625, -4.1961669921875, -4.04852294921875, -3.90087890625, -3.75323486328125, -3.6055908203125, -3.45794677734375, -3.310302734375, -3.16265869140625, -3.0150146484375, -2.86737060546875, -2.7197265625, -2.57208251953125, -2.4244384765625, -2.27679443359375, -2.129150390625, -1.98150634765625, -1.8338623046875, -1.68621826171875, -1.53857421875, -1.39093017578125, -1.2432861328125, -1.09564208984375, -0.947998046875, -0.80035400390625, -0.6527099609375, -0.50506591796875, -0.357421875, -0.20977783203125, -0.0621337890625, 0.08551025390625, 0.233154296875, 0.38079833984375, 0.5284423828125, 0.67608642578125, 0.82373046875, 0.97137451171875, 1.1190185546875, 1.26666259765625, 1.414306640625, 1.56195068359375, 1.7095947265625, 1.85723876953125, 2.0048828125, 2.15252685546875, 2.3001708984375, 2.44781494140625, 2.595458984375, 2.74310302734375, 2.8907470703125, 3.03839111328125, 3.18603515625, 3.33367919921875, 3.4813232421875, 3.62896728515625, 3.776611328125, 3.92425537109375, 4.0718994140625, 4.21954345703125, 4.3671875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 0.0, 1.0, 5.0, 8.0, 13.0, 16.0, 7.0, 19.0, 21.0, 22.0, 22.0, 32.0, 45.0, 37.0, 33.0, 38.0, 44.0, 63.0, 109.0, 285.0, 1573.0, 179.0, 100.0, 46.0, 47.0, 32.0, 40.0, 33.0, 37.0, 21.0, 16.0, 26.0, 19.0, 20.0, 8.0, 10.0, 8.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.82275390625, -17.3173828125, -16.81201171875, -16.306640625, -15.80126953125, -15.2958984375, -14.79052734375, -14.28515625, -13.77978515625, -13.2744140625, -12.76904296875, -12.263671875, -11.75830078125, -11.2529296875, -10.74755859375, -10.2421875, -9.73681640625, -9.2314453125, -8.72607421875, -8.220703125, -7.71533203125, -7.2099609375, -6.70458984375, -6.19921875, -5.69384765625, -5.1884765625, -4.68310546875, -4.177734375, -3.67236328125, -3.1669921875, -2.66162109375, -2.15625, -1.65087890625, -1.1455078125, -0.64013671875, -0.134765625, 0.37060546875, 0.8759765625, 1.38134765625, 1.88671875, 2.39208984375, 2.8974609375, 3.40283203125, 3.908203125, 4.41357421875, 4.9189453125, 5.42431640625, 5.9296875, 6.43505859375, 6.9404296875, 7.44580078125, 7.951171875, 8.45654296875, 8.9619140625, 9.46728515625, 9.97265625, 10.47802734375, 10.9833984375, 11.48876953125, 11.994140625, 12.49951171875, 13.0048828125, 13.51025390625, 14.015625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 6.0, 9.0, 5.0, 10.0, 19.0, 16.0, 26.0, 45.0, 63.0, 69.0, 98.0, 147.0, 202.0, 253.0, 430.0, 1569.0, 52059.0, 3064165.0, 24044.0, 1091.0, 409.0, 249.0, 199.0, 149.0, 91.0, 69.0, 58.0, 39.0, 31.0, 17.0, 17.0, 10.0, 11.0, 9.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.08154296875, -30.8193359375, -29.55712890625, -28.294921875, -27.03271484375, -25.7705078125, -24.50830078125, -23.24609375, -21.98388671875, -20.7216796875, -19.45947265625, -18.197265625, -16.93505859375, -15.6728515625, -14.41064453125, -13.1484375, -11.88623046875, -10.6240234375, -9.36181640625, -8.099609375, -6.83740234375, -5.5751953125, -4.31298828125, -3.05078125, -1.78857421875, -0.5263671875, 0.73583984375, 1.998046875, 3.26025390625, 4.5224609375, 5.78466796875, 7.046875, 8.30908203125, 9.5712890625, 10.83349609375, 12.095703125, 13.35791015625, 14.6201171875, 15.88232421875, 17.14453125, 18.40673828125, 19.6689453125, 20.93115234375, 22.193359375, 23.45556640625, 24.7177734375, 25.97998046875, 27.2421875, 28.50439453125, 29.7666015625, 31.02880859375, 32.291015625, 33.55322265625, 34.8154296875, 36.07763671875, 37.33984375, 38.60205078125, 39.8642578125, 41.12646484375, 42.388671875, 43.65087890625, 44.9130859375, 46.17529296875, 47.4375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 19.0, 160.0, 514.0, 291.0, 31.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.34165954589844, -151.937744140625, -148.53382873535156, -145.12991333007812, -141.72598266601562, -138.3220672607422, -134.91815185546875, -131.5142364501953, -128.11032104492188, -124.70640563964844, -121.30248260498047, -117.89856719970703, -114.4946517944336, -111.09072875976562, -107.68681335449219, -104.28289794921875, -100.87897491455078, -97.47505950927734, -94.07113647460938, -90.66722106933594, -87.2633056640625, -83.85939025878906, -80.4554672241211, -77.05155181884766, -73.64762878417969, -70.24371337890625, -66.83979034423828, -63.435874938964844, -60.031959533691406, -56.6280403137207, -53.22412109375, -49.82020568847656, -46.416282653808594, -43.01236343383789, -39.60844802856445, -36.20452880859375, -32.80061340332031, -29.39669418334961, -25.992774963378906, -22.588857650756836, -19.184940338134766, -15.781023025512695, -12.377104759216309, -8.973186492919922, -5.569269180297852, -2.1653518676757812, 1.2385673522949219, 4.642484664916992, 8.046401977539062, 11.450319290161133, 14.85423755645752, 18.258155822753906, 21.662073135375977, 25.065990447998047, 28.46990966796875, 31.87382698059082, 35.27774429321289, 38.681663513183594, 42.08557891845703, 45.489498138427734, 48.89341735839844, 52.297332763671875, 55.70125198364258, 59.10517120361328, 62.50908660888672]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 8.0, 11.0, 4.0, 7.0, 6.0, 11.0, 23.0, 19.0, 18.0, 32.0, 28.0, 33.0, 28.0, 29.0, 48.0, 44.0, 39.0, 52.0, 49.0, 56.0, 51.0, 39.0, 40.0, 33.0, 36.0, 22.0, 33.0, 23.0, 30.0, 29.0, 24.0, 18.0, 17.0, 16.0, 10.0, 12.0, 9.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-49.87300109863281, -48.48075866699219, -47.0885124206543, -45.69626998901367, -44.30402374267578, -42.911781311035156, -41.51953887939453, -40.12729263305664, -38.735050201416016, -37.34280776977539, -35.9505615234375, -34.558319091796875, -33.166072845458984, -31.77383041381836, -30.3815860748291, -28.989341735839844, -27.597097396850586, -26.204853057861328, -24.81260871887207, -23.420364379882812, -22.028121948242188, -20.63587760925293, -19.243633270263672, -17.851390838623047, -16.459144592285156, -15.066900253295898, -13.674656867980957, -12.2824125289917, -10.890169143676758, -9.4979248046875, -8.105680465698242, -6.713437080383301, -5.321193695068359, -3.9289498329162598, -2.536705732345581, -1.1444616317749023, 0.24778223037719727, 1.6400260925292969, 3.0322704315185547, 4.424513816833496, 5.816758155822754, 7.2090020179748535, 8.601245880126953, 9.993490219116211, 11.385734558105469, 12.77797794342041, 14.170222282409668, 15.56246566772461, 16.954710006713867, 18.346954345703125, 19.739198684692383, 21.13144302368164, 22.523685455322266, 23.915929794311523, 25.30817413330078, 26.700416564941406, 28.092662811279297, 29.484907150268555, 30.877151489257812, 32.26939392089844, 33.66164016723633, 35.05388259887695, 36.446128845214844, 37.83837127685547, 39.230613708496094]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 7.0, 9.0, 7.0, 12.0, 16.0, 12.0, 12.0, 22.0, 23.0, 20.0, 28.0, 28.0, 21.0, 30.0, 45.0, 36.0, 39.0, 32.0, 45.0, 53.0, 40.0, 36.0, 45.0, 41.0, 30.0, 39.0, 38.0, 24.0, 27.0, 28.0, 21.0, 21.0, 11.0, 17.0, 17.0, 12.0, 6.0, 9.0, 7.0, 4.0, 1.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.37890625, -4.24005126953125, -4.1011962890625, -3.96234130859375, -3.823486328125, -3.68463134765625, -3.5457763671875, -3.40692138671875, -3.26806640625, -3.12921142578125, -2.9903564453125, -2.85150146484375, -2.712646484375, -2.57379150390625, -2.4349365234375, -2.29608154296875, -2.1572265625, -2.01837158203125, -1.8795166015625, -1.74066162109375, -1.601806640625, -1.46295166015625, -1.3240966796875, -1.18524169921875, -1.04638671875, -0.90753173828125, -0.7686767578125, -0.62982177734375, -0.490966796875, -0.35211181640625, -0.2132568359375, -0.07440185546875, 0.064453125, 0.20330810546875, 0.3421630859375, 0.48101806640625, 0.619873046875, 0.75872802734375, 0.8975830078125, 1.03643798828125, 1.17529296875, 1.31414794921875, 1.4530029296875, 1.59185791015625, 1.730712890625, 1.86956787109375, 2.0084228515625, 2.14727783203125, 2.2861328125, 2.42498779296875, 2.5638427734375, 2.70269775390625, 2.841552734375, 2.98040771484375, 3.1192626953125, 3.25811767578125, 3.39697265625, 3.53582763671875, 3.6746826171875, 3.81353759765625, 3.952392578125, 4.09124755859375, 4.2301025390625, 4.36895751953125, 4.5078125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 10.0, 15.0, 14.0, 28.0, 27.0, 42.0, 57.0, 85.0, 127.0, 226.0, 452.0, 969.0, 2556.0, 8490.0, 35330.0, 216090.0, 1629993.0, 1950577.0, 288020.0, 45107.0, 10492.0, 3217.0, 1147.0, 492.0, 274.0, 131.0, 83.0, 53.0, 43.0, 30.0, 26.0, 17.0, 12.0, 7.0, 7.0, 3.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.535888671875, -10.19677734375, -9.857666015625, -9.5185546875, -9.179443359375, -8.84033203125, -8.501220703125, -8.162109375, -7.822998046875, -7.48388671875, -7.144775390625, -6.8056640625, -6.466552734375, -6.12744140625, -5.788330078125, -5.44921875, -5.110107421875, -4.77099609375, -4.431884765625, -4.0927734375, -3.753662109375, -3.41455078125, -3.075439453125, -2.736328125, -2.397216796875, -2.05810546875, -1.718994140625, -1.3798828125, -1.040771484375, -0.70166015625, -0.362548828125, -0.0234375, 0.315673828125, 0.65478515625, 0.993896484375, 1.3330078125, 1.672119140625, 2.01123046875, 2.350341796875, 2.689453125, 3.028564453125, 3.36767578125, 3.706787109375, 4.0458984375, 4.385009765625, 4.72412109375, 5.063232421875, 5.40234375, 5.741455078125, 6.08056640625, 6.419677734375, 6.7587890625, 7.097900390625, 7.43701171875, 7.776123046875, 8.115234375, 8.454345703125, 8.79345703125, 9.132568359375, 9.4716796875, 9.810791015625, 10.14990234375, 10.489013671875, 10.828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 9.0, 11.0, 18.0, 20.0, 33.0, 60.0, 69.0, 104.0, 142.0, 242.0, 365.0, 517.0, 609.0, 581.0, 424.0, 273.0, 186.0, 131.0, 93.0, 54.0, 41.0, 24.0, 18.0, 15.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.328125, -17.8980712890625, -17.468017578125, -17.0379638671875, -16.60791015625, -16.1778564453125, -15.747802734375, -15.3177490234375, -14.8876953125, -14.4576416015625, -14.027587890625, -13.5975341796875, -13.16748046875, -12.7374267578125, -12.307373046875, -11.8773193359375, -11.447265625, -11.0172119140625, -10.587158203125, -10.1571044921875, -9.72705078125, -9.2969970703125, -8.866943359375, -8.4368896484375, -8.0068359375, -7.5767822265625, -7.146728515625, -6.7166748046875, -6.28662109375, -5.8565673828125, -5.426513671875, -4.9964599609375, -4.56640625, -4.1363525390625, -3.706298828125, -3.2762451171875, -2.84619140625, -2.4161376953125, -1.986083984375, -1.5560302734375, -1.1259765625, -0.6959228515625, -0.265869140625, 0.1641845703125, 0.59423828125, 1.0242919921875, 1.454345703125, 1.8843994140625, 2.314453125, 2.7445068359375, 3.174560546875, 3.6046142578125, 4.03466796875, 4.4647216796875, 4.894775390625, 5.3248291015625, 5.7548828125, 6.1849365234375, 6.614990234375, 7.0450439453125, 7.47509765625, 7.9051513671875, 8.335205078125, 8.7652587890625, 9.1953125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 8.0, 13.0, 13.0, 29.0, 43.0, 66.0, 118.0, 212.0, 365.0, 620.0, 2974.0, 198981.0, 3942974.0, 45074.0, 1589.0, 485.0, 274.0, 172.0, 75.0, 80.0, 39.0, 22.0, 14.0, 18.0, 10.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.6875, -28.154296875, -26.62109375, -25.087890625, -23.5546875, -22.021484375, -20.48828125, -18.955078125, -17.421875, -15.888671875, -14.35546875, -12.822265625, -11.2890625, -9.755859375, -8.22265625, -6.689453125, -5.15625, -3.623046875, -2.08984375, -0.556640625, 0.9765625, 2.509765625, 4.04296875, 5.576171875, 7.109375, 8.642578125, 10.17578125, 11.708984375, 13.2421875, 14.775390625, 16.30859375, 17.841796875, 19.375, 20.908203125, 22.44140625, 23.974609375, 25.5078125, 27.041015625, 28.57421875, 30.107421875, 31.640625, 33.173828125, 34.70703125, 36.240234375, 37.7734375, 39.306640625, 40.83984375, 42.373046875, 43.90625, 45.439453125, 46.97265625, 48.505859375, 50.0390625, 51.572265625, 53.10546875, 54.638671875, 56.171875, 57.705078125, 59.23828125, 60.771484375, 62.3046875, 63.837890625, 65.37109375, 66.904296875, 68.4375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 14.0, 21.0, 41.0, 42.0, 74.0, 96.0, 132.0, 132.0, 118.0, 93.0, 88.0, 51.0, 47.0, 25.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.19202423095703, -63.399169921875, -61.6063117980957, -59.81345748901367, -58.020599365234375, -56.227745056152344, -54.43489074707031, -52.642032623291016, -50.84917449951172, -49.05632019042969, -47.26346206665039, -45.47060775756836, -43.67774963378906, -41.88489532470703, -40.092041015625, -38.2991828918457, -36.50632858276367, -34.71347427368164, -32.920616149902344, -31.127761840820312, -29.334903717041016, -27.542049407958984, -25.74919319152832, -23.956336975097656, -22.163480758666992, -20.370624542236328, -18.577768325805664, -16.784912109375, -14.992056846618652, -13.199200630187988, -11.40634536743164, -9.613489151000977, -7.8206329345703125, -6.027776718139648, -4.234920978546143, -2.4420652389526367, -0.6492090225219727, 1.1436471939086914, 2.936502456665039, 4.729358673095703, 6.522214889526367, 8.315071105957031, 10.107927322387695, 11.900782585144043, 13.693638801574707, 15.486495018005371, 17.27935028076172, 19.072206497192383, 20.865062713623047, 22.65791893005371, 24.450775146484375, 26.243629455566406, 28.036487579345703, 29.829341888427734, 31.6221981048584, 33.41505432128906, 35.207908630371094, 37.000762939453125, 38.79362106323242, 40.58647537231445, 42.37933349609375, 44.17218780517578, 45.96504211425781, 47.75790023803711, 49.550758361816406]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 11.0, 16.0, 14.0, 12.0, 12.0, 13.0, 17.0, 21.0, 20.0, 19.0, 24.0, 29.0, 37.0, 34.0, 35.0, 44.0, 46.0, 42.0, 35.0, 46.0, 31.0, 37.0, 36.0, 30.0, 34.0, 34.0, 31.0, 24.0, 32.0, 23.0, 21.0, 17.0, 16.0, 16.0, 13.0, 11.0, 10.0, 11.0, 12.0, 5.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.11199951171875, -30.089059829711914, -29.066118240356445, -28.04317855834961, -27.02023696899414, -25.997297286987305, -24.97435760498047, -23.951416015625, -22.928476333618164, -21.905536651611328, -20.88259506225586, -19.859655380249023, -18.836715698242188, -17.81377410888672, -16.790834426879883, -15.76789379119873, -14.744953155517578, -13.722012519836426, -12.699071884155273, -11.676132202148438, -10.653191566467285, -9.630250930786133, -8.607311248779297, -7.5843706130981445, -6.561429977416992, -5.53848934173584, -4.515549182891846, -3.4926087856292725, -2.469668388366699, -1.4467277526855469, -0.42378759384155273, 0.5991525650024414, 1.6220932006835938, 2.645033597946167, 3.6679739952087402, 4.690914154052734, 5.713854789733887, 6.736795425415039, 7.759735584259033, 8.782675743103027, 9.80561637878418, 10.828557014465332, 11.851497650146484, 12.87443733215332, 13.897377967834473, 14.920318603515625, 15.943258285522461, 16.966197967529297, 17.989139556884766, 19.0120792388916, 20.03502082824707, 21.057960510253906, 22.080902099609375, 23.10384178161621, 24.126781463623047, 25.149723052978516, 26.17266273498535, 27.195602416992188, 28.218544006347656, 29.241483688354492, 30.264423370361328, 31.287364959716797, 32.310306549072266, 33.33324432373047, 34.35618591308594]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 11.0, 10.0, 11.0, 19.0, 13.0, 18.0, 30.0, 30.0, 31.0, 31.0, 32.0, 34.0, 34.0, 42.0, 44.0, 50.0, 39.0, 51.0, 33.0, 36.0, 45.0, 32.0, 34.0, 46.0, 38.0, 21.0, 19.0, 25.0, 17.0, 18.0, 17.0, 18.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.5728759765625, -4.427001953125, -4.2811279296875, -4.13525390625, -3.9893798828125, -3.843505859375, -3.6976318359375, -3.5517578125, -3.4058837890625, -3.260009765625, -3.1141357421875, -2.96826171875, -2.8223876953125, -2.676513671875, -2.5306396484375, -2.384765625, -2.2388916015625, -2.093017578125, -1.9471435546875, -1.80126953125, -1.6553955078125, -1.509521484375, -1.3636474609375, -1.2177734375, -1.0718994140625, -0.926025390625, -0.7801513671875, -0.63427734375, -0.4884033203125, -0.342529296875, -0.1966552734375, -0.05078125, 0.0950927734375, 0.240966796875, 0.3868408203125, 0.53271484375, 0.6785888671875, 0.824462890625, 0.9703369140625, 1.1162109375, 1.2620849609375, 1.407958984375, 1.5538330078125, 1.69970703125, 1.8455810546875, 1.991455078125, 2.1373291015625, 2.283203125, 2.4290771484375, 2.574951171875, 2.7208251953125, 2.86669921875, 3.0125732421875, 3.158447265625, 3.3043212890625, 3.4501953125, 3.5960693359375, 3.741943359375, 3.8878173828125, 4.03369140625, 4.1795654296875, 4.325439453125, 4.4713134765625, 4.6171875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 9.0, 9.0, 18.0, 17.0, 28.0, 43.0, 66.0, 91.0, 156.0, 233.0, 321.0, 505.0, 736.0, 1106.0, 1551.0, 2315.0, 3616.0, 5347.0, 7748.0, 11456.0, 16480.0, 24178.0, 34468.0, 48987.0, 69084.0, 94653.0, 122971.0, 140737.0, 126064.0, 98089.0, 71327.0, 50954.0, 36252.0, 24899.0, 17318.0, 11731.0, 8054.0, 5555.0, 3778.0, 2447.0, 1668.0, 1196.0, 751.0, 486.0, 359.0, 237.0, 166.0, 95.0, 76.0, 56.0, 32.0, 16.0, 13.0, 6.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0], "bins": [-0.57177734375, -0.5536575317382812, -0.5355377197265625, -0.5174179077148438, -0.499298095703125, -0.48117828369140625, -0.4630584716796875, -0.44493865966796875, -0.42681884765625, -0.40869903564453125, -0.3905792236328125, -0.37245941162109375, -0.354339599609375, -0.33621978759765625, -0.3180999755859375, -0.29998016357421875, -0.2818603515625, -0.26374053955078125, -0.2456207275390625, -0.22750091552734375, -0.209381103515625, -0.19126129150390625, -0.1731414794921875, -0.15502166748046875, -0.13690185546875, -0.11878204345703125, -0.1006622314453125, -0.08254241943359375, -0.064422607421875, -0.04630279541015625, -0.0281829833984375, -0.01006317138671875, 0.008056640625, 0.02617645263671875, 0.0442962646484375, 0.06241607666015625, 0.080535888671875, 0.09865570068359375, 0.1167755126953125, 0.13489532470703125, 0.15301513671875, 0.17113494873046875, 0.1892547607421875, 0.20737457275390625, 0.225494384765625, 0.24361419677734375, 0.2617340087890625, 0.27985382080078125, 0.2979736328125, 0.31609344482421875, 0.3342132568359375, 0.35233306884765625, 0.370452880859375, 0.38857269287109375, 0.4066925048828125, 0.42481231689453125, 0.44293212890625, 0.46105194091796875, 0.4791717529296875, 0.49729156494140625, 0.515411376953125, 0.5335311889648438, 0.5516510009765625, 0.5697708129882812, 0.587890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 6.0, 5.0, 3.0, 12.0, 10.0, 12.0, 13.0, 18.0, 19.0, 26.0, 27.0, 35.0, 30.0, 37.0, 27.0, 28.0, 43.0, 25.0, 39.0, 36.0, 40.0, 1062.0, 38.0, 42.0, 25.0, 27.0, 40.0, 30.0, 29.0, 24.0, 19.0, 22.0, 23.0, 22.0, 20.0, 17.0, 12.0, 13.0, 14.0, 5.0, 9.0, 6.0, 4.0, 7.0, 5.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0], "bins": [-2.685546875, -2.600433349609375, -2.51531982421875, -2.430206298828125, -2.3450927734375, -2.259979248046875, -2.17486572265625, -2.089752197265625, -2.004638671875, -1.919525146484375, -1.83441162109375, -1.749298095703125, -1.6641845703125, -1.579071044921875, -1.49395751953125, -1.408843994140625, -1.32373046875, -1.238616943359375, -1.15350341796875, -1.068389892578125, -0.9832763671875, -0.898162841796875, -0.81304931640625, -0.727935791015625, -0.642822265625, -0.557708740234375, -0.47259521484375, -0.387481689453125, -0.3023681640625, -0.217254638671875, -0.13214111328125, -0.047027587890625, 0.0380859375, 0.123199462890625, 0.20831298828125, 0.293426513671875, 0.3785400390625, 0.463653564453125, 0.54876708984375, 0.633880615234375, 0.718994140625, 0.804107666015625, 0.88922119140625, 0.974334716796875, 1.0594482421875, 1.144561767578125, 1.22967529296875, 1.314788818359375, 1.39990234375, 1.485015869140625, 1.57012939453125, 1.655242919921875, 1.7403564453125, 1.825469970703125, 1.91058349609375, 1.995697021484375, 2.080810546875, 2.165924072265625, 2.25103759765625, 2.336151123046875, 2.4212646484375, 2.506378173828125, 2.59149169921875, 2.676605224609375, 2.76171875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 17.0, 14.0, 20.0, 25.0, 62.0, 122.0, 133.0, 171.0, 289.0, 466.0, 723.0, 1075.0, 1576.0, 2484.0, 3628.0, 5732.0, 9132.0, 14412.0, 22633.0, 35268.0, 54148.0, 81988.0, 115257.0, 163173.0, 1185756.0, 128224.0, 93589.0, 63180.0, 40970.0, 26231.0, 16601.0, 10717.0, 6788.0, 4298.0, 2889.0, 1824.0, 1160.0, 774.0, 577.0, 348.0, 212.0, 141.0, 88.0, 85.0, 45.0, 30.0, 27.0, 10.0, 10.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.380126953125, -0.3683128356933594, -0.35649871826171875, -0.3446846008300781, -0.3328704833984375, -0.3210563659667969, -0.30924224853515625, -0.2974281311035156, -0.285614013671875, -0.2737998962402344, -0.26198577880859375, -0.2501716613769531, -0.2383575439453125, -0.22654342651367188, -0.21472930908203125, -0.20291519165039062, -0.19110107421875, -0.17928695678710938, -0.16747283935546875, -0.15565872192382812, -0.1438446044921875, -0.13203048706054688, -0.12021636962890625, -0.10840225219726562, -0.096588134765625, -0.08477401733398438, -0.07295989990234375, -0.061145782470703125, -0.0493316650390625, -0.037517547607421875, -0.02570343017578125, -0.013889312744140625, -0.0020751953125, 0.009738922119140625, 0.02155303955078125, 0.033367156982421875, 0.0451812744140625, 0.056995391845703125, 0.06880950927734375, 0.08062362670898438, 0.092437744140625, 0.10425186157226562, 0.11606597900390625, 0.12788009643554688, 0.1396942138671875, 0.15150833129882812, 0.16332244873046875, 0.17513656616210938, 0.18695068359375, 0.19876480102539062, 0.21057891845703125, 0.22239303588867188, 0.2342071533203125, 0.24602127075195312, 0.25783538818359375, 0.2696495056152344, 0.281463623046875, 0.2932777404785156, 0.30509185791015625, 0.3169059753417969, 0.3287200927734375, 0.3405342102050781, 0.35234832763671875, 0.3641624450683594, 0.3759765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 1.0, 10.0, 12.0, 15.0, 22.0, 19.0, 34.0, 42.0, 58.0, 73.0, 78.0, 78.0, 109.0, 83.0, 81.0, 56.0, 45.0, 38.0, 31.0, 32.0, 19.0, 17.0, 7.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018951416015625, -0.018333911895751953, -0.017716407775878906, -0.01709890365600586, -0.016481399536132812, -0.015863895416259766, -0.015246391296386719, -0.014628887176513672, -0.014011383056640625, -0.013393878936767578, -0.012776374816894531, -0.012158870697021484, -0.011541366577148438, -0.01092386245727539, -0.010306358337402344, -0.009688854217529297, -0.00907135009765625, -0.008453845977783203, -0.007836341857910156, -0.007218837738037109, -0.0066013336181640625, -0.005983829498291016, -0.005366325378417969, -0.004748821258544922, -0.004131317138671875, -0.003513813018798828, -0.0028963088989257812, -0.0022788047790527344, -0.0016613006591796875, -0.0010437965393066406, -0.00042629241943359375, 0.00019121170043945312, 0.0008087158203125, 0.0014262199401855469, 0.0020437240600585938, 0.0026612281799316406, 0.0032787322998046875, 0.0038962364196777344, 0.004513740539550781, 0.005131244659423828, 0.005748748779296875, 0.006366252899169922, 0.006983757019042969, 0.007601261138916016, 0.008218765258789062, 0.00883626937866211, 0.009453773498535156, 0.010071277618408203, 0.01068878173828125, 0.011306285858154297, 0.011923789978027344, 0.01254129409790039, 0.013158798217773438, 0.013776302337646484, 0.014393806457519531, 0.015011310577392578, 0.015628814697265625, 0.016246318817138672, 0.01686382293701172, 0.017481327056884766, 0.018098831176757812, 0.01871633529663086, 0.019333839416503906, 0.019951343536376953, 0.02056884765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 7.0, 10.0, 6.0, 19.0, 23.0, 34.0, 47.0, 59.0, 102.0, 259.0, 922.0, 26075.0, 1013469.0, 6455.0, 571.0, 175.0, 107.0, 69.0, 43.0, 37.0, 19.0, 12.0, 6.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447021484375, -0.4336128234863281, -0.42020416259765625, -0.4067955017089844, -0.3933868408203125, -0.3799781799316406, -0.36656951904296875, -0.3531608581542969, -0.339752197265625, -0.3263435363769531, -0.31293487548828125, -0.2995262145996094, -0.2861175537109375, -0.2727088928222656, -0.25930023193359375, -0.24589157104492188, -0.23248291015625, -0.21907424926757812, -0.20566558837890625, -0.19225692749023438, -0.1788482666015625, -0.16543960571289062, -0.15203094482421875, -0.13862228393554688, -0.125213623046875, -0.11180496215820312, -0.09839630126953125, -0.08498764038085938, -0.0715789794921875, -0.058170318603515625, -0.04476165771484375, -0.031352996826171875, -0.0179443359375, -0.004535675048828125, 0.00887298583984375, 0.022281646728515625, 0.0356903076171875, 0.049098968505859375, 0.06250762939453125, 0.07591629028320312, 0.089324951171875, 0.10273361206054688, 0.11614227294921875, 0.12955093383789062, 0.1429595947265625, 0.15636825561523438, 0.16977691650390625, 0.18318557739257812, 0.19659423828125, 0.21000289916992188, 0.22341156005859375, 0.23682022094726562, 0.2502288818359375, 0.2636375427246094, 0.27704620361328125, 0.2904548645019531, 0.303863525390625, 0.3172721862792969, 0.33068084716796875, 0.3440895080566406, 0.3574981689453125, 0.3709068298339844, 0.38431549072265625, 0.3977241516113281, 0.4111328125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 109.0, 747.0, 140.0, 10.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48654812574386597, -0.4779569208621979, -0.4693656861782074, -0.4607744812965393, -0.4521832764148712, -0.4435920715332031, -0.43500083684921265, -0.42640963196754456, -0.41781842708587646, -0.4092272222042084, -0.4006359875202179, -0.3920447826385498, -0.3834535777568817, -0.3748623728752136, -0.36627113819122314, -0.35767993330955505, -0.3490886986255646, -0.3404974937438965, -0.331906259059906, -0.3233150541782379, -0.3147238492965698, -0.30613261461257935, -0.29754140973091125, -0.28895020484924316, -0.2803589701652527, -0.2717677652835846, -0.2631765305995941, -0.254585325717926, -0.24599412083625793, -0.23740290105342865, -0.22881168127059937, -0.22022047638893127, -0.2116292417049408, -0.2030380219221115, -0.19444681704044342, -0.18585559725761414, -0.17726439237594604, -0.16867317259311676, -0.16008195281028748, -0.15149074792861938, -0.1428995430469513, -0.134308323264122, -0.12571711838245392, -0.11712589859962463, -0.10853468626737595, -0.09994347393512726, -0.09135225415229797, -0.08276104182004929, -0.07416982203722, -0.06557860970497131, -0.05698739364743233, -0.04839617758989334, -0.03980496525764465, -0.031213752925395966, -0.02262253686785698, -0.014031320810317993, -0.005440108478069305, 0.0031511057168245316, 0.011742319911718369, 0.020333534106612206, 0.028924748301506042, 0.03751596063375473, 0.046107176691293716, 0.0546983927488327, 0.06328960508108139]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 6.0, 10.0, 16.0, 5.0, 18.0, 7.0, 25.0, 25.0, 29.0, 31.0, 33.0, 43.0, 39.0, 36.0, 46.0, 45.0, 49.0, 50.0, 44.0, 36.0, 49.0, 37.0, 34.0, 31.0, 36.0, 34.0, 25.0, 21.0, 28.0, 19.0, 16.0, 12.0, 12.0, 9.0, 10.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.03310739994049072, -0.032058462500572205, -0.031009521335363388, -0.02996058203279972, -0.028911642730236053, -0.027862703427672386, -0.02681376412510872, -0.02576482482254505, -0.024715885519981384, -0.023666946217417717, -0.02261800691485405, -0.021569067612290382, -0.020520128309726715, -0.019471189007163048, -0.01842224970459938, -0.017373310402035713, -0.016324371099472046, -0.015275431796908379, -0.014226492494344711, -0.013177553191781044, -0.012128613889217377, -0.01107967458665371, -0.010030735284090042, -0.008981795981526375, -0.007932856678962708, -0.00688391737639904, -0.005834978073835373, -0.004786038771271706, -0.0037370994687080383, -0.002688160166144371, -0.0016392208635807037, -0.0005902815610170364, 0.00045865774154663086, 0.0015075970441102982, 0.0025565363466739655, 0.0036054756492376328, 0.0046544149518013, 0.005703354254364967, 0.006752293556928635, 0.007801232859492302, 0.00885017216205597, 0.009899111464619637, 0.010948050767183304, 0.011996990069746971, 0.013045929372310638, 0.014094868674874306, 0.015143807977437973, 0.01619274728000164, 0.017241686582565308, 0.018290625885128975, 0.019339565187692642, 0.02038850449025631, 0.021437443792819977, 0.022486383095383644, 0.02353532239794731, 0.02458426170051098, 0.025633201003074646, 0.026682140305638313, 0.02773107960820198, 0.028780018910765648, 0.029828958213329315, 0.030877897515892982, 0.03192683681845665, 0.032975777983665466, 0.034024715423583984]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 9.0, 8.0, 10.0, 11.0, 10.0, 11.0, 19.0, 13.0, 17.0, 31.0, 30.0, 31.0, 30.0, 33.0, 34.0, 34.0, 41.0, 44.0, 50.0, 39.0, 52.0, 33.0, 36.0, 45.0, 32.0, 34.0, 46.0, 38.0, 21.0, 19.0, 25.0, 17.0, 18.0, 18.0, 17.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.5728759765625, -4.427001953125, -4.2811279296875, -4.13525390625, -3.9893798828125, -3.843505859375, -3.6976318359375, -3.5517578125, -3.4058837890625, -3.260009765625, -3.1141357421875, -2.96826171875, -2.8223876953125, -2.676513671875, -2.5306396484375, -2.384765625, -2.2388916015625, -2.093017578125, -1.9471435546875, -1.80126953125, -1.6553955078125, -1.509521484375, -1.3636474609375, -1.2177734375, -1.0718994140625, -0.926025390625, -0.7801513671875, -0.63427734375, -0.4884033203125, -0.342529296875, -0.1966552734375, -0.05078125, 0.0950927734375, 0.240966796875, 0.3868408203125, 0.53271484375, 0.6785888671875, 0.824462890625, 0.9703369140625, 1.1162109375, 1.2620849609375, 1.407958984375, 1.5538330078125, 1.69970703125, 1.8455810546875, 1.991455078125, 2.1373291015625, 2.283203125, 2.4290771484375, 2.574951171875, 2.7208251953125, 2.86669921875, 3.0125732421875, 3.158447265625, 3.3043212890625, 3.4501953125, 3.5960693359375, 3.741943359375, 3.8878173828125, 4.03369140625, 4.1795654296875, 4.325439453125, 4.4713134765625, 4.6171875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 7.0, 14.0, 13.0, 16.0, 16.0, 24.0, 33.0, 57.0, 98.0, 167.0, 275.0, 488.0, 817.0, 1582.0, 2905.0, 6112.0, 13015.0, 31416.0, 82369.0, 229366.0, 421566.0, 157831.0, 57739.0, 22920.0, 9733.0, 4729.0, 2296.0, 1187.0, 684.0, 424.0, 235.0, 144.0, 87.0, 58.0, 45.0, 27.0, 14.0, 14.0, 10.0, 2.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.7265625, -4.584716796875, -4.44287109375, -4.301025390625, -4.1591796875, -4.017333984375, -3.87548828125, -3.733642578125, -3.591796875, -3.449951171875, -3.30810546875, -3.166259765625, -3.0244140625, -2.882568359375, -2.74072265625, -2.598876953125, -2.45703125, -2.315185546875, -2.17333984375, -2.031494140625, -1.8896484375, -1.747802734375, -1.60595703125, -1.464111328125, -1.322265625, -1.180419921875, -1.03857421875, -0.896728515625, -0.7548828125, -0.613037109375, -0.47119140625, -0.329345703125, -0.1875, -0.045654296875, 0.09619140625, 0.238037109375, 0.3798828125, 0.521728515625, 0.66357421875, 0.805419921875, 0.947265625, 1.089111328125, 1.23095703125, 1.372802734375, 1.5146484375, 1.656494140625, 1.79833984375, 1.940185546875, 2.08203125, 2.223876953125, 2.36572265625, 2.507568359375, 2.6494140625, 2.791259765625, 2.93310546875, 3.074951171875, 3.216796875, 3.358642578125, 3.50048828125, 3.642333984375, 3.7841796875, 3.926025390625, 4.06787109375, 4.209716796875, 4.3515625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 4.0, 8.0, 5.0, 9.0, 12.0, 15.0, 18.0, 16.0, 20.0, 31.0, 23.0, 32.0, 27.0, 38.0, 55.0, 61.0, 41.0, 66.0, 183.0, 1591.0, 268.0, 81.0, 53.0, 44.0, 52.0, 30.0, 37.0, 39.0, 27.0, 22.0, 17.0, 24.0, 13.0, 16.0, 11.0, 8.0, 6.0, 8.0, 7.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.6844482421875, -13.189208984375, -12.6939697265625, -12.19873046875, -11.7034912109375, -11.208251953125, -10.7130126953125, -10.2177734375, -9.7225341796875, -9.227294921875, -8.7320556640625, -8.23681640625, -7.7415771484375, -7.246337890625, -6.7510986328125, -6.255859375, -5.7606201171875, -5.265380859375, -4.7701416015625, -4.27490234375, -3.7796630859375, -3.284423828125, -2.7891845703125, -2.2939453125, -1.7987060546875, -1.303466796875, -0.8082275390625, -0.31298828125, 0.1822509765625, 0.677490234375, 1.1727294921875, 1.66796875, 2.1632080078125, 2.658447265625, 3.1536865234375, 3.64892578125, 4.1441650390625, 4.639404296875, 5.1346435546875, 5.6298828125, 6.1251220703125, 6.620361328125, 7.1156005859375, 7.61083984375, 8.1060791015625, 8.601318359375, 9.0965576171875, 9.591796875, 10.0870361328125, 10.582275390625, 11.0775146484375, 11.57275390625, 12.0679931640625, 12.563232421875, 13.0584716796875, 13.5537109375, 14.0489501953125, 14.544189453125, 15.0394287109375, 15.53466796875, 16.0299072265625, 16.525146484375, 17.0203857421875, 17.515625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 3.0, 7.0, 11.0, 12.0, 11.0, 14.0, 23.0, 36.0, 33.0, 50.0, 71.0, 113.0, 161.0, 214.0, 344.0, 593.0, 3067.0, 826934.0, 2308250.0, 3974.0, 655.0, 369.0, 228.0, 129.0, 93.0, 84.0, 57.0, 37.0, 34.0, 25.0, 15.0, 13.0, 11.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-53.53125, -52.22705078125, -50.9228515625, -49.61865234375, -48.314453125, -47.01025390625, -45.7060546875, -44.40185546875, -43.09765625, -41.79345703125, -40.4892578125, -39.18505859375, -37.880859375, -36.57666015625, -35.2724609375, -33.96826171875, -32.6640625, -31.35986328125, -30.0556640625, -28.75146484375, -27.447265625, -26.14306640625, -24.8388671875, -23.53466796875, -22.23046875, -20.92626953125, -19.6220703125, -18.31787109375, -17.013671875, -15.70947265625, -14.4052734375, -13.10107421875, -11.796875, -10.49267578125, -9.1884765625, -7.88427734375, -6.580078125, -5.27587890625, -3.9716796875, -2.66748046875, -1.36328125, -0.05908203125, 1.2451171875, 2.54931640625, 3.853515625, 5.15771484375, 6.4619140625, 7.76611328125, 9.0703125, 10.37451171875, 11.6787109375, 12.98291015625, 14.287109375, 15.59130859375, 16.8955078125, 18.19970703125, 19.50390625, 20.80810546875, 22.1123046875, 23.41650390625, 24.720703125, 26.02490234375, 27.3291015625, 28.63330078125, 29.9375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 366.0, 617.0, 29.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.06431579589844, -224.6688995361328, -220.2734832763672, -215.87806701660156, -211.48265075683594, -207.0872344970703, -202.6918182373047, -198.29640197753906, -193.90098571777344, -189.5055694580078, -185.1101531982422, -180.71473693847656, -176.31932067871094, -171.9239044189453, -167.5284881591797, -163.13307189941406, -158.7376708984375, -154.34225463867188, -149.94683837890625, -145.55142211914062, -141.156005859375, -136.76058959960938, -132.36517333984375, -127.96975708007812, -123.5743408203125, -119.17892456054688, -114.78350830078125, -110.38809204101562, -105.99267578125, -101.59725952148438, -97.20184326171875, -92.80642700195312, -88.41101837158203, -84.0156021118164, -79.62018585205078, -75.22476959228516, -70.82935333251953, -66.4339370727539, -62.03852462768555, -57.64310836791992, -53.2476921081543, -48.85227584838867, -44.45685958862305, -40.06144714355469, -35.66603088378906, -31.270612716674805, -26.875198364257812, -22.479782104492188, -18.084365844726562, -13.688949584960938, -9.293534278869629, -4.89811897277832, -0.5027027130126953, 3.8927135467529297, 8.288127899169922, 12.683544158935547, 17.078960418701172, 21.474376678466797, 25.869792938232422, 30.265207290649414, 34.660621643066406, 39.05603790283203, 43.451454162597656, 47.84687042236328, 52.242286682128906]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 0.0, 8.0, 5.0, 7.0, 7.0, 9.0, 13.0, 17.0, 13.0, 18.0, 16.0, 19.0, 28.0, 22.0, 28.0, 35.0, 34.0, 38.0, 27.0, 25.0, 39.0, 33.0, 36.0, 46.0, 41.0, 38.0, 30.0, 40.0, 33.0, 33.0, 25.0, 34.0, 25.0, 24.0, 23.0, 16.0, 13.0, 16.0, 18.0, 16.0, 16.0, 5.0, 10.0, 0.0, 2.0, 4.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-40.13652038574219, -38.909637451171875, -37.68275451660156, -36.455867767333984, -35.22898483276367, -34.00210189819336, -32.77521514892578, -31.54833221435547, -30.321449279785156, -29.094566345214844, -27.8676815032959, -26.640796661376953, -25.41391372680664, -24.187030792236328, -22.960145950317383, -21.733261108398438, -20.506378173828125, -19.279495239257812, -18.052610397338867, -16.825725555419922, -15.59884262084961, -14.37195873260498, -13.145074844360352, -11.918190956115723, -10.691307067871094, -9.464423179626465, -8.237539291381836, -7.010655403137207, -5.783771514892578, -4.556887626647949, -3.3300037384033203, -2.1031198501586914, -0.8762359619140625, 0.3506479263305664, 1.5775318145751953, 2.804415702819824, 4.031299591064453, 5.258183479309082, 6.485067367553711, 7.71195125579834, 8.938835144042969, 10.165719032287598, 11.392602920532227, 12.619486808776855, 13.846370697021484, 15.073254585266113, 16.300138473510742, 17.527023315429688, 18.75390625, 19.980789184570312, 21.207674026489258, 22.434558868408203, 23.661441802978516, 24.888324737548828, 26.115209579467773, 27.34209442138672, 28.56897735595703, 29.795860290527344, 31.02274513244629, 32.249629974365234, 33.47651290893555, 34.70339584350586, 35.93028259277344, 37.15716552734375, 38.38404846191406]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 5.0, 11.0, 8.0, 14.0, 16.0, 10.0, 13.0, 20.0, 20.0, 28.0, 24.0, 31.0, 27.0, 30.0, 43.0, 39.0, 34.0, 44.0, 43.0, 38.0, 54.0, 39.0, 32.0, 36.0, 43.0, 39.0, 36.0, 31.0, 23.0, 23.0, 27.0, 17.0, 11.0, 17.0, 22.0, 8.0, 8.0, 6.0, 10.0, 1.0, 1.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.99609375, -4.846435546875, -4.69677734375, -4.547119140625, -4.3974609375, -4.247802734375, -4.09814453125, -3.948486328125, -3.798828125, -3.649169921875, -3.49951171875, -3.349853515625, -3.2001953125, -3.050537109375, -2.90087890625, -2.751220703125, -2.6015625, -2.451904296875, -2.30224609375, -2.152587890625, -2.0029296875, -1.853271484375, -1.70361328125, -1.553955078125, -1.404296875, -1.254638671875, -1.10498046875, -0.955322265625, -0.8056640625, -0.656005859375, -0.50634765625, -0.356689453125, -0.20703125, -0.057373046875, 0.09228515625, 0.241943359375, 0.3916015625, 0.541259765625, 0.69091796875, 0.840576171875, 0.990234375, 1.139892578125, 1.28955078125, 1.439208984375, 1.5888671875, 1.738525390625, 1.88818359375, 2.037841796875, 2.1875, 2.337158203125, 2.48681640625, 2.636474609375, 2.7861328125, 2.935791015625, 3.08544921875, 3.235107421875, 3.384765625, 3.534423828125, 3.68408203125, 3.833740234375, 3.9833984375, 4.133056640625, 4.28271484375, 4.432373046875, 4.58203125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 8.0, 5.0, 10.0, 19.0, 18.0, 22.0, 31.0, 35.0, 44.0, 61.0, 68.0, 96.0, 128.0, 194.0, 354.0, 605.0, 1293.0, 3393.0, 10255.0, 38795.0, 212364.0, 1409383.0, 2018593.0, 408915.0, 65103.0, 15536.0, 4939.0, 1930.0, 841.0, 401.0, 257.0, 139.0, 109.0, 61.0, 63.0, 50.0, 41.0, 31.0, 21.0, 15.0, 11.0, 11.0, 13.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.6796875, -10.3670654296875, -10.054443359375, -9.7418212890625, -9.42919921875, -9.1165771484375, -8.803955078125, -8.4913330078125, -8.1787109375, -7.8660888671875, -7.553466796875, -7.2408447265625, -6.92822265625, -6.6156005859375, -6.302978515625, -5.9903564453125, -5.677734375, -5.3651123046875, -5.052490234375, -4.7398681640625, -4.42724609375, -4.1146240234375, -3.802001953125, -3.4893798828125, -3.1767578125, -2.8641357421875, -2.551513671875, -2.2388916015625, -1.92626953125, -1.6136474609375, -1.301025390625, -0.9884033203125, -0.67578125, -0.3631591796875, -0.050537109375, 0.2620849609375, 0.57470703125, 0.8873291015625, 1.199951171875, 1.5125732421875, 1.8251953125, 2.1378173828125, 2.450439453125, 2.7630615234375, 3.07568359375, 3.3883056640625, 3.700927734375, 4.0135498046875, 4.326171875, 4.6387939453125, 4.951416015625, 5.2640380859375, 5.57666015625, 5.8892822265625, 6.201904296875, 6.5145263671875, 6.8271484375, 7.1397705078125, 7.452392578125, 7.7650146484375, 8.07763671875, 8.3902587890625, 8.702880859375, 9.0155029296875, 9.328125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 9.0, 9.0, 9.0, 10.0, 18.0, 16.0, 20.0, 38.0, 40.0, 71.0, 74.0, 107.0, 148.0, 198.0, 269.0, 400.0, 428.0, 517.0, 420.0, 366.0, 239.0, 183.0, 133.0, 104.0, 66.0, 50.0, 38.0, 25.0, 25.0, 11.0, 10.0, 11.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.1121826171875, -10.779052734375, -10.4459228515625, -10.11279296875, -9.7796630859375, -9.446533203125, -9.1134033203125, -8.7802734375, -8.4471435546875, -8.114013671875, -7.7808837890625, -7.44775390625, -7.1146240234375, -6.781494140625, -6.4483642578125, -6.115234375, -5.7821044921875, -5.448974609375, -5.1158447265625, -4.78271484375, -4.4495849609375, -4.116455078125, -3.7833251953125, -3.4501953125, -3.1170654296875, -2.783935546875, -2.4508056640625, -2.11767578125, -1.7845458984375, -1.451416015625, -1.1182861328125, -0.78515625, -0.4520263671875, -0.118896484375, 0.2142333984375, 0.54736328125, 0.8804931640625, 1.213623046875, 1.5467529296875, 1.8798828125, 2.2130126953125, 2.546142578125, 2.8792724609375, 3.21240234375, 3.5455322265625, 3.878662109375, 4.2117919921875, 4.544921875, 4.8780517578125, 5.211181640625, 5.5443115234375, 5.87744140625, 6.2105712890625, 6.543701171875, 6.8768310546875, 7.2099609375, 7.5430908203125, 7.876220703125, 8.2093505859375, 8.54248046875, 8.8756103515625, 9.208740234375, 9.5418701171875, 9.875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 10.0, 10.0, 14.0, 28.0, 38.0, 47.0, 66.0, 92.0, 154.0, 224.0, 373.0, 997.0, 13664.0, 3537775.0, 635149.0, 3992.0, 645.0, 316.0, 221.0, 126.0, 102.0, 67.0, 45.0, 24.0, 25.0, 18.0, 21.0, 12.0, 7.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.0625, -43.44384765625, -41.8251953125, -40.20654296875, -38.587890625, -36.96923828125, -35.3505859375, -33.73193359375, -32.11328125, -30.49462890625, -28.8759765625, -27.25732421875, -25.638671875, -24.02001953125, -22.4013671875, -20.78271484375, -19.1640625, -17.54541015625, -15.9267578125, -14.30810546875, -12.689453125, -11.07080078125, -9.4521484375, -7.83349609375, -6.21484375, -4.59619140625, -2.9775390625, -1.35888671875, 0.259765625, 1.87841796875, 3.4970703125, 5.11572265625, 6.734375, 8.35302734375, 9.9716796875, 11.59033203125, 13.208984375, 14.82763671875, 16.4462890625, 18.06494140625, 19.68359375, 21.30224609375, 22.9208984375, 24.53955078125, 26.158203125, 27.77685546875, 29.3955078125, 31.01416015625, 32.6328125, 34.25146484375, 35.8701171875, 37.48876953125, 39.107421875, 40.72607421875, 42.3447265625, 43.96337890625, 45.58203125, 47.20068359375, 48.8193359375, 50.43798828125, 52.056640625, 53.67529296875, 55.2939453125, 56.91259765625, 58.53125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 39.0, 119.0, 283.0, 292.0, 196.0, 58.0, 15.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.82781982421875, -153.701171875, -149.5745391845703, -145.44789123535156, -141.3212432861328, -137.19461059570312, -133.06796264648438, -128.94131469726562, -124.8146743774414, -120.68803405761719, -116.56138610839844, -112.43474578857422, -108.30810546875, -104.18145751953125, -100.05481719970703, -95.92817687988281, -91.80152893066406, -87.67488861083984, -83.5482406616211, -79.42160034179688, -75.29495239257812, -71.1683120727539, -67.04167175292969, -62.9150276184082, -58.78838348388672, -54.661739349365234, -50.53509521484375, -46.40845489501953, -42.28181076049805, -38.15516662597656, -34.028526306152344, -29.90188217163086, -25.775245666503906, -21.648601531982422, -17.52195930480957, -13.395316123962402, -9.268672943115234, -5.14202880859375, -1.0153865814208984, 3.111255645751953, 7.2378997802734375, 11.364542961120605, 15.491186141967773, 19.617828369140625, 23.74447250366211, 27.871116638183594, 31.997758865356445, 36.1244010925293, 40.25104522705078, 44.377689361572266, 48.50433349609375, 52.63097381591797, 56.75761795043945, 60.88426208496094, 65.01090240478516, 69.13754272460938, 73.26419067382812, 77.39083099365234, 81.5174789428711, 85.64411926269531, 89.77076721191406, 93.89740753173828, 98.0240478515625, 102.15069580078125, 106.27733612060547]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 13.0, 8.0, 10.0, 13.0, 12.0, 9.0, 17.0, 17.0, 26.0, 26.0, 22.0, 34.0, 21.0, 24.0, 27.0, 43.0, 40.0, 43.0, 44.0, 40.0, 41.0, 37.0, 41.0, 29.0, 39.0, 30.0, 31.0, 38.0, 21.0, 28.0, 25.0, 16.0, 16.0, 20.0, 21.0, 17.0, 15.0, 6.0, 8.0, 5.0, 4.0, 5.0, 6.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0], "bins": [-34.767486572265625, -33.76421356201172, -32.76093673706055, -31.75766372680664, -30.7543888092041, -29.751113891601562, -28.747840881347656, -27.744565963745117, -26.741291046142578, -25.73801612854004, -24.7347412109375, -23.731468200683594, -22.728193283081055, -21.724918365478516, -20.72164535522461, -19.71837043762207, -18.71509552001953, -17.711820602416992, -16.708545684814453, -15.705272674560547, -14.701997756958008, -13.698722839355469, -12.695448875427246, -11.692174911499023, -10.688899993896484, -9.685625076293945, -8.682351112365723, -7.679076671600342, -6.675802230834961, -5.67252779006958, -4.669253349304199, -3.6659789085388184, -2.6627044677734375, -1.6594300270080566, -0.6561555862426758, 0.3471188545227051, 1.350393295288086, 2.353667736053467, 3.3569421768188477, 4.3602166175842285, 5.363491058349609, 6.36676549911499, 7.370039939880371, 8.373313903808594, 9.376588821411133, 10.379863739013672, 11.383137702941895, 12.386411666870117, 13.389686584472656, 14.392961502075195, 15.396235466003418, 16.39950942993164, 17.40278434753418, 18.40605926513672, 19.409332275390625, 20.412607192993164, 21.415882110595703, 22.419157028198242, 23.42243194580078, 24.425704956054688, 25.428979873657227, 26.432254791259766, 27.435527801513672, 28.43880271911621, 29.44207763671875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 8.0, 14.0, 10.0, 18.0, 10.0, 11.0, 24.0, 13.0, 14.0, 22.0, 28.0, 33.0, 32.0, 25.0, 45.0, 30.0, 32.0, 28.0, 48.0, 51.0, 38.0, 45.0, 38.0, 39.0, 36.0, 27.0, 31.0, 33.0, 29.0, 24.0, 24.0, 19.0, 19.0, 22.0, 14.0, 14.0, 8.0, 5.0, 10.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6640625, -4.52130126953125, -4.3785400390625, -4.23577880859375, -4.093017578125, -3.95025634765625, -3.8074951171875, -3.66473388671875, -3.52197265625, -3.37921142578125, -3.2364501953125, -3.09368896484375, -2.950927734375, -2.80816650390625, -2.6654052734375, -2.52264404296875, -2.3798828125, -2.23712158203125, -2.0943603515625, -1.95159912109375, -1.808837890625, -1.66607666015625, -1.5233154296875, -1.38055419921875, -1.23779296875, -1.09503173828125, -0.9522705078125, -0.80950927734375, -0.666748046875, -0.52398681640625, -0.3812255859375, -0.23846435546875, -0.095703125, 0.04705810546875, 0.1898193359375, 0.33258056640625, 0.475341796875, 0.61810302734375, 0.7608642578125, 0.90362548828125, 1.04638671875, 1.18914794921875, 1.3319091796875, 1.47467041015625, 1.617431640625, 1.76019287109375, 1.9029541015625, 2.04571533203125, 2.1884765625, 2.33123779296875, 2.4739990234375, 2.61676025390625, 2.759521484375, 2.90228271484375, 3.0450439453125, 3.18780517578125, 3.33056640625, 3.47332763671875, 3.6160888671875, 3.75885009765625, 3.901611328125, 4.04437255859375, 4.1871337890625, 4.32989501953125, 4.47265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 6.0, 5.0, 21.0, 18.0, 29.0, 50.0, 63.0, 119.0, 155.0, 231.0, 336.0, 509.0, 746.0, 1054.0, 1539.0, 2248.0, 3133.0, 4511.0, 6489.0, 9149.0, 12777.0, 18294.0, 25891.0, 35920.0, 49496.0, 67828.0, 90511.0, 113610.0, 127368.0, 118567.0, 96438.0, 73323.0, 53765.0, 38904.0, 28007.0, 19988.0, 14222.0, 9924.0, 6997.0, 5073.0, 3532.0, 2352.0, 1767.0, 1129.0, 784.0, 541.0, 384.0, 250.0, 194.0, 123.0, 71.0, 45.0, 28.0, 21.0, 12.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.495361328125, -0.4786415100097656, -0.46192169189453125, -0.4452018737792969, -0.4284820556640625, -0.4117622375488281, -0.39504241943359375, -0.3783226013183594, -0.361602783203125, -0.3448829650878906, -0.32816314697265625, -0.3114433288574219, -0.2947235107421875, -0.2780036926269531, -0.26128387451171875, -0.24456405639648438, -0.22784423828125, -0.21112442016601562, -0.19440460205078125, -0.17768478393554688, -0.1609649658203125, -0.14424514770507812, -0.12752532958984375, -0.11080551147460938, -0.094085693359375, -0.07736587524414062, -0.06064605712890625, -0.043926239013671875, -0.0272064208984375, -0.010486602783203125, 0.00623321533203125, 0.022953033447265625, 0.0396728515625, 0.056392669677734375, 0.07311248779296875, 0.08983230590820312, 0.1065521240234375, 0.12327194213867188, 0.13999176025390625, 0.15671157836914062, 0.173431396484375, 0.19015121459960938, 0.20687103271484375, 0.22359085083007812, 0.2403106689453125, 0.2570304870605469, 0.27375030517578125, 0.2904701232910156, 0.30718994140625, 0.3239097595214844, 0.34062957763671875, 0.3573493957519531, 0.3740692138671875, 0.3907890319824219, 0.40750885009765625, 0.4242286682128906, 0.440948486328125, 0.4576683044433594, 0.47438812255859375, 0.4911079406738281, 0.5078277587890625, 0.5245475769042969, 0.5412673950195312, 0.5579872131347656, 0.57470703125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 10.0, 13.0, 12.0, 12.0, 18.0, 17.0, 30.0, 29.0, 23.0, 36.0, 32.0, 28.0, 44.0, 38.0, 44.0, 41.0, 1055.0, 46.0, 43.0, 44.0, 38.0, 49.0, 34.0, 33.0, 28.0, 28.0, 34.0, 31.0, 12.0, 25.0, 18.0, 18.0, 11.0, 9.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.271484375, -3.16900634765625, -3.0665283203125, -2.96405029296875, -2.861572265625, -2.75909423828125, -2.6566162109375, -2.55413818359375, -2.45166015625, -2.34918212890625, -2.2467041015625, -2.14422607421875, -2.041748046875, -1.93927001953125, -1.8367919921875, -1.73431396484375, -1.6318359375, -1.52935791015625, -1.4268798828125, -1.32440185546875, -1.221923828125, -1.11944580078125, -1.0169677734375, -0.91448974609375, -0.81201171875, -0.70953369140625, -0.6070556640625, -0.50457763671875, -0.402099609375, -0.29962158203125, -0.1971435546875, -0.09466552734375, 0.0078125, 0.11029052734375, 0.2127685546875, 0.31524658203125, 0.417724609375, 0.52020263671875, 0.6226806640625, 0.72515869140625, 0.82763671875, 0.93011474609375, 1.0325927734375, 1.13507080078125, 1.237548828125, 1.34002685546875, 1.4425048828125, 1.54498291015625, 1.6474609375, 1.74993896484375, 1.8524169921875, 1.95489501953125, 2.057373046875, 2.15985107421875, 2.2623291015625, 2.36480712890625, 2.46728515625, 2.56976318359375, 2.6722412109375, 2.77471923828125, 2.877197265625, 2.97967529296875, 3.0821533203125, 3.18463134765625, 3.287109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 17.0, 30.0, 43.0, 52.0, 86.0, 127.0, 195.0, 256.0, 459.0, 625.0, 1021.0, 1470.0, 2337.0, 3584.0, 5529.0, 8555.0, 13170.0, 20573.0, 31332.0, 47700.0, 70470.0, 99762.0, 132492.0, 1197668.0, 137619.0, 103952.0, 73744.0, 49862.0, 32962.0, 21531.0, 14023.0, 9154.0, 5771.0, 3781.0, 2457.0, 1599.0, 1041.0, 752.0, 420.0, 288.0, 197.0, 137.0, 85.0, 72.0, 42.0, 27.0, 19.0, 14.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0], "bins": [-0.374755859375, -0.3632469177246094, -0.35173797607421875, -0.3402290344238281, -0.3287200927734375, -0.3172111511230469, -0.30570220947265625, -0.2941932678222656, -0.282684326171875, -0.2711753845214844, -0.25966644287109375, -0.24815750122070312, -0.2366485595703125, -0.22513961791992188, -0.21363067626953125, -0.20212173461914062, -0.19061279296875, -0.17910385131835938, -0.16759490966796875, -0.15608596801757812, -0.1445770263671875, -0.13306808471679688, -0.12155914306640625, -0.11005020141601562, -0.098541259765625, -0.08703231811523438, -0.07552337646484375, -0.06401443481445312, -0.0525054931640625, -0.040996551513671875, -0.02948760986328125, -0.017978668212890625, -0.0064697265625, 0.005039215087890625, 0.01654815673828125, 0.028057098388671875, 0.0395660400390625, 0.051074981689453125, 0.06258392333984375, 0.07409286499023438, 0.085601806640625, 0.09711074829101562, 0.10861968994140625, 0.12012863159179688, 0.1316375732421875, 0.14314651489257812, 0.15465545654296875, 0.16616439819335938, 0.17767333984375, 0.18918228149414062, 0.20069122314453125, 0.21220016479492188, 0.2237091064453125, 0.23521804809570312, 0.24672698974609375, 0.2582359313964844, 0.269744873046875, 0.2812538146972656, 0.29276275634765625, 0.3042716979980469, 0.3157806396484375, 0.3272895812988281, 0.33879852294921875, 0.3503074645996094, 0.36181640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 3.0, 4.0, 6.0, 7.0, 14.0, 5.0, 11.0, 18.0, 19.0, 25.0, 35.0, 58.0, 77.0, 76.0, 146.0, 123.0, 75.0, 63.0, 48.0, 36.0, 25.0, 25.0, 12.0, 16.0, 14.0, 11.0, 7.0, 5.0, 8.0, 2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0168914794921875, -0.016360044479370117, -0.015828609466552734, -0.015297174453735352, -0.014765739440917969, -0.014234304428100586, -0.013702869415283203, -0.01317143440246582, -0.012639999389648438, -0.012108564376831055, -0.011577129364013672, -0.011045694351196289, -0.010514259338378906, -0.009982824325561523, -0.00945138931274414, -0.008919954299926758, -0.008388519287109375, -0.007857084274291992, -0.007325649261474609, -0.0067942142486572266, -0.006262779235839844, -0.005731344223022461, -0.005199909210205078, -0.004668474197387695, -0.0041370391845703125, -0.0036056041717529297, -0.003074169158935547, -0.002542734146118164, -0.0020112991333007812, -0.0014798641204833984, -0.0009484291076660156, -0.0004169940948486328, 0.00011444091796875, 0.0006458759307861328, 0.0011773109436035156, 0.0017087459564208984, 0.0022401809692382812, 0.002771615982055664, 0.003303050994873047, 0.0038344860076904297, 0.0043659210205078125, 0.004897356033325195, 0.005428791046142578, 0.005960226058959961, 0.006491661071777344, 0.0070230960845947266, 0.007554531097412109, 0.008085966110229492, 0.008617401123046875, 0.009148836135864258, 0.00968027114868164, 0.010211706161499023, 0.010743141174316406, 0.011274576187133789, 0.011806011199951172, 0.012337446212768555, 0.012868881225585938, 0.01340031623840332, 0.013931751251220703, 0.014463186264038086, 0.014994621276855469, 0.015526056289672852, 0.016057491302490234, 0.016588926315307617, 0.017120361328125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 7.0, 6.0, 10.0, 6.0, 23.0, 17.0, 14.0, 29.0, 38.0, 50.0, 89.0, 160.0, 256.0, 948.0, 46477.0, 994587.0, 4823.0, 468.0, 204.0, 91.0, 61.0, 35.0, 35.0, 23.0, 18.0, 13.0, 10.0, 6.0, 10.0, 7.0, 6.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33837890625, -0.3278923034667969, -0.31740570068359375, -0.3069190979003906, -0.2964324951171875, -0.2859458923339844, -0.27545928955078125, -0.2649726867675781, -0.254486083984375, -0.24399948120117188, -0.23351287841796875, -0.22302627563476562, -0.2125396728515625, -0.20205307006835938, -0.19156646728515625, -0.18107986450195312, -0.17059326171875, -0.16010665893554688, -0.14962005615234375, -0.13913345336914062, -0.1286468505859375, -0.11816024780273438, -0.10767364501953125, -0.09718704223632812, -0.086700439453125, -0.07621383666992188, -0.06572723388671875, -0.055240631103515625, -0.0447540283203125, -0.034267425537109375, -0.02378082275390625, -0.013294219970703125, -0.0028076171875, 0.007678985595703125, 0.01816558837890625, 0.028652191162109375, 0.0391387939453125, 0.049625396728515625, 0.06011199951171875, 0.07059860229492188, 0.081085205078125, 0.09157180786132812, 0.10205841064453125, 0.11254501342773438, 0.1230316162109375, 0.13351821899414062, 0.14400482177734375, 0.15449142456054688, 0.16497802734375, 0.17546463012695312, 0.18595123291015625, 0.19643783569335938, 0.2069244384765625, 0.21741104125976562, 0.22789764404296875, 0.23838424682617188, 0.248870849609375, 0.2593574523925781, 0.26984405517578125, 0.2803306579589844, 0.2908172607421875, 0.3013038635253906, 0.31179046630859375, 0.3222770690917969, 0.332763671875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 9.0, 317.0, 681.0, 11.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5163511037826538, -0.5073102712631226, -0.49826937913894653, -0.4892285466194153, -0.48018768429756165, -0.471146821975708, -0.46210595965385437, -0.45306509733200073, -0.4440242648124695, -0.43498340249061584, -0.4259425401687622, -0.41690170764923096, -0.4078608453273773, -0.3988199830055237, -0.38977912068367004, -0.3807382583618164, -0.37169742584228516, -0.3626565635204315, -0.3536157011985779, -0.34457486867904663, -0.335534006357193, -0.32649314403533936, -0.3174522817134857, -0.3084114193916321, -0.29937055706977844, -0.2903296947479248, -0.28128883242607117, -0.2722479999065399, -0.2632071375846863, -0.25416627526283264, -0.245125412940979, -0.23608456552028656, -0.22704371809959412, -0.21800285577774048, -0.20896200835704803, -0.1999211460351944, -0.19088029861450195, -0.18183943629264832, -0.17279857397079468, -0.16375772655010223, -0.1547168791294098, -0.14567601680755615, -0.1366351693868637, -0.12759430706501007, -0.11855345964431763, -0.10951259732246399, -0.10047174245119095, -0.09143088757991791, -0.08239003270864487, -0.07334917783737183, -0.06430832296609879, -0.055267464369535446, -0.046226609498262405, -0.037185754626989365, -0.028144896030426025, -0.019104041159152985, -0.010063186287879944, -0.0010223304852843285, 0.008018525317311287, 0.017059382051229477, 0.026100236922502518, 0.03514109179377556, 0.0441819503903389, 0.05322280526161194, 0.06226366013288498]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 13.0, 12.0, 22.0, 23.0, 25.0, 22.0, 31.0, 29.0, 31.0, 37.0, 33.0, 34.0, 43.0, 29.0, 36.0, 39.0, 42.0, 34.0, 33.0, 42.0, 39.0, 43.0, 32.0, 41.0, 38.0, 25.0, 23.0, 13.0, 21.0, 16.0, 4.0, 16.0, 12.0, 9.0, 4.0, 6.0, 3.0, 0.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.020860910415649414, -0.020134367048740387, -0.01940782181918621, -0.018681276589632034, -0.017954733222723007, -0.01722818985581398, -0.016501644626259804, -0.015775099396705627, -0.0150485560297966, -0.014322011731564999, -0.013595467433333397, -0.012868923135101795, -0.012142378836870193, -0.011415834538638592, -0.01068929024040699, -0.009962745942175388, -0.009236201643943787, -0.008509657345712185, -0.007783113047480583, -0.0070565687492489815, -0.00633002445101738, -0.005603480152785778, -0.004876935854554176, -0.004150391556322575, -0.003423847258090973, -0.002697302959859371, -0.0019707586616277695, -0.0012442143633961678, -0.000517670065164566, 0.00020887423306703568, 0.0009354185312986374, 0.001661962829530239, 0.002388507127761841, 0.0031150514259934425, 0.0038415957242250443, 0.004568140022456646, 0.005294684320688248, 0.006021228618919849, 0.006747772917151451, 0.007474317215383053, 0.008200861513614655, 0.008927405811846256, 0.009653950110077858, 0.01038049440830946, 0.011107038706541061, 0.011833583004772663, 0.012560127303004265, 0.013286671601235867, 0.014013215899467468, 0.01473976019769907, 0.015466304495930672, 0.016192849725484848, 0.016919393092393875, 0.017645936459302902, 0.01837248168885708, 0.019099026918411255, 0.019825570285320282, 0.02055211365222931, 0.021278658881783485, 0.022005204111337662, 0.02273174747824669, 0.023458290845155716, 0.024184836074709892, 0.02491138130426407, 0.025637924671173096]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 8.0, 14.0, 10.0, 18.0, 10.0, 11.0, 24.0, 13.0, 14.0, 22.0, 28.0, 34.0, 31.0, 25.0, 45.0, 30.0, 32.0, 28.0, 48.0, 51.0, 38.0, 45.0, 38.0, 39.0, 35.0, 28.0, 32.0, 32.0, 30.0, 23.0, 24.0, 20.0, 18.0, 22.0, 14.0, 14.0, 8.0, 5.0, 11.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6640625, -4.52130126953125, -4.3785400390625, -4.23577880859375, -4.093017578125, -3.95025634765625, -3.8074951171875, -3.66473388671875, -3.52197265625, -3.37921142578125, -3.2364501953125, -3.09368896484375, -2.950927734375, -2.80816650390625, -2.6654052734375, -2.52264404296875, -2.3798828125, -2.23712158203125, -2.0943603515625, -1.95159912109375, -1.808837890625, -1.66607666015625, -1.5233154296875, -1.38055419921875, -1.23779296875, -1.09503173828125, -0.9522705078125, -0.80950927734375, -0.666748046875, -0.52398681640625, -0.3812255859375, -0.23846435546875, -0.095703125, 0.04705810546875, 0.1898193359375, 0.33258056640625, 0.475341796875, 0.61810302734375, 0.7608642578125, 0.90362548828125, 1.04638671875, 1.18914794921875, 1.3319091796875, 1.47467041015625, 1.617431640625, 1.76019287109375, 1.9029541015625, 2.04571533203125, 2.1884765625, 2.33123779296875, 2.4739990234375, 2.61676025390625, 2.759521484375, 2.90228271484375, 3.0450439453125, 3.18780517578125, 3.33056640625, 3.47332763671875, 3.6160888671875, 3.75885009765625, 3.901611328125, 4.04437255859375, 4.1871337890625, 4.32989501953125, 4.47265625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 13.0, 9.0, 25.0, 44.0, 88.0, 166.0, 330.0, 648.0, 1399.0, 2968.0, 6047.0, 13469.0, 33862.0, 99711.0, 356863.0, 370493.0, 102304.0, 34407.0, 13651.0, 6335.0, 2928.0, 1441.0, 670.0, 329.0, 173.0, 83.0, 42.0, 16.0, 16.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7265625, -4.55157470703125, -4.3765869140625, -4.20159912109375, -4.026611328125, -3.85162353515625, -3.6766357421875, -3.50164794921875, -3.32666015625, -3.15167236328125, -2.9766845703125, -2.80169677734375, -2.626708984375, -2.45172119140625, -2.2767333984375, -2.10174560546875, -1.9267578125, -1.75177001953125, -1.5767822265625, -1.40179443359375, -1.226806640625, -1.05181884765625, -0.8768310546875, -0.70184326171875, -0.52685546875, -0.35186767578125, -0.1768798828125, -0.00189208984375, 0.173095703125, 0.34808349609375, 0.5230712890625, 0.69805908203125, 0.873046875, 1.04803466796875, 1.2230224609375, 1.39801025390625, 1.572998046875, 1.74798583984375, 1.9229736328125, 2.09796142578125, 2.27294921875, 2.44793701171875, 2.6229248046875, 2.79791259765625, 2.972900390625, 3.14788818359375, 3.3228759765625, 3.49786376953125, 3.6728515625, 3.84783935546875, 4.0228271484375, 4.19781494140625, 4.372802734375, 4.54779052734375, 4.7227783203125, 4.89776611328125, 5.07275390625, 5.24774169921875, 5.4227294921875, 5.59771728515625, 5.772705078125, 5.94769287109375, 6.1226806640625, 6.29766845703125, 6.47265625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 9.0, 8.0, 9.0, 8.0, 18.0, 13.0, 13.0, 17.0, 21.0, 18.0, 28.0, 26.0, 35.0, 32.0, 33.0, 42.0, 57.0, 50.0, 96.0, 222.0, 1518.0, 242.0, 84.0, 45.0, 55.0, 33.0, 35.0, 38.0, 20.0, 19.0, 35.0, 33.0, 23.0, 15.0, 21.0, 13.0, 11.0, 10.0, 4.0, 8.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0], "bins": [-16.296875, -15.8250732421875, -15.353271484375, -14.8814697265625, -14.40966796875, -13.9378662109375, -13.466064453125, -12.9942626953125, -12.5224609375, -12.0506591796875, -11.578857421875, -11.1070556640625, -10.63525390625, -10.1634521484375, -9.691650390625, -9.2198486328125, -8.748046875, -8.2762451171875, -7.804443359375, -7.3326416015625, -6.86083984375, -6.3890380859375, -5.917236328125, -5.4454345703125, -4.9736328125, -4.5018310546875, -4.030029296875, -3.5582275390625, -3.08642578125, -2.6146240234375, -2.142822265625, -1.6710205078125, -1.19921875, -0.7274169921875, -0.255615234375, 0.2161865234375, 0.68798828125, 1.1597900390625, 1.631591796875, 2.1033935546875, 2.5751953125, 3.0469970703125, 3.518798828125, 3.9906005859375, 4.46240234375, 4.9342041015625, 5.406005859375, 5.8778076171875, 6.349609375, 6.8214111328125, 7.293212890625, 7.7650146484375, 8.23681640625, 8.7086181640625, 9.180419921875, 9.6522216796875, 10.1240234375, 10.5958251953125, 11.067626953125, 11.5394287109375, 12.01123046875, 12.4830322265625, 12.954833984375, 13.4266357421875, 13.8984375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 7.0, 4.0, 6.0, 10.0, 10.0, 11.0, 17.0, 37.0, 25.0, 40.0, 51.0, 72.0, 81.0, 120.0, 158.0, 214.0, 313.0, 835.0, 5217.0, 1779648.0, 1351998.0, 4782.0, 777.0, 404.0, 230.0, 140.0, 133.0, 85.0, 60.0, 41.0, 38.0, 36.0, 18.0, 19.0, 19.0, 9.0, 12.0, 6.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.25, -31.970703125, -30.69140625, -29.412109375, -28.1328125, -26.853515625, -25.57421875, -24.294921875, -23.015625, -21.736328125, -20.45703125, -19.177734375, -17.8984375, -16.619140625, -15.33984375, -14.060546875, -12.78125, -11.501953125, -10.22265625, -8.943359375, -7.6640625, -6.384765625, -5.10546875, -3.826171875, -2.546875, -1.267578125, 0.01171875, 1.291015625, 2.5703125, 3.849609375, 5.12890625, 6.408203125, 7.6875, 8.966796875, 10.24609375, 11.525390625, 12.8046875, 14.083984375, 15.36328125, 16.642578125, 17.921875, 19.201171875, 20.48046875, 21.759765625, 23.0390625, 24.318359375, 25.59765625, 26.876953125, 28.15625, 29.435546875, 30.71484375, 31.994140625, 33.2734375, 34.552734375, 35.83203125, 37.111328125, 38.390625, 39.669921875, 40.94921875, 42.228515625, 43.5078125, 44.787109375, 46.06640625, 47.345703125, 48.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 9.0, 237.0, 651.0, 117.0, 4.0], "bins": [-242.23150634765625, -238.28182983398438, -234.33216857910156, -230.3824920654297, -226.43283081054688, -222.483154296875, -218.5334930419922, -214.5838165283203, -210.6341552734375, -206.68447875976562, -202.7348175048828, -198.78514099121094, -194.83547973632812, -190.88580322265625, -186.93614196777344, -182.98646545410156, -179.0367889404297, -175.0871124267578, -171.137451171875, -167.18777465820312, -163.2381134033203, -159.28843688964844, -155.33877563476562, -151.38909912109375, -147.43942260742188, -143.48974609375, -139.5400848388672, -135.5904083251953, -131.6407470703125, -127.69107055664062, -123.74140167236328, -119.79173278808594, -115.8420639038086, -111.89239501953125, -107.9427261352539, -103.99305725097656, -100.04338073730469, -96.09371948242188, -92.14404296875, -88.19437408447266, -84.24470520019531, -80.29503631591797, -76.34536743164062, -72.39569854736328, -68.44602966308594, -64.49635314941406, -60.54668426513672, -56.597015380859375, -52.64734649658203, -48.69767761230469, -44.748008728027344, -40.798336029052734, -36.84866714477539, -32.89899826049805, -28.94932746887207, -24.999656677246094, -21.04998779296875, -17.100318908691406, -13.15064811706543, -9.20097827911377, -5.251308441162109, -1.3016395568847656, 2.648031234741211, 6.5977020263671875, 10.547369956970215]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 9.0, 3.0, 5.0, 7.0, 11.0, 11.0, 9.0, 18.0, 10.0, 19.0, 19.0, 20.0, 22.0, 16.0, 31.0, 33.0, 30.0, 27.0, 34.0, 28.0, 46.0, 39.0, 41.0, 36.0, 52.0, 30.0, 34.0, 34.0, 20.0, 41.0, 26.0, 28.0, 27.0, 37.0, 10.0, 23.0, 18.0, 13.0, 13.0, 13.0, 9.0, 9.0, 8.0, 11.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.9173583984375, -36.764320373535156, -35.61128234863281, -34.45824432373047, -33.305206298828125, -32.15216827392578, -30.999128341674805, -29.846088409423828, -28.693050384521484, -27.54001235961914, -26.386974334716797, -25.233936309814453, -24.080896377563477, -22.927858352661133, -21.77482032775879, -20.621780395507812, -19.4687442779541, -18.315706253051758, -17.162668228149414, -16.009628295898438, -14.856590270996094, -13.70355224609375, -12.550514221191406, -11.397475242614746, -10.244437217712402, -9.091399192810059, -7.938360214233398, -6.785322189331055, -5.632283687591553, -4.479245185852051, -3.326207160949707, -2.173168182373047, -1.0201301574707031, 0.13290822505950928, 1.2859466075897217, 2.4389848709106445, 3.5920233726501465, 4.745061874389648, 5.898099899291992, 7.051138877868652, 8.204176902770996, 9.35721492767334, 10.51025390625, 11.663291931152344, 12.816329956054688, 13.969368934631348, 15.122406959533691, 16.27544593811035, 17.428483963012695, 18.58152198791504, 19.734560012817383, 20.88759994506836, 22.040637969970703, 23.193675994873047, 24.34671401977539, 25.499752044677734, 26.652790069580078, 27.805828094482422, 28.958866119384766, 30.11190414428711, 31.264944076538086, 32.41798400878906, 33.571022033691406, 34.72406005859375, 35.877098083496094]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 6.0, 3.0, 8.0, 11.0, 17.0, 7.0, 15.0, 13.0, 12.0, 24.0, 20.0, 20.0, 34.0, 34.0, 35.0, 37.0, 29.0, 34.0, 34.0, 46.0, 42.0, 33.0, 38.0, 48.0, 41.0, 38.0, 27.0, 23.0, 36.0, 28.0, 34.0, 27.0, 23.0, 16.0, 16.0, 16.0, 14.0, 10.0, 13.0, 8.0, 9.0, 5.0, 1.0, 3.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.76165771484375, -4.6092529296875, -4.45684814453125, -4.304443359375, -4.15203857421875, -3.9996337890625, -3.84722900390625, -3.69482421875, -3.54241943359375, -3.3900146484375, -3.23760986328125, -3.085205078125, -2.93280029296875, -2.7803955078125, -2.62799072265625, -2.4755859375, -2.32318115234375, -2.1707763671875, -2.01837158203125, -1.865966796875, -1.71356201171875, -1.5611572265625, -1.40875244140625, -1.25634765625, -1.10394287109375, -0.9515380859375, -0.79913330078125, -0.646728515625, -0.49432373046875, -0.3419189453125, -0.18951416015625, -0.037109375, 0.11529541015625, 0.2677001953125, 0.42010498046875, 0.572509765625, 0.72491455078125, 0.8773193359375, 1.02972412109375, 1.18212890625, 1.33453369140625, 1.4869384765625, 1.63934326171875, 1.791748046875, 1.94415283203125, 2.0965576171875, 2.24896240234375, 2.4013671875, 2.55377197265625, 2.7061767578125, 2.85858154296875, 3.010986328125, 3.16339111328125, 3.3157958984375, 3.46820068359375, 3.62060546875, 3.77301025390625, 3.9254150390625, 4.07781982421875, 4.230224609375, 4.38262939453125, 4.5350341796875, 4.68743896484375, 4.83984375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 4.0, 9.0, 13.0, 11.0, 10.0, 23.0, 20.0, 27.0, 30.0, 40.0, 60.0, 88.0, 133.0, 257.0, 578.0, 1630.0, 5489.0, 27364.0, 273754.0, 2772200.0, 1026867.0, 70013.0, 11054.0, 2795.0, 946.0, 348.0, 169.0, 88.0, 54.0, 41.0, 36.0, 24.0, 17.0, 17.0, 17.0, 14.0, 9.0, 11.0, 2.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0703125, -14.5953369140625, -14.120361328125, -13.6453857421875, -13.17041015625, -12.6954345703125, -12.220458984375, -11.7454833984375, -11.2705078125, -10.7955322265625, -10.320556640625, -9.8455810546875, -9.37060546875, -8.8956298828125, -8.420654296875, -7.9456787109375, -7.470703125, -6.9957275390625, -6.520751953125, -6.0457763671875, -5.57080078125, -5.0958251953125, -4.620849609375, -4.1458740234375, -3.6708984375, -3.1959228515625, -2.720947265625, -2.2459716796875, -1.77099609375, -1.2960205078125, -0.821044921875, -0.3460693359375, 0.12890625, 0.6038818359375, 1.078857421875, 1.5538330078125, 2.02880859375, 2.5037841796875, 2.978759765625, 3.4537353515625, 3.9287109375, 4.4036865234375, 4.878662109375, 5.3536376953125, 5.82861328125, 6.3035888671875, 6.778564453125, 7.2535400390625, 7.728515625, 8.2034912109375, 8.678466796875, 9.1534423828125, 9.62841796875, 10.1033935546875, 10.578369140625, 11.0533447265625, 11.5283203125, 12.0032958984375, 12.478271484375, 12.9532470703125, 13.42822265625, 13.9031982421875, 14.378173828125, 14.8531494140625, 15.328125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 6.0, 8.0, 18.0, 12.0, 12.0, 30.0, 33.0, 47.0, 46.0, 74.0, 85.0, 120.0, 148.0, 191.0, 241.0, 358.0, 395.0, 460.0, 373.0, 331.0, 271.0, 225.0, 130.0, 106.0, 83.0, 56.0, 42.0, 49.0, 33.0, 14.0, 22.0, 11.0, 17.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.015625, -9.72509765625, -9.4345703125, -9.14404296875, -8.853515625, -8.56298828125, -8.2724609375, -7.98193359375, -7.69140625, -7.40087890625, -7.1103515625, -6.81982421875, -6.529296875, -6.23876953125, -5.9482421875, -5.65771484375, -5.3671875, -5.07666015625, -4.7861328125, -4.49560546875, -4.205078125, -3.91455078125, -3.6240234375, -3.33349609375, -3.04296875, -2.75244140625, -2.4619140625, -2.17138671875, -1.880859375, -1.59033203125, -1.2998046875, -1.00927734375, -0.71875, -0.42822265625, -0.1376953125, 0.15283203125, 0.443359375, 0.73388671875, 1.0244140625, 1.31494140625, 1.60546875, 1.89599609375, 2.1865234375, 2.47705078125, 2.767578125, 3.05810546875, 3.3486328125, 3.63916015625, 3.9296875, 4.22021484375, 4.5107421875, 4.80126953125, 5.091796875, 5.38232421875, 5.6728515625, 5.96337890625, 6.25390625, 6.54443359375, 6.8349609375, 7.12548828125, 7.416015625, 7.70654296875, 7.9970703125, 8.28759765625, 8.578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 20.0, 17.0, 27.0, 28.0, 58.0, 56.0, 69.0, 103.0, 167.0, 217.0, 350.0, 625.0, 4988.0, 395007.0, 3751272.0, 38318.0, 1470.0, 451.0, 283.0, 195.0, 137.0, 100.0, 82.0, 60.0, 33.0, 39.0, 22.0, 21.0, 14.0, 11.0, 6.0, 9.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.84375, -39.4482421875, -38.052734375, -36.6572265625, -35.26171875, -33.8662109375, -32.470703125, -31.0751953125, -29.6796875, -28.2841796875, -26.888671875, -25.4931640625, -24.09765625, -22.7021484375, -21.306640625, -19.9111328125, -18.515625, -17.1201171875, -15.724609375, -14.3291015625, -12.93359375, -11.5380859375, -10.142578125, -8.7470703125, -7.3515625, -5.9560546875, -4.560546875, -3.1650390625, -1.76953125, -0.3740234375, 1.021484375, 2.4169921875, 3.8125, 5.2080078125, 6.603515625, 7.9990234375, 9.39453125, 10.7900390625, 12.185546875, 13.5810546875, 14.9765625, 16.3720703125, 17.767578125, 19.1630859375, 20.55859375, 21.9541015625, 23.349609375, 24.7451171875, 26.140625, 27.5361328125, 28.931640625, 30.3271484375, 31.72265625, 33.1181640625, 34.513671875, 35.9091796875, 37.3046875, 38.7001953125, 40.095703125, 41.4912109375, 42.88671875, 44.2822265625, 45.677734375, 47.0732421875, 48.46875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 34.0, 33.0, 49.0, 78.0, 79.0, 111.0, 132.0, 129.0, 81.0, 96.0, 58.0, 54.0, 29.0, 14.0, 7.0, 10.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-74.3153076171875, -72.82379150390625, -71.33228302001953, -69.84076690673828, -68.34925842285156, -66.85774230957031, -65.36622619628906, -63.87471389770508, -62.383201599121094, -60.89168930053711, -59.400177001953125, -57.908660888671875, -56.41714859008789, -54.925636291503906, -53.434120178222656, -51.94260787963867, -50.45109558105469, -48.9595832824707, -47.46807098388672, -45.97655487060547, -44.485042572021484, -42.9935302734375, -41.50201416015625, -40.010501861572266, -38.51898956298828, -37.0274772644043, -35.53596496582031, -34.04444885253906, -32.55293655395508, -31.061424255371094, -29.569910049438477, -28.07839584350586, -26.586883544921875, -25.09537124633789, -23.603857040405273, -22.112342834472656, -20.620830535888672, -19.129318237304688, -17.63780403137207, -16.146289825439453, -14.654777526855469, -13.163264274597168, -11.671751022338867, -10.180237770080566, -8.688724517822266, -7.197211265563965, -5.705698013305664, -4.214184761047363, -2.7226715087890625, -1.2311582565307617, 0.26035499572753906, 1.7518682479858398, 3.2433815002441406, 4.734894752502441, 6.226408004760742, 7.717921257019043, 9.209434509277344, 10.700947761535645, 12.192461013793945, 13.683974266052246, 15.175487518310547, 16.66699981689453, 18.15851402282715, 19.650028228759766, 21.14154052734375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 9.0, 9.0, 13.0, 10.0, 20.0, 16.0, 21.0, 18.0, 31.0, 33.0, 24.0, 39.0, 30.0, 42.0, 46.0, 38.0, 43.0, 46.0, 45.0, 50.0, 49.0, 32.0, 26.0, 38.0, 29.0, 40.0, 29.0, 19.0, 23.0, 26.0, 25.0, 14.0, 17.0, 11.0, 8.0, 7.0, 10.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.44563293457031, -32.433616638183594, -31.421598434448242, -30.40958023071289, -29.397563934326172, -28.38554573059082, -27.37352752685547, -26.36151123046875, -25.3494930267334, -24.337474822998047, -23.325458526611328, -22.313440322875977, -21.301422119140625, -20.289405822753906, -19.277387619018555, -18.265369415283203, -17.253353118896484, -16.241334915161133, -15.229318618774414, -14.217300415039062, -13.205283164978027, -12.193265914916992, -11.18124771118164, -10.169230461120605, -9.15721321105957, -8.145195960998535, -7.133178234100342, -6.121160507202148, -5.109143257141113, -4.097126007080078, -3.0851082801818848, -2.0730905532836914, -1.0610733032226562, -0.04905581474304199, 0.9629616737365723, 1.9749791622161865, 2.986996650695801, 3.999013900756836, 5.011031627655029, 6.023049354553223, 7.035066604614258, 8.047083854675293, 9.059101104736328, 10.07111930847168, 11.083136558532715, 12.09515380859375, 13.107172012329102, 14.119189262390137, 15.131206512451172, 16.143224716186523, 17.155241012573242, 18.167259216308594, 19.179275512695312, 20.191293716430664, 21.203311920166016, 22.215328216552734, 23.227346420288086, 24.239364624023438, 25.251380920410156, 26.263399124145508, 27.27541732788086, 28.287433624267578, 29.29945182800293, 30.31147003173828, 31.323486328125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 8.0, 8.0, 9.0, 6.0, 6.0, 21.0, 13.0, 18.0, 18.0, 18.0, 13.0, 25.0, 21.0, 14.0, 30.0, 29.0, 30.0, 34.0, 34.0, 40.0, 40.0, 34.0, 44.0, 39.0, 41.0, 43.0, 37.0, 30.0, 44.0, 40.0, 38.0, 25.0, 18.0, 24.0, 23.0, 18.0, 14.0, 8.0, 12.0, 5.0, 9.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.046875, -4.89508056640625, -4.7432861328125, -4.59149169921875, -4.439697265625, -4.28790283203125, -4.1361083984375, -3.98431396484375, -3.83251953125, -3.68072509765625, -3.5289306640625, -3.37713623046875, -3.225341796875, -3.07354736328125, -2.9217529296875, -2.76995849609375, -2.6181640625, -2.46636962890625, -2.3145751953125, -2.16278076171875, -2.010986328125, -1.85919189453125, -1.7073974609375, -1.55560302734375, -1.40380859375, -1.25201416015625, -1.1002197265625, -0.94842529296875, -0.796630859375, -0.64483642578125, -0.4930419921875, -0.34124755859375, -0.189453125, -0.03765869140625, 0.1141357421875, 0.26593017578125, 0.417724609375, 0.56951904296875, 0.7213134765625, 0.87310791015625, 1.02490234375, 1.17669677734375, 1.3284912109375, 1.48028564453125, 1.632080078125, 1.78387451171875, 1.9356689453125, 2.08746337890625, 2.2392578125, 2.39105224609375, 2.5428466796875, 2.69464111328125, 2.846435546875, 2.99822998046875, 3.1500244140625, 3.30181884765625, 3.45361328125, 3.60540771484375, 3.7572021484375, 3.90899658203125, 4.060791015625, 4.21258544921875, 4.3643798828125, 4.51617431640625, 4.66796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 13.0, 16.0, 24.0, 39.0, 56.0, 93.0, 142.0, 187.0, 293.0, 495.0, 715.0, 1200.0, 1804.0, 2806.0, 4233.0, 6633.0, 10312.0, 15920.0, 24521.0, 37267.0, 54953.0, 79737.0, 111304.0, 143236.0, 151016.0, 123353.0, 90606.0, 63144.0, 42541.0, 28439.0, 18940.0, 12188.0, 8055.0, 5069.0, 3220.0, 2133.0, 1327.0, 875.0, 583.0, 370.0, 250.0, 156.0, 111.0, 60.0, 44.0, 25.0, 10.0, 8.0, 12.0, 6.0, 5.0, 3.0, 5.0, 2.0], "bins": [-0.7109375, -0.6901397705078125, -0.669342041015625, -0.6485443115234375, -0.62774658203125, -0.6069488525390625, -0.586151123046875, -0.5653533935546875, -0.5445556640625, -0.5237579345703125, -0.502960205078125, -0.4821624755859375, -0.46136474609375, -0.4405670166015625, -0.419769287109375, -0.3989715576171875, -0.378173828125, -0.3573760986328125, -0.336578369140625, -0.3157806396484375, -0.29498291015625, -0.2741851806640625, -0.253387451171875, -0.2325897216796875, -0.2117919921875, -0.1909942626953125, -0.170196533203125, -0.1493988037109375, -0.12860107421875, -0.1078033447265625, -0.087005615234375, -0.0662078857421875, -0.04541015625, -0.0246124267578125, -0.003814697265625, 0.0169830322265625, 0.03778076171875, 0.0585784912109375, 0.079376220703125, 0.1001739501953125, 0.1209716796875, 0.1417694091796875, 0.162567138671875, 0.1833648681640625, 0.20416259765625, 0.2249603271484375, 0.245758056640625, 0.2665557861328125, 0.287353515625, 0.3081512451171875, 0.328948974609375, 0.3497467041015625, 0.37054443359375, 0.3913421630859375, 0.412139892578125, 0.4329376220703125, 0.4537353515625, 0.4745330810546875, 0.495330810546875, 0.5161285400390625, 0.53692626953125, 0.5577239990234375, 0.578521728515625, 0.5993194580078125, 0.6201171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 7.0, 7.0, 12.0, 17.0, 13.0, 22.0, 18.0, 31.0, 23.0, 31.0, 37.0, 34.0, 36.0, 44.0, 31.0, 32.0, 44.0, 42.0, 1060.0, 37.0, 39.0, 42.0, 40.0, 32.0, 30.0, 27.0, 33.0, 26.0, 23.0, 24.0, 16.0, 16.0, 22.0, 13.0, 12.0, 6.0, 4.0, 3.0, 5.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.16998291015625, -3.0665283203125, -2.96307373046875, -2.859619140625, -2.75616455078125, -2.6527099609375, -2.54925537109375, -2.44580078125, -2.34234619140625, -2.2388916015625, -2.13543701171875, -2.031982421875, -1.92852783203125, -1.8250732421875, -1.72161865234375, -1.6181640625, -1.51470947265625, -1.4112548828125, -1.30780029296875, -1.204345703125, -1.10089111328125, -0.9974365234375, -0.89398193359375, -0.79052734375, -0.68707275390625, -0.5836181640625, -0.48016357421875, -0.376708984375, -0.27325439453125, -0.1697998046875, -0.06634521484375, 0.037109375, 0.14056396484375, 0.2440185546875, 0.34747314453125, 0.450927734375, 0.55438232421875, 0.6578369140625, 0.76129150390625, 0.86474609375, 0.96820068359375, 1.0716552734375, 1.17510986328125, 1.278564453125, 1.38201904296875, 1.4854736328125, 1.58892822265625, 1.6923828125, 1.79583740234375, 1.8992919921875, 2.00274658203125, 2.106201171875, 2.20965576171875, 2.3131103515625, 2.41656494140625, 2.52001953125, 2.62347412109375, 2.7269287109375, 2.83038330078125, 2.933837890625, 3.03729248046875, 3.1407470703125, 3.24420166015625, 3.34765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 25.0, 42.0, 55.0, 69.0, 126.0, 182.0, 234.0, 362.0, 487.0, 800.0, 1088.0, 1753.0, 2614.0, 3947.0, 6092.0, 9220.0, 13796.0, 21023.0, 31434.0, 46143.0, 66337.0, 91865.0, 119900.0, 1177527.0, 141674.0, 107941.0, 79690.0, 56678.0, 38562.0, 26103.0, 17253.0, 11469.0, 7576.0, 5014.0, 3309.0, 2267.0, 1445.0, 989.0, 659.0, 437.0, 293.0, 197.0, 131.0, 106.0, 64.0, 45.0, 32.0, 19.0, 13.0, 7.0, 6.0, 3.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.34912109375, -0.33777618408203125, -0.3264312744140625, -0.31508636474609375, -0.303741455078125, -0.29239654541015625, -0.2810516357421875, -0.26970672607421875, -0.25836181640625, -0.24701690673828125, -0.2356719970703125, -0.22432708740234375, -0.212982177734375, -0.20163726806640625, -0.1902923583984375, -0.17894744873046875, -0.1676025390625, -0.15625762939453125, -0.1449127197265625, -0.13356781005859375, -0.122222900390625, -0.11087799072265625, -0.0995330810546875, -0.08818817138671875, -0.07684326171875, -0.06549835205078125, -0.0541534423828125, -0.04280853271484375, -0.031463623046875, -0.02011871337890625, -0.0087738037109375, 0.00257110595703125, 0.013916015625, 0.02526092529296875, 0.0366058349609375, 0.04795074462890625, 0.059295654296875, 0.07064056396484375, 0.0819854736328125, 0.09333038330078125, 0.10467529296875, 0.11602020263671875, 0.1273651123046875, 0.13871002197265625, 0.150054931640625, 0.16139984130859375, 0.1727447509765625, 0.18408966064453125, 0.1954345703125, 0.20677947998046875, 0.2181243896484375, 0.22946929931640625, 0.240814208984375, 0.25215911865234375, 0.2635040283203125, 0.27484893798828125, 0.28619384765625, 0.29753875732421875, 0.3088836669921875, 0.32022857666015625, 0.331573486328125, 0.34291839599609375, 0.3542633056640625, 0.36560821533203125, 0.376953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 9.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 11.0, 15.0, 18.0, 14.0, 18.0, 22.0, 25.0, 37.0, 40.0, 40.0, 56.0, 50.0, 73.0, 69.0, 56.0, 60.0, 62.0, 40.0, 37.0, 36.0, 23.0, 22.0, 24.0, 16.0, 12.0, 7.0, 8.0, 13.0, 6.0, 12.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.00919342041015625, -0.008895397186279297, -0.008597373962402344, -0.00829935073852539, -0.008001327514648438, -0.007703304290771484, -0.007405281066894531, -0.007107257843017578, -0.006809234619140625, -0.006511211395263672, -0.006213188171386719, -0.005915164947509766, -0.0056171417236328125, -0.005319118499755859, -0.005021095275878906, -0.004723072052001953, -0.004425048828125, -0.004127025604248047, -0.0038290023803710938, -0.0035309791564941406, -0.0032329559326171875, -0.0029349327087402344, -0.0026369094848632812, -0.002338886260986328, -0.002040863037109375, -0.0017428398132324219, -0.0014448165893554688, -0.0011467933654785156, -0.0008487701416015625, -0.0005507469177246094, -0.00025272369384765625, 4.5299530029296875e-05, 0.00034332275390625, 0.0006413459777832031, 0.0009393692016601562, 0.0012373924255371094, 0.0015354156494140625, 0.0018334388732910156, 0.0021314620971679688, 0.002429485321044922, 0.002727508544921875, 0.003025531768798828, 0.0033235549926757812, 0.0036215782165527344, 0.0039196014404296875, 0.004217624664306641, 0.004515647888183594, 0.004813671112060547, 0.0051116943359375, 0.005409717559814453, 0.005707740783691406, 0.006005764007568359, 0.0063037872314453125, 0.006601810455322266, 0.006899833679199219, 0.007197856903076172, 0.007495880126953125, 0.007793903350830078, 0.008091926574707031, 0.008389949798583984, 0.008687973022460938, 0.00898599624633789, 0.009284019470214844, 0.009582042694091797, 0.00988006591796875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 6.0, 2.0, 10.0, 9.0, 13.0, 17.0, 10.0, 26.0, 25.0, 34.0, 56.0, 57.0, 93.0, 140.0, 284.0, 1526.0, 49969.0, 978490.0, 16092.0, 881.0, 275.0, 132.0, 82.0, 59.0, 60.0, 36.0, 24.0, 26.0, 24.0, 20.0, 19.0, 3.0, 8.0, 6.0, 7.0, 8.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2296142578125, -0.2225208282470703, -0.21542739868164062, -0.20833396911621094, -0.20124053955078125, -0.19414710998535156, -0.18705368041992188, -0.1799602508544922, -0.1728668212890625, -0.1657733917236328, -0.15867996215820312, -0.15158653259277344, -0.14449310302734375, -0.13739967346191406, -0.13030624389648438, -0.12321281433105469, -0.116119384765625, -0.10902595520019531, -0.10193252563476562, -0.09483909606933594, -0.08774566650390625, -0.08065223693847656, -0.07355880737304688, -0.06646537780761719, -0.0593719482421875, -0.05227851867675781, -0.045185089111328125, -0.03809165954589844, -0.03099822998046875, -0.023904800415039062, -0.016811370849609375, -0.009717941284179688, -0.00262451171875, 0.0044689178466796875, 0.011562347412109375, 0.018655776977539062, 0.02574920654296875, 0.03284263610839844, 0.039936065673828125, 0.04702949523925781, 0.0541229248046875, 0.06121635437011719, 0.06830978393554688, 0.07540321350097656, 0.08249664306640625, 0.08959007263183594, 0.09668350219726562, 0.10377693176269531, 0.110870361328125, 0.11796379089355469, 0.12505722045898438, 0.13215065002441406, 0.13924407958984375, 0.14633750915527344, 0.15343093872070312, 0.1605243682861328, 0.1676177978515625, 0.1747112274169922, 0.18180465698242188, 0.18889808654785156, 0.19599151611328125, 0.20308494567871094, 0.21017837524414062, 0.2172718048095703, 0.224365234375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 12.0, 112.0, 792.0, 99.0, 1.0, 0.0, 1.0], "bins": [-0.3848075270652771, -0.37833914160728455, -0.3718707859516144, -0.3654024004936218, -0.35893404483795166, -0.3524656593799591, -0.34599727392196655, -0.3395289182662964, -0.33306053280830383, -0.3265921473503113, -0.3201237916946411, -0.31365540623664856, -0.3071870505809784, -0.30071866512298584, -0.2942502796649933, -0.2877819240093231, -0.28131353855133057, -0.274845153093338, -0.26837679743766785, -0.2619084119796753, -0.2554400563240051, -0.24897167086601257, -0.2425033003091812, -0.23603492975234985, -0.2295665591955185, -0.22309818863868713, -0.21662981808185577, -0.21016143262386322, -0.20369306206703186, -0.1972246915102005, -0.19075632095336914, -0.1842879354953766, -0.17781955003738403, -0.17135117948055267, -0.1648828089237213, -0.15841442346572876, -0.1519460529088974, -0.14547768235206604, -0.13900931179523468, -0.13254094123840332, -0.12607255578041077, -0.1196041852235794, -0.11313580721616745, -0.10666743665933609, -0.10019905865192413, -0.09373068809509277, -0.08726231753826141, -0.08079393953084946, -0.0743255764245987, -0.06785720586776733, -0.06138882786035538, -0.05492045730352402, -0.04845207929611206, -0.0419837087392807, -0.03551533445715904, -0.029046960175037384, -0.022578582167625427, -0.01611020788550377, -0.009641834534704685, -0.0031734611839056015, 0.003294913098216057, 0.009763285517692566, 0.016231659799814224, 0.022700034081935883, 0.02916840836405754]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 6.0, 3.0, 12.0, 10.0, 12.0, 9.0, 22.0, 19.0, 22.0, 28.0, 28.0, 33.0, 44.0, 39.0, 39.0, 35.0, 42.0, 39.0, 56.0, 35.0, 42.0, 43.0, 39.0, 37.0, 45.0, 34.0, 34.0, 26.0, 23.0, 24.0, 15.0, 21.0, 23.0, 10.0, 7.0, 10.0, 8.0, 7.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01643824577331543, -0.015873000025749207, -0.015307754278182983, -0.01474250853061676, -0.014177262783050537, -0.013612017035484314, -0.01304677128791809, -0.012481525540351868, -0.011916279792785645, -0.011351034045219421, -0.010785788297653198, -0.010220542550086975, -0.009655296802520752, -0.009090051054954529, -0.008524805307388306, -0.007959559559822083, -0.007394313812255859, -0.006829068064689636, -0.006263822317123413, -0.00569857656955719, -0.005133330821990967, -0.004568085074424744, -0.0040028393268585205, -0.0034375935792922974, -0.0028723478317260742, -0.002307102084159851, -0.001741856336593628, -0.0011766105890274048, -0.0006113648414611816, -4.6119093894958496e-05, 0.0005191266536712646, 0.0010843724012374878, 0.001649618148803711, 0.002214863896369934, 0.0027801096439361572, 0.0033453553915023804, 0.0039106011390686035, 0.004475846886634827, 0.00504109263420105, 0.005606338381767273, 0.006171584129333496, 0.006736829876899719, 0.007302075624465942, 0.007867321372032166, 0.008432567119598389, 0.008997812867164612, 0.009563058614730835, 0.010128304362297058, 0.010693550109863281, 0.011258795857429504, 0.011824041604995728, 0.01238928735256195, 0.012954533100128174, 0.013519778847694397, 0.01408502459526062, 0.014650270342826843, 0.015215516090393066, 0.01578076183795929, 0.016346007585525513, 0.016911253333091736, 0.01747649908065796, 0.018041744828224182, 0.018606990575790405, 0.01917223632335663, 0.01973748207092285]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 8.0, 8.0, 9.0, 7.0, 6.0, 20.0, 13.0, 18.0, 18.0, 18.0, 13.0, 25.0, 21.0, 14.0, 30.0, 29.0, 30.0, 34.0, 35.0, 41.0, 38.0, 34.0, 44.0, 40.0, 41.0, 42.0, 37.0, 31.0, 44.0, 39.0, 38.0, 25.0, 19.0, 23.0, 23.0, 18.0, 14.0, 8.0, 12.0, 5.0, 9.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8912353515625, -4.739501953125, -4.5877685546875, -4.43603515625, -4.2843017578125, -4.132568359375, -3.9808349609375, -3.8291015625, -3.6773681640625, -3.525634765625, -3.3739013671875, -3.22216796875, -3.0704345703125, -2.918701171875, -2.7669677734375, -2.615234375, -2.4635009765625, -2.311767578125, -2.1600341796875, -2.00830078125, -1.8565673828125, -1.704833984375, -1.5531005859375, -1.4013671875, -1.2496337890625, -1.097900390625, -0.9461669921875, -0.79443359375, -0.6427001953125, -0.490966796875, -0.3392333984375, -0.1875, -0.0357666015625, 0.115966796875, 0.2677001953125, 0.41943359375, 0.5711669921875, 0.722900390625, 0.8746337890625, 1.0263671875, 1.1781005859375, 1.329833984375, 1.4815673828125, 1.63330078125, 1.7850341796875, 1.936767578125, 2.0885009765625, 2.240234375, 2.3919677734375, 2.543701171875, 2.6954345703125, 2.84716796875, 2.9989013671875, 3.150634765625, 3.3023681640625, 3.4541015625, 3.6058349609375, 3.757568359375, 3.9093017578125, 4.06103515625, 4.2127685546875, 4.364501953125, 4.5162353515625, 4.66796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 11.0, 11.0, 10.0, 29.0, 25.0, 37.0, 34.0, 64.0, 79.0, 118.0, 162.0, 249.0, 419.0, 767.0, 1465.0, 3370.0, 7468.0, 17039.0, 41532.0, 113291.0, 380889.0, 318956.0, 98307.0, 36283.0, 15159.0, 6636.0, 2951.0, 1411.0, 674.0, 380.0, 215.0, 148.0, 90.0, 69.0, 67.0, 31.0, 24.0, 23.0, 15.0, 13.0, 5.0, 6.0, 6.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.33203125, -5.1650390625, -4.998046875, -4.8310546875, -4.6640625, -4.4970703125, -4.330078125, -4.1630859375, -3.99609375, -3.8291015625, -3.662109375, -3.4951171875, -3.328125, -3.1611328125, -2.994140625, -2.8271484375, -2.66015625, -2.4931640625, -2.326171875, -2.1591796875, -1.9921875, -1.8251953125, -1.658203125, -1.4912109375, -1.32421875, -1.1572265625, -0.990234375, -0.8232421875, -0.65625, -0.4892578125, -0.322265625, -0.1552734375, 0.01171875, 0.1787109375, 0.345703125, 0.5126953125, 0.6796875, 0.8466796875, 1.013671875, 1.1806640625, 1.34765625, 1.5146484375, 1.681640625, 1.8486328125, 2.015625, 2.1826171875, 2.349609375, 2.5166015625, 2.68359375, 2.8505859375, 3.017578125, 3.1845703125, 3.3515625, 3.5185546875, 3.685546875, 3.8525390625, 4.01953125, 4.1865234375, 4.353515625, 4.5205078125, 4.6875, 4.8544921875, 5.021484375, 5.1884765625, 5.35546875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 7.0, 12.0, 14.0, 13.0, 18.0, 11.0, 22.0, 24.0, 35.0, 34.0, 35.0, 36.0, 58.0, 47.0, 86.0, 188.0, 1608.0, 268.0, 105.0, 69.0, 50.0, 44.0, 33.0, 37.0, 33.0, 23.0, 27.0, 22.0, 12.0, 17.0, 19.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.6796875, -19.078125, -18.4765625, -17.875, -17.2734375, -16.671875, -16.0703125, -15.46875, -14.8671875, -14.265625, -13.6640625, -13.0625, -12.4609375, -11.859375, -11.2578125, -10.65625, -10.0546875, -9.453125, -8.8515625, -8.25, -7.6484375, -7.046875, -6.4453125, -5.84375, -5.2421875, -4.640625, -4.0390625, -3.4375, -2.8359375, -2.234375, -1.6328125, -1.03125, -0.4296875, 0.171875, 0.7734375, 1.375, 1.9765625, 2.578125, 3.1796875, 3.78125, 4.3828125, 4.984375, 5.5859375, 6.1875, 6.7890625, 7.390625, 7.9921875, 8.59375, 9.1953125, 9.796875, 10.3984375, 11.0, 11.6015625, 12.203125, 12.8046875, 13.40625, 14.0078125, 14.609375, 15.2109375, 15.8125, 16.4140625, 17.015625, 17.6171875, 18.21875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 5.0, 9.0, 4.0, 8.0, 13.0, 13.0, 22.0, 27.0, 27.0, 52.0, 47.0, 66.0, 91.0, 98.0, 178.0, 273.0, 522.0, 1063.0, 4800.0, 468421.0, 2657639.0, 9180.0, 1443.0, 585.0, 342.0, 197.0, 128.0, 107.0, 70.0, 57.0, 36.0, 34.0, 32.0, 24.0, 16.0, 15.0, 16.0, 18.0, 4.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.71875, -34.57080078125, -33.4228515625, -32.27490234375, -31.126953125, -29.97900390625, -28.8310546875, -27.68310546875, -26.53515625, -25.38720703125, -24.2392578125, -23.09130859375, -21.943359375, -20.79541015625, -19.6474609375, -18.49951171875, -17.3515625, -16.20361328125, -15.0556640625, -13.90771484375, -12.759765625, -11.61181640625, -10.4638671875, -9.31591796875, -8.16796875, -7.02001953125, -5.8720703125, -4.72412109375, -3.576171875, -2.42822265625, -1.2802734375, -0.13232421875, 1.015625, 2.16357421875, 3.3115234375, 4.45947265625, 5.607421875, 6.75537109375, 7.9033203125, 9.05126953125, 10.19921875, 11.34716796875, 12.4951171875, 13.64306640625, 14.791015625, 15.93896484375, 17.0869140625, 18.23486328125, 19.3828125, 20.53076171875, 21.6787109375, 22.82666015625, 23.974609375, 25.12255859375, 26.2705078125, 27.41845703125, 28.56640625, 29.71435546875, 30.8623046875, 32.01025390625, 33.158203125, 34.30615234375, 35.4541015625, 36.60205078125, 37.75]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 30.0, 76.0, 231.0, 287.0, 247.0, 88.0, 39.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.84210205078125, -74.4255599975586, -73.00901794433594, -71.59247589111328, -70.17593383789062, -68.75938415527344, -67.34284210205078, -65.92630004882812, -64.50975799560547, -63.09321594238281, -61.676673889160156, -60.260128021240234, -58.84358596801758, -57.42704391479492, -56.010498046875, -54.593955993652344, -53.17741394042969, -51.76087188720703, -50.344329833984375, -48.92778396606445, -47.5112419128418, -46.09469985961914, -44.67815399169922, -43.26161193847656, -41.845069885253906, -40.42852783203125, -39.011985778808594, -37.59543991088867, -36.178897857666016, -34.76235580444336, -33.34580993652344, -31.92926788330078, -30.51272201538086, -29.096179962158203, -27.679636001586914, -26.263092041015625, -24.84654998779297, -23.430007934570312, -22.013463973999023, -20.596920013427734, -19.180377960205078, -17.763835906982422, -16.347291946411133, -14.93074893951416, -13.514205932617188, -12.097662925720215, -10.681119918823242, -9.26457691192627, -7.848034858703613, -6.431491851806641, -5.014948844909668, -3.5984058380126953, -2.1818628311157227, -0.76531982421875, 0.6512231826782227, 2.0677661895751953, 3.484309196472168, 4.900852203369141, 6.317395210266113, 7.733938217163086, 9.150481224060059, 10.567024230957031, 11.983567237854004, 13.400110244750977, 14.81665325164795]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 12.0, 18.0, 18.0, 17.0, 16.0, 18.0, 19.0, 21.0, 24.0, 34.0, 38.0, 35.0, 36.0, 54.0, 54.0, 50.0, 48.0, 45.0, 50.0, 40.0, 45.0, 21.0, 37.0, 24.0, 31.0, 25.0, 22.0, 24.0, 13.0, 21.0, 14.0, 13.0, 7.0, 9.0, 3.0, 7.0, 3.0, 5.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-50.122135162353516, -48.63666915893555, -47.15120315551758, -45.665740966796875, -44.180274963378906, -42.69480895996094, -41.20934295654297, -39.723876953125, -38.23841094970703, -36.75294494628906, -35.267478942871094, -33.782012939453125, -32.29655075073242, -30.811084747314453, -29.325618743896484, -27.840152740478516, -26.354690551757812, -24.869224548339844, -23.383760452270508, -21.89829444885254, -20.412830352783203, -18.927364349365234, -17.441898345947266, -15.956433296203613, -14.470968246459961, -12.985503196716309, -11.500038146972656, -10.014572143554688, -8.529107093811035, -7.043642044067383, -5.558176040649414, -4.072710990905762, -2.587249755859375, -1.1017844676971436, 0.3836808204650879, 1.8691463470458984, 3.354611396789551, 4.840076446533203, 6.325542449951172, 7.811007499694824, 9.296472549438477, 10.781937599182129, 12.267402648925781, 13.75286865234375, 15.238333702087402, 16.723798751831055, 18.209264755249023, 19.69472885131836, 21.180194854736328, 22.665660858154297, 24.151124954223633, 25.6365909576416, 27.122055053710938, 28.607521057128906, 30.092987060546875, 31.578453063964844, 33.06391906738281, 34.54938507080078, 36.03485107421875, 37.52031707763672, 39.00577926635742, 40.49124526977539, 41.97671127319336, 43.46217727661133, 44.94763946533203]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 7.0, 8.0, 17.0, 14.0, 12.0, 14.0, 20.0, 17.0, 19.0, 19.0, 23.0, 17.0, 23.0, 26.0, 32.0, 46.0, 29.0, 33.0, 38.0, 45.0, 40.0, 36.0, 38.0, 38.0, 38.0, 36.0, 37.0, 24.0, 37.0, 34.0, 22.0, 19.0, 22.0, 22.0, 15.0, 5.0, 10.0, 6.0, 11.0, 8.0, 9.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.23828125, -5.08441162109375, -4.9305419921875, -4.77667236328125, -4.622802734375, -4.46893310546875, -4.3150634765625, -4.16119384765625, -4.00732421875, -3.85345458984375, -3.6995849609375, -3.54571533203125, -3.391845703125, -3.23797607421875, -3.0841064453125, -2.93023681640625, -2.7763671875, -2.62249755859375, -2.4686279296875, -2.31475830078125, -2.160888671875, -2.00701904296875, -1.8531494140625, -1.69927978515625, -1.54541015625, -1.39154052734375, -1.2376708984375, -1.08380126953125, -0.929931640625, -0.77606201171875, -0.6221923828125, -0.46832275390625, -0.314453125, -0.16058349609375, -0.0067138671875, 0.14715576171875, 0.301025390625, 0.45489501953125, 0.6087646484375, 0.76263427734375, 0.91650390625, 1.07037353515625, 1.2242431640625, 1.37811279296875, 1.531982421875, 1.68585205078125, 1.8397216796875, 1.99359130859375, 2.1474609375, 2.30133056640625, 2.4552001953125, 2.60906982421875, 2.762939453125, 2.91680908203125, 3.0706787109375, 3.22454833984375, 3.37841796875, 3.53228759765625, 3.6861572265625, 3.84002685546875, 3.993896484375, 4.14776611328125, 4.3016357421875, 4.45550537109375, 4.609375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 5.0, 6.0, 7.0, 11.0, 12.0, 18.0, 16.0, 21.0, 22.0, 33.0, 26.0, 45.0, 64.0, 108.0, 179.0, 352.0, 704.0, 2109.0, 7676.0, 42642.0, 497094.0, 2966719.0, 613882.0, 50090.0, 8634.0, 2235.0, 729.0, 301.0, 161.0, 92.0, 52.0, 51.0, 38.0, 30.0, 19.0, 19.0, 8.0, 15.0, 4.0, 9.0, 9.0, 1.0, 4.0, 8.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-15.8125, -15.3546142578125, -14.896728515625, -14.4388427734375, -13.98095703125, -13.5230712890625, -13.065185546875, -12.6072998046875, -12.1494140625, -11.6915283203125, -11.233642578125, -10.7757568359375, -10.31787109375, -9.8599853515625, -9.402099609375, -8.9442138671875, -8.486328125, -8.0284423828125, -7.570556640625, -7.1126708984375, -6.65478515625, -6.1968994140625, -5.739013671875, -5.2811279296875, -4.8232421875, -4.3653564453125, -3.907470703125, -3.4495849609375, -2.99169921875, -2.5338134765625, -2.075927734375, -1.6180419921875, -1.16015625, -0.7022705078125, -0.244384765625, 0.2135009765625, 0.67138671875, 1.1292724609375, 1.587158203125, 2.0450439453125, 2.5029296875, 2.9608154296875, 3.418701171875, 3.8765869140625, 4.33447265625, 4.7923583984375, 5.250244140625, 5.7081298828125, 6.166015625, 6.6239013671875, 7.081787109375, 7.5396728515625, 7.99755859375, 8.4554443359375, 8.913330078125, 9.3712158203125, 9.8291015625, 10.2869873046875, 10.744873046875, 11.2027587890625, 11.66064453125, 12.1185302734375, 12.576416015625, 13.0343017578125, 13.4921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 17.0, 16.0, 21.0, 29.0, 42.0, 53.0, 75.0, 76.0, 117.0, 162.0, 245.0, 380.0, 477.0, 559.0, 519.0, 365.0, 250.0, 177.0, 126.0, 94.0, 81.0, 53.0, 30.0, 20.0, 22.0, 18.0, 12.0, 2.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.71875, -10.3670654296875, -10.015380859375, -9.6636962890625, -9.31201171875, -8.9603271484375, -8.608642578125, -8.2569580078125, -7.9052734375, -7.5535888671875, -7.201904296875, -6.8502197265625, -6.49853515625, -6.1468505859375, -5.795166015625, -5.4434814453125, -5.091796875, -4.7401123046875, -4.388427734375, -4.0367431640625, -3.68505859375, -3.3333740234375, -2.981689453125, -2.6300048828125, -2.2783203125, -1.9266357421875, -1.574951171875, -1.2232666015625, -0.87158203125, -0.5198974609375, -0.168212890625, 0.1834716796875, 0.53515625, 0.8868408203125, 1.238525390625, 1.5902099609375, 1.94189453125, 2.2935791015625, 2.645263671875, 2.9969482421875, 3.3486328125, 3.7003173828125, 4.052001953125, 4.4036865234375, 4.75537109375, 5.1070556640625, 5.458740234375, 5.8104248046875, 6.162109375, 6.5137939453125, 6.865478515625, 7.2171630859375, 7.56884765625, 7.9205322265625, 8.272216796875, 8.6239013671875, 8.9755859375, 9.3272705078125, 9.678955078125, 10.0306396484375, 10.38232421875, 10.7340087890625, 11.085693359375, 11.4373779296875, 11.7890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 9.0, 7.0, 14.0, 23.0, 17.0, 31.0, 51.0, 74.0, 87.0, 131.0, 207.0, 278.0, 528.0, 3194.0, 511798.0, 3663953.0, 12000.0, 756.0, 372.0, 210.0, 150.0, 97.0, 76.0, 53.0, 41.0, 38.0, 22.0, 16.0, 12.0, 8.0, 10.0, 10.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.21875, -61.36865234375, -59.5185546875, -57.66845703125, -55.818359375, -53.96826171875, -52.1181640625, -50.26806640625, -48.41796875, -46.56787109375, -44.7177734375, -42.86767578125, -41.017578125, -39.16748046875, -37.3173828125, -35.46728515625, -33.6171875, -31.76708984375, -29.9169921875, -28.06689453125, -26.216796875, -24.36669921875, -22.5166015625, -20.66650390625, -18.81640625, -16.96630859375, -15.1162109375, -13.26611328125, -11.416015625, -9.56591796875, -7.7158203125, -5.86572265625, -4.015625, -2.16552734375, -0.3154296875, 1.53466796875, 3.384765625, 5.23486328125, 7.0849609375, 8.93505859375, 10.78515625, 12.63525390625, 14.4853515625, 16.33544921875, 18.185546875, 20.03564453125, 21.8857421875, 23.73583984375, 25.5859375, 27.43603515625, 29.2861328125, 31.13623046875, 32.986328125, 34.83642578125, 36.6865234375, 38.53662109375, 40.38671875, 42.23681640625, 44.0869140625, 45.93701171875, 47.787109375, 49.63720703125, 51.4873046875, 53.33740234375, 55.1875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 15.0, 45.0, 142.0, 294.0, 323.0, 127.0, 59.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.84120178222656, -210.71072387695312, -206.58023071289062, -202.4497528076172, -198.31927490234375, -194.18878173828125, -190.0583038330078, -185.9278106689453, -181.79733276367188, -177.66685485839844, -173.53636169433594, -169.4058837890625, -165.275390625, -161.14491271972656, -157.01443481445312, -152.88394165039062, -148.7534637451172, -144.62298583984375, -140.49249267578125, -136.3620147705078, -132.23153686523438, -128.10104370117188, -123.97056579589844, -119.84008026123047, -115.7095947265625, -111.57910919189453, -107.44862365722656, -103.31814575195312, -99.18766021728516, -95.05717468261719, -90.92669677734375, -86.79621124267578, -82.66573333740234, -78.53524780273438, -74.40476989746094, -70.27428436279297, -66.143798828125, -62.01331329345703, -57.88283157348633, -53.752349853515625, -49.621864318847656, -45.49137878417969, -41.360897064208984, -37.23041534423828, -33.09992980957031, -28.969446182250977, -24.83896255493164, -20.708478927612305, -16.57799530029297, -12.447511672973633, -8.317028045654297, -4.186544418334961, -0.056060791015625, 4.074422836303711, 8.204906463623047, 12.335390090942383, 16.46587371826172, 20.596357345581055, 24.72684097290039, 28.857324600219727, 32.98780822753906, 37.11829376220703, 41.248775482177734, 45.37925720214844, 49.509742736816406]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 12.0, 9.0, 8.0, 9.0, 10.0, 21.0, 18.0, 21.0, 24.0, 28.0, 24.0, 34.0, 23.0, 35.0, 33.0, 28.0, 37.0, 27.0, 34.0, 31.0, 32.0, 40.0, 42.0, 36.0, 43.0, 54.0, 33.0, 36.0, 23.0, 24.0, 17.0, 23.0, 24.0, 11.0, 11.0, 14.0, 8.0, 5.0, 8.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.642791748046875, -28.682708740234375, -27.722625732421875, -26.762540817260742, -25.802457809448242, -24.842374801635742, -23.88228988647461, -22.92220687866211, -21.96212387084961, -21.00204086303711, -20.04195785522461, -19.081872940063477, -18.121789932250977, -17.161706924438477, -16.201622009277344, -15.241539001464844, -14.281455993652344, -13.321372985839844, -12.361289024353027, -11.401205062866211, -10.441122055053711, -9.481039047241211, -8.520955085754395, -7.560871601104736, -6.600788116455078, -5.64070463180542, -4.680621147155762, -3.7205376625061035, -2.7604541778564453, -1.800370693206787, -0.8402872085571289, 0.1197962760925293, 1.0798797607421875, 2.0399632453918457, 3.000046730041504, 3.960130214691162, 4.92021369934082, 5.8802971839904785, 6.840380668640137, 7.800464153289795, 8.760547637939453, 9.720630645751953, 10.68071460723877, 11.640798568725586, 12.600881576538086, 13.560964584350586, 14.521048545837402, 15.481132507324219, 16.44121551513672, 17.40129852294922, 18.36138153076172, 19.32146644592285, 20.28154945373535, 21.24163246154785, 22.201717376708984, 23.161800384521484, 24.121883392333984, 25.081966400146484, 26.042049407958984, 27.002134323120117, 27.962217330932617, 28.922300338745117, 29.88238525390625, 30.84246826171875, 31.80255126953125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 13.0, 9.0, 10.0, 15.0, 20.0, 22.0, 12.0, 27.0, 24.0, 32.0, 35.0, 26.0, 36.0, 37.0, 31.0, 57.0, 36.0, 49.0, 45.0, 34.0, 60.0, 48.0, 47.0, 25.0, 31.0, 24.0, 28.0, 24.0, 26.0, 20.0, 17.0, 15.0, 15.0, 8.0, 5.0, 7.0, 7.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.19140625, -6.007568359375, -5.82373046875, -5.639892578125, -5.4560546875, -5.272216796875, -5.08837890625, -4.904541015625, -4.720703125, -4.536865234375, -4.35302734375, -4.169189453125, -3.9853515625, -3.801513671875, -3.61767578125, -3.433837890625, -3.25, -3.066162109375, -2.88232421875, -2.698486328125, -2.5146484375, -2.330810546875, -2.14697265625, -1.963134765625, -1.779296875, -1.595458984375, -1.41162109375, -1.227783203125, -1.0439453125, -0.860107421875, -0.67626953125, -0.492431640625, -0.30859375, -0.124755859375, 0.05908203125, 0.242919921875, 0.4267578125, 0.610595703125, 0.79443359375, 0.978271484375, 1.162109375, 1.345947265625, 1.52978515625, 1.713623046875, 1.8974609375, 2.081298828125, 2.26513671875, 2.448974609375, 2.6328125, 2.816650390625, 3.00048828125, 3.184326171875, 3.3681640625, 3.552001953125, 3.73583984375, 3.919677734375, 4.103515625, 4.287353515625, 4.47119140625, 4.655029296875, 4.8388671875, 5.022705078125, 5.20654296875, 5.390380859375, 5.57421875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 9.0, 12.0, 20.0, 23.0, 33.0, 47.0, 88.0, 152.0, 214.0, 353.0, 554.0, 908.0, 1292.0, 2109.0, 3127.0, 4874.0, 7455.0, 11320.0, 17465.0, 26744.0, 40094.0, 58341.0, 83363.0, 114228.0, 143062.0, 144554.0, 117196.0, 87295.0, 61230.0, 41716.0, 28009.0, 18462.0, 12151.0, 7809.0, 5083.0, 3283.0, 2074.0, 1340.0, 884.0, 543.0, 344.0, 240.0, 162.0, 110.0, 54.0, 43.0, 31.0, 18.0, 15.0, 5.0, 6.0, 5.0, 3.0, 0.0, 4.0], "bins": [-0.73974609375, -0.7180252075195312, -0.6963043212890625, -0.6745834350585938, -0.652862548828125, -0.6311416625976562, -0.6094207763671875, -0.5876998901367188, -0.56597900390625, -0.5442581176757812, -0.5225372314453125, -0.5008163452148438, -0.479095458984375, -0.45737457275390625, -0.4356536865234375, -0.41393280029296875, -0.3922119140625, -0.37049102783203125, -0.3487701416015625, -0.32704925537109375, -0.305328369140625, -0.28360748291015625, -0.2618865966796875, -0.24016571044921875, -0.21844482421875, -0.19672393798828125, -0.1750030517578125, -0.15328216552734375, -0.131561279296875, -0.10984039306640625, -0.0881195068359375, -0.06639862060546875, -0.044677734375, -0.02295684814453125, -0.0012359619140625, 0.02048492431640625, 0.042205810546875, 0.06392669677734375, 0.0856475830078125, 0.10736846923828125, 0.12908935546875, 0.15081024169921875, 0.1725311279296875, 0.19425201416015625, 0.215972900390625, 0.23769378662109375, 0.2594146728515625, 0.28113555908203125, 0.3028564453125, 0.32457733154296875, 0.3462982177734375, 0.36801910400390625, 0.389739990234375, 0.41146087646484375, 0.4331817626953125, 0.45490264892578125, 0.47662353515625, 0.49834442138671875, 0.5200653076171875, 0.5417861938476562, 0.563507080078125, 0.5852279663085938, 0.6069488525390625, 0.6286697387695312, 0.650390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 13.0, 9.0, 8.0, 14.0, 18.0, 23.0, 21.0, 21.0, 24.0, 25.0, 35.0, 28.0, 37.0, 34.0, 47.0, 33.0, 56.0, 1070.0, 50.0, 40.0, 43.0, 41.0, 41.0, 35.0, 41.0, 34.0, 26.0, 20.0, 17.0, 17.0, 10.0, 15.0, 15.0, 3.0, 11.0, 10.0, 7.0, 1.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.17578125, -4.055908203125, -3.93603515625, -3.816162109375, -3.6962890625, -3.576416015625, -3.45654296875, -3.336669921875, -3.216796875, -3.096923828125, -2.97705078125, -2.857177734375, -2.7373046875, -2.617431640625, -2.49755859375, -2.377685546875, -2.2578125, -2.137939453125, -2.01806640625, -1.898193359375, -1.7783203125, -1.658447265625, -1.53857421875, -1.418701171875, -1.298828125, -1.178955078125, -1.05908203125, -0.939208984375, -0.8193359375, -0.699462890625, -0.57958984375, -0.459716796875, -0.33984375, -0.219970703125, -0.10009765625, 0.019775390625, 0.1396484375, 0.259521484375, 0.37939453125, 0.499267578125, 0.619140625, 0.739013671875, 0.85888671875, 0.978759765625, 1.0986328125, 1.218505859375, 1.33837890625, 1.458251953125, 1.578125, 1.697998046875, 1.81787109375, 1.937744140625, 2.0576171875, 2.177490234375, 2.29736328125, 2.417236328125, 2.537109375, 2.656982421875, 2.77685546875, 2.896728515625, 3.0166015625, 3.136474609375, 3.25634765625, 3.376220703125, 3.49609375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 19.0, 30.0, 49.0, 67.0, 84.0, 138.0, 209.0, 294.0, 502.0, 638.0, 1040.0, 1612.0, 2396.0, 3667.0, 5543.0, 8433.0, 13273.0, 20096.0, 30004.0, 44934.0, 66336.0, 93361.0, 123865.0, 1182170.0, 147019.0, 108732.0, 78695.0, 54656.0, 37374.0, 24442.0, 16315.0, 10662.0, 7009.0, 4695.0, 2975.0, 2014.0, 1262.0, 849.0, 529.0, 398.0, 246.0, 167.0, 108.0, 67.0, 50.0, 39.0, 16.0, 20.0, 8.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4052734375, -0.39250946044921875, -0.3797454833984375, -0.36698150634765625, -0.354217529296875, -0.34145355224609375, -0.3286895751953125, -0.31592559814453125, -0.30316162109375, -0.29039764404296875, -0.2776336669921875, -0.26486968994140625, -0.252105712890625, -0.23934173583984375, -0.2265777587890625, -0.21381378173828125, -0.2010498046875, -0.18828582763671875, -0.1755218505859375, -0.16275787353515625, -0.149993896484375, -0.13722991943359375, -0.1244659423828125, -0.11170196533203125, -0.09893798828125, -0.08617401123046875, -0.0734100341796875, -0.06064605712890625, -0.047882080078125, -0.03511810302734375, -0.0223541259765625, -0.00959014892578125, 0.003173828125, 0.01593780517578125, 0.0287017822265625, 0.04146575927734375, 0.054229736328125, 0.06699371337890625, 0.0797576904296875, 0.09252166748046875, 0.10528564453125, 0.11804962158203125, 0.1308135986328125, 0.14357757568359375, 0.156341552734375, 0.16910552978515625, 0.1818695068359375, 0.19463348388671875, 0.2073974609375, 0.22016143798828125, 0.2329254150390625, 0.24568939208984375, 0.258453369140625, 0.27121734619140625, 0.2839813232421875, 0.29674530029296875, 0.30950927734375, 0.32227325439453125, 0.3350372314453125, 0.34780120849609375, 0.360565185546875, 0.37332916259765625, 0.3860931396484375, 0.39885711669921875, 0.41162109375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 10.0, 8.0, 11.0, 10.0, 10.0, 16.0, 12.0, 23.0, 23.0, 25.0, 33.0, 55.0, 77.0, 109.0, 99.0, 83.0, 84.0, 65.0, 60.0, 35.0, 17.0, 31.0, 16.0, 15.0, 17.0, 6.0, 7.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.015045166015625, -0.01461172103881836, -0.014178276062011719, -0.013744831085205078, -0.013311386108398438, -0.012877941131591797, -0.012444496154785156, -0.012011051177978516, -0.011577606201171875, -0.011144161224365234, -0.010710716247558594, -0.010277271270751953, -0.009843826293945312, -0.009410381317138672, -0.008976936340332031, -0.00854349136352539, -0.00811004638671875, -0.007676601409912109, -0.007243156433105469, -0.006809711456298828, -0.0063762664794921875, -0.005942821502685547, -0.005509376525878906, -0.005075931549072266, -0.004642486572265625, -0.004209041595458984, -0.0037755966186523438, -0.003342151641845703, -0.0029087066650390625, -0.002475261688232422, -0.0020418167114257812, -0.0016083717346191406, -0.0011749267578125, -0.0007414817810058594, -0.00030803680419921875, 0.00012540817260742188, 0.0005588531494140625, 0.0009922981262207031, 0.0014257431030273438, 0.0018591880798339844, 0.002292633056640625, 0.0027260780334472656, 0.0031595230102539062, 0.003592967987060547, 0.0040264129638671875, 0.004459857940673828, 0.004893302917480469, 0.005326747894287109, 0.00576019287109375, 0.006193637847900391, 0.006627082824707031, 0.007060527801513672, 0.0074939727783203125, 0.007927417755126953, 0.008360862731933594, 0.008794307708740234, 0.009227752685546875, 0.009661197662353516, 0.010094642639160156, 0.010528087615966797, 0.010961532592773438, 0.011394977569580078, 0.011828422546386719, 0.01226186752319336, 0.0126953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 8.0, 13.0, 18.0, 21.0, 28.0, 41.0, 44.0, 83.0, 141.0, 333.0, 2962.0, 165747.0, 868546.0, 9452.0, 571.0, 166.0, 79.0, 55.0, 43.0, 42.0, 25.0, 15.0, 16.0, 17.0, 13.0, 11.0, 8.0, 8.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2841796875, -0.27443695068359375, -0.2646942138671875, -0.25495147705078125, -0.245208740234375, -0.23546600341796875, -0.2257232666015625, -0.21598052978515625, -0.20623779296875, -0.19649505615234375, -0.1867523193359375, -0.17700958251953125, -0.167266845703125, -0.15752410888671875, -0.1477813720703125, -0.13803863525390625, -0.1282958984375, -0.11855316162109375, -0.1088104248046875, -0.09906768798828125, -0.089324951171875, -0.07958221435546875, -0.0698394775390625, -0.06009674072265625, -0.05035400390625, -0.04061126708984375, -0.0308685302734375, -0.02112579345703125, -0.011383056640625, -0.00164031982421875, 0.0081024169921875, 0.01784515380859375, 0.027587890625, 0.03733062744140625, 0.0470733642578125, 0.05681610107421875, 0.066558837890625, 0.07630157470703125, 0.0860443115234375, 0.09578704833984375, 0.10552978515625, 0.11527252197265625, 0.1250152587890625, 0.13475799560546875, 0.144500732421875, 0.15424346923828125, 0.1639862060546875, 0.17372894287109375, 0.1834716796875, 0.19321441650390625, 0.2029571533203125, 0.21269989013671875, 0.222442626953125, 0.23218536376953125, 0.2419281005859375, 0.25167083740234375, 0.26141357421875, 0.27115631103515625, 0.2808990478515625, 0.29064178466796875, 0.300384521484375, 0.31012725830078125, 0.3198699951171875, 0.32961273193359375, 0.33935546875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 41.0, 176.0, 642.0, 123.0, 19.0, 6.0, 1.0, 0.0, 1.0], "bins": [-0.42861753702163696, -0.4211585521697998, -0.41369956731796265, -0.4062405824661255, -0.39878159761428833, -0.39132261276245117, -0.383863627910614, -0.37640464305877686, -0.3689456582069397, -0.36148667335510254, -0.3540276885032654, -0.3465687036514282, -0.33910971879959106, -0.3316507339477539, -0.32419174909591675, -0.3167327642440796, -0.3092738091945648, -0.30181482434272766, -0.2943558394908905, -0.28689685463905334, -0.2794378697872162, -0.27197888493537903, -0.26451990008354187, -0.2570609450340271, -0.24960194528102875, -0.2421429604291916, -0.23468397557735443, -0.22722499072551727, -0.2197660207748413, -0.21230703592300415, -0.204848051071167, -0.19738906621932983, -0.18993009626865387, -0.1824711114168167, -0.17501212656497955, -0.1675531417131424, -0.16009417176246643, -0.15263518691062927, -0.14517620205879211, -0.13771721720695496, -0.1302582323551178, -0.12279924750328064, -0.11534026265144348, -0.10788128525018692, -0.10042230039834976, -0.0929633155465126, -0.08550433814525604, -0.07804535329341888, -0.07058636844158173, -0.06312738358974457, -0.05566840246319771, -0.04820942133665085, -0.04075043648481369, -0.03329145163297653, -0.025832470506429672, -0.018373489379882812, -0.010914500802755356, -0.003455517813563347, 0.004003465175628662, 0.011462448164820671, 0.01892143115401268, 0.026380416005849838, 0.0338393971323967, 0.04129837825894356, 0.048757363110780716]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 2.0, 5.0, 10.0, 9.0, 9.0, 14.0, 19.0, 18.0, 18.0, 25.0, 32.0, 22.0, 35.0, 30.0, 32.0, 45.0, 33.0, 52.0, 39.0, 33.0, 47.0, 34.0, 53.0, 38.0, 48.0, 38.0, 35.0, 35.0, 22.0, 16.0, 28.0, 25.0, 15.0, 15.0, 17.0, 14.0, 9.0, 5.0, 4.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016185224056243896, -0.015666281804442406, -0.015147339552640915, -0.014628397300839424, -0.014109455049037933, -0.013590512797236443, -0.013071570545434952, -0.012552628293633461, -0.01203368604183197, -0.01151474379003048, -0.010995801538228989, -0.010476859286427498, -0.009957917034626007, -0.009438974782824516, -0.008920032531023026, -0.008401090279221535, -0.007882148027420044, -0.007363205775618553, -0.006844263523817062, -0.006325321272015572, -0.005806379020214081, -0.00528743676841259, -0.004768494516611099, -0.0042495522648096085, -0.0037306100130081177, -0.003211667761206627, -0.002692725509405136, -0.0021737832576036453, -0.0016548410058021545, -0.0011358987540006638, -0.000616956502199173, -9.801425039768219e-05, 0.0004209280014038086, 0.0009398702532052994, 0.0014588125050067902, 0.001977754756808281, 0.0024966970086097717, 0.0030156392604112625, 0.0035345815122127533, 0.004053523764014244, 0.004572466015815735, 0.005091408267617226, 0.005610350519418716, 0.006129292771220207, 0.006648235023021698, 0.007167177274823189, 0.0076861195266246796, 0.00820506177842617, 0.008724004030227661, 0.009242946282029152, 0.009761888533830643, 0.010280830785632133, 0.010799773037433624, 0.011318715289235115, 0.011837657541036606, 0.012356599792838097, 0.012875542044639587, 0.013394484296441078, 0.013913426548242569, 0.01443236880004406, 0.01495131105184555, 0.015470253303647041, 0.015989195555448532, 0.016508137807250023, 0.017027080059051514]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 13.0, 9.0, 11.0, 14.0, 20.0, 22.0, 12.0, 27.0, 24.0, 32.0, 35.0, 27.0, 35.0, 37.0, 31.0, 57.0, 36.0, 49.0, 45.0, 34.0, 59.0, 49.0, 46.0, 26.0, 31.0, 23.0, 29.0, 25.0, 25.0, 20.0, 17.0, 15.0, 15.0, 8.0, 5.0, 7.0, 7.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.19140625, -6.007568359375, -5.82373046875, -5.639892578125, -5.4560546875, -5.272216796875, -5.08837890625, -4.904541015625, -4.720703125, -4.536865234375, -4.35302734375, -4.169189453125, -3.9853515625, -3.801513671875, -3.61767578125, -3.433837890625, -3.25, -3.066162109375, -2.88232421875, -2.698486328125, -2.5146484375, -2.330810546875, -2.14697265625, -1.963134765625, -1.779296875, -1.595458984375, -1.41162109375, -1.227783203125, -1.0439453125, -0.860107421875, -0.67626953125, -0.492431640625, -0.30859375, -0.124755859375, 0.05908203125, 0.242919921875, 0.4267578125, 0.610595703125, 0.79443359375, 0.978271484375, 1.162109375, 1.345947265625, 1.52978515625, 1.713623046875, 1.8974609375, 2.081298828125, 2.26513671875, 2.448974609375, 2.6328125, 2.816650390625, 3.00048828125, 3.184326171875, 3.3681640625, 3.552001953125, 3.73583984375, 3.919677734375, 4.103515625, 4.287353515625, 4.47119140625, 4.655029296875, 4.8388671875, 5.022705078125, 5.20654296875, 5.390380859375, 5.57421875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 6.0, 12.0, 12.0, 17.0, 24.0, 30.0, 50.0, 43.0, 62.0, 94.0, 132.0, 213.0, 336.0, 673.0, 1397.0, 3587.0, 10611.0, 46527.0, 432073.0, 484539.0, 49916.0, 11293.0, 3733.0, 1446.0, 670.0, 349.0, 199.0, 141.0, 84.0, 78.0, 44.0, 40.0, 31.0, 29.0, 17.0, 5.0, 7.0, 9.0, 6.0, 6.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.5234375, -10.214111328125, -9.90478515625, -9.595458984375, -9.2861328125, -8.976806640625, -8.66748046875, -8.358154296875, -8.048828125, -7.739501953125, -7.43017578125, -7.120849609375, -6.8115234375, -6.502197265625, -6.19287109375, -5.883544921875, -5.57421875, -5.264892578125, -4.95556640625, -4.646240234375, -4.3369140625, -4.027587890625, -3.71826171875, -3.408935546875, -3.099609375, -2.790283203125, -2.48095703125, -2.171630859375, -1.8623046875, -1.552978515625, -1.24365234375, -0.934326171875, -0.625, -0.315673828125, -0.00634765625, 0.302978515625, 0.6123046875, 0.921630859375, 1.23095703125, 1.540283203125, 1.849609375, 2.158935546875, 2.46826171875, 2.777587890625, 3.0869140625, 3.396240234375, 3.70556640625, 4.014892578125, 4.32421875, 4.633544921875, 4.94287109375, 5.252197265625, 5.5615234375, 5.870849609375, 6.18017578125, 6.489501953125, 6.798828125, 7.108154296875, 7.41748046875, 7.726806640625, 8.0361328125, 8.345458984375, 8.65478515625, 8.964111328125, 9.2734375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 9.0, 3.0, 9.0, 11.0, 11.0, 13.0, 23.0, 27.0, 31.0, 34.0, 32.0, 38.0, 37.0, 42.0, 63.0, 107.0, 399.0, 1610.0, 109.0, 62.0, 44.0, 42.0, 37.0, 45.0, 30.0, 25.0, 28.0, 15.0, 19.0, 21.0, 18.0, 10.0, 12.0, 4.0, 9.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.40625, -19.7275390625, -19.048828125, -18.3701171875, -17.69140625, -17.0126953125, -16.333984375, -15.6552734375, -14.9765625, -14.2978515625, -13.619140625, -12.9404296875, -12.26171875, -11.5830078125, -10.904296875, -10.2255859375, -9.546875, -8.8681640625, -8.189453125, -7.5107421875, -6.83203125, -6.1533203125, -5.474609375, -4.7958984375, -4.1171875, -3.4384765625, -2.759765625, -2.0810546875, -1.40234375, -0.7236328125, -0.044921875, 0.6337890625, 1.3125, 1.9912109375, 2.669921875, 3.3486328125, 4.02734375, 4.7060546875, 5.384765625, 6.0634765625, 6.7421875, 7.4208984375, 8.099609375, 8.7783203125, 9.45703125, 10.1357421875, 10.814453125, 11.4931640625, 12.171875, 12.8505859375, 13.529296875, 14.2080078125, 14.88671875, 15.5654296875, 16.244140625, 16.9228515625, 17.6015625, 18.2802734375, 18.958984375, 19.6376953125, 20.31640625, 20.9951171875, 21.673828125, 22.3525390625, 23.03125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 2.0, 7.0, 9.0, 6.0, 9.0, 19.0, 17.0, 22.0, 14.0, 31.0, 33.0, 42.0, 65.0, 86.0, 133.0, 219.0, 376.0, 1949.0, 467584.0, 2671330.0, 2608.0, 503.0, 196.0, 91.0, 76.0, 49.0, 56.0, 42.0, 27.0, 25.0, 14.0, 12.0, 10.0, 8.0, 7.0, 5.0, 2.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-65.875, -63.94091796875, -62.0068359375, -60.07275390625, -58.138671875, -56.20458984375, -54.2705078125, -52.33642578125, -50.40234375, -48.46826171875, -46.5341796875, -44.60009765625, -42.666015625, -40.73193359375, -38.7978515625, -36.86376953125, -34.9296875, -32.99560546875, -31.0615234375, -29.12744140625, -27.193359375, -25.25927734375, -23.3251953125, -21.39111328125, -19.45703125, -17.52294921875, -15.5888671875, -13.65478515625, -11.720703125, -9.78662109375, -7.8525390625, -5.91845703125, -3.984375, -2.05029296875, -0.1162109375, 1.81787109375, 3.751953125, 5.68603515625, 7.6201171875, 9.55419921875, 11.48828125, 13.42236328125, 15.3564453125, 17.29052734375, 19.224609375, 21.15869140625, 23.0927734375, 25.02685546875, 26.9609375, 28.89501953125, 30.8291015625, 32.76318359375, 34.697265625, 36.63134765625, 38.5654296875, 40.49951171875, 42.43359375, 44.36767578125, 46.3017578125, 48.23583984375, 50.169921875, 52.10400390625, 54.0380859375, 55.97216796875, 57.90625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 67.0, 514.0, 408.0, 22.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.208892822265625, -33.80355453491211, -30.398218154907227, -26.99287986755371, -23.587543487548828, -20.182205200195312, -16.776866912841797, -13.371530532836914, -9.966192245483398, -6.560854911804199, -3.155517101287842, 0.24982070922851562, 3.655158042907715, 7.060495376586914, 10.46583366394043, 13.871170043945312, 17.276508331298828, 20.681846618652344, 24.087182998657227, 27.492521286010742, 30.897857666015625, 34.30319595336914, 37.708534240722656, 41.113868713378906, 44.51921081542969, 47.9245491027832, 51.32988739013672, 54.73522186279297, 58.140560150146484, 61.5458984375, 64.95123291015625, 68.35657501220703, 71.76190948486328, 75.16724395751953, 78.57258605957031, 81.97792053222656, 85.38326263427734, 88.7885971069336, 92.19393920898438, 95.59927368164062, 99.00460815429688, 102.40994262695312, 105.8152847290039, 109.22061920166016, 112.62596130371094, 116.03129577636719, 119.43663024902344, 122.84197235107422, 126.247314453125, 129.65264892578125, 133.0579833984375, 136.4633331298828, 139.86866760253906, 143.2740020751953, 146.67933654785156, 150.0846710205078, 153.49000549316406, 156.8953399658203, 160.30067443847656, 163.70602416992188, 167.11135864257812, 170.51669311523438, 173.92202758789062, 177.32736206054688, 180.7327117919922]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 12.0, 11.0, 11.0, 15.0, 12.0, 20.0, 12.0, 19.0, 19.0, 34.0, 20.0, 42.0, 25.0, 47.0, 36.0, 40.0, 56.0, 36.0, 33.0, 39.0, 38.0, 32.0, 45.0, 46.0, 40.0, 37.0, 29.0, 28.0, 23.0, 21.0, 17.0, 20.0, 18.0, 22.0, 5.0, 10.0, 8.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-63.84220886230469, -62.07742691040039, -60.31264114379883, -58.54785919189453, -56.78307342529297, -55.01829147338867, -53.253509521484375, -51.48872375488281, -49.723941802978516, -47.95915985107422, -46.194374084472656, -44.42959213256836, -42.66481018066406, -40.9000244140625, -39.1352424621582, -37.370460510253906, -35.605674743652344, -33.84089279174805, -32.076107025146484, -30.311325073242188, -28.546541213989258, -26.781757354736328, -25.01697540283203, -23.2521915435791, -21.487407684326172, -19.722623825073242, -17.957839965820312, -16.193058013916016, -14.428274154663086, -12.663490295410156, -10.898707389831543, -9.13392448425293, -7.369140625, -5.6043572425842285, -3.839573860168457, -2.0747904777526855, -0.31000709533691406, 1.4547767639160156, 3.219559669494629, 4.984342575073242, 6.749126434326172, 8.513910293579102, 10.278693199157715, 12.043476104736328, 13.808259963989258, 15.573043823242188, 17.337825775146484, 19.102609634399414, 20.867393493652344, 22.632177352905273, 24.396961212158203, 26.1617431640625, 27.92652702331543, 29.69131088256836, 31.456092834472656, 33.22087860107422, 34.985660552978516, 36.75044250488281, 38.515228271484375, 40.28001022338867, 42.04479217529297, 43.80957794189453, 45.57435989379883, 47.339141845703125, 49.10392761230469]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 12.0, 15.0, 24.0, 17.0, 17.0, 24.0, 39.0, 32.0, 26.0, 27.0, 35.0, 43.0, 44.0, 51.0, 47.0, 48.0, 51.0, 44.0, 45.0, 51.0, 36.0, 31.0, 38.0, 20.0, 32.0, 22.0, 23.0, 22.0, 17.0, 13.0, 13.0, 4.0, 8.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.48046875, -7.26971435546875, -7.0589599609375, -6.84820556640625, -6.637451171875, -6.42669677734375, -6.2159423828125, -6.00518798828125, -5.79443359375, -5.58367919921875, -5.3729248046875, -5.16217041015625, -4.951416015625, -4.74066162109375, -4.5299072265625, -4.31915283203125, -4.1083984375, -3.89764404296875, -3.6868896484375, -3.47613525390625, -3.265380859375, -3.05462646484375, -2.8438720703125, -2.63311767578125, -2.42236328125, -2.21160888671875, -2.0008544921875, -1.79010009765625, -1.579345703125, -1.36859130859375, -1.1578369140625, -0.94708251953125, -0.736328125, -0.52557373046875, -0.3148193359375, -0.10406494140625, 0.106689453125, 0.31744384765625, 0.5281982421875, 0.73895263671875, 0.94970703125, 1.16046142578125, 1.3712158203125, 1.58197021484375, 1.792724609375, 2.00347900390625, 2.2142333984375, 2.42498779296875, 2.6357421875, 2.84649658203125, 3.0572509765625, 3.26800537109375, 3.478759765625, 3.68951416015625, 3.9002685546875, 4.11102294921875, 4.32177734375, 4.53253173828125, 4.7432861328125, 4.95404052734375, 5.164794921875, 5.37554931640625, 5.5863037109375, 5.79705810546875, 6.0078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 10.0, 15.0, 34.0, 26.0, 37.0, 58.0, 78.0, 142.0, 242.0, 459.0, 858.0, 1774.0, 3957.0, 10070.0, 28845.0, 103848.0, 467873.0, 1595144.0, 1454418.0, 396932.0, 88526.0, 25260.0, 8693.0, 3535.0, 1629.0, 831.0, 401.0, 220.0, 141.0, 79.0, 49.0, 31.0, 20.0, 15.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8555908203125, -8.578369140625, -8.3011474609375, -8.02392578125, -7.7467041015625, -7.469482421875, -7.1922607421875, -6.9150390625, -6.6378173828125, -6.360595703125, -6.0833740234375, -5.80615234375, -5.5289306640625, -5.251708984375, -4.9744873046875, -4.697265625, -4.4200439453125, -4.142822265625, -3.8656005859375, -3.58837890625, -3.3111572265625, -3.033935546875, -2.7567138671875, -2.4794921875, -2.2022705078125, -1.925048828125, -1.6478271484375, -1.37060546875, -1.0933837890625, -0.816162109375, -0.5389404296875, -0.26171875, 0.0155029296875, 0.292724609375, 0.5699462890625, 0.84716796875, 1.1243896484375, 1.401611328125, 1.6788330078125, 1.9560546875, 2.2332763671875, 2.510498046875, 2.7877197265625, 3.06494140625, 3.3421630859375, 3.619384765625, 3.8966064453125, 4.173828125, 4.4510498046875, 4.728271484375, 5.0054931640625, 5.28271484375, 5.5599365234375, 5.837158203125, 6.1143798828125, 6.3916015625, 6.6688232421875, 6.946044921875, 7.2232666015625, 7.50048828125, 7.7777099609375, 8.054931640625, 8.3321533203125, 8.609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 9.0, 12.0, 11.0, 25.0, 25.0, 28.0, 36.0, 46.0, 78.0, 79.0, 119.0, 161.0, 217.0, 282.0, 306.0, 391.0, 454.0, 393.0, 333.0, 251.0, 180.0, 142.0, 89.0, 96.0, 55.0, 60.0, 36.0, 34.0, 30.0, 18.0, 16.0, 8.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 6.0, 0.0, 1.0, 3.0, 1.0], "bins": [-11.171875, -10.85595703125, -10.5400390625, -10.22412109375, -9.908203125, -9.59228515625, -9.2763671875, -8.96044921875, -8.64453125, -8.32861328125, -8.0126953125, -7.69677734375, -7.380859375, -7.06494140625, -6.7490234375, -6.43310546875, -6.1171875, -5.80126953125, -5.4853515625, -5.16943359375, -4.853515625, -4.53759765625, -4.2216796875, -3.90576171875, -3.58984375, -3.27392578125, -2.9580078125, -2.64208984375, -2.326171875, -2.01025390625, -1.6943359375, -1.37841796875, -1.0625, -0.74658203125, -0.4306640625, -0.11474609375, 0.201171875, 0.51708984375, 0.8330078125, 1.14892578125, 1.46484375, 1.78076171875, 2.0966796875, 2.41259765625, 2.728515625, 3.04443359375, 3.3603515625, 3.67626953125, 3.9921875, 4.30810546875, 4.6240234375, 4.93994140625, 5.255859375, 5.57177734375, 5.8876953125, 6.20361328125, 6.51953125, 6.83544921875, 7.1513671875, 7.46728515625, 7.783203125, 8.09912109375, 8.4150390625, 8.73095703125, 9.046875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 16.0, 28.0, 29.0, 40.0, 66.0, 93.0, 83.0, 157.0, 231.0, 357.0, 676.0, 1742.0, 15682.0, 1046227.0, 3088037.0, 35982.0, 2658.0, 874.0, 439.0, 281.0, 142.0, 98.0, 85.0, 54.0, 48.0, 38.0, 17.0, 20.0, 11.0, 10.0, 8.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.46630859375, -30.2138671875, -28.96142578125, -27.708984375, -26.45654296875, -25.2041015625, -23.95166015625, -22.69921875, -21.44677734375, -20.1943359375, -18.94189453125, -17.689453125, -16.43701171875, -15.1845703125, -13.93212890625, -12.6796875, -11.42724609375, -10.1748046875, -8.92236328125, -7.669921875, -6.41748046875, -5.1650390625, -3.91259765625, -2.66015625, -1.40771484375, -0.1552734375, 1.09716796875, 2.349609375, 3.60205078125, 4.8544921875, 6.10693359375, 7.359375, 8.61181640625, 9.8642578125, 11.11669921875, 12.369140625, 13.62158203125, 14.8740234375, 16.12646484375, 17.37890625, 18.63134765625, 19.8837890625, 21.13623046875, 22.388671875, 23.64111328125, 24.8935546875, 26.14599609375, 27.3984375, 28.65087890625, 29.9033203125, 31.15576171875, 32.408203125, 33.66064453125, 34.9130859375, 36.16552734375, 37.41796875, 38.67041015625, 39.9228515625, 41.17529296875, 42.427734375, 43.68017578125, 44.9326171875, 46.18505859375, 47.4375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 19.0, 164.0, 429.0, 322.0, 76.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.21986389160156, -201.86439514160156, -195.50894165039062, -189.15347290039062, -182.79800415039062, -176.44253540039062, -170.08706665039062, -163.7316131591797, -157.3761444091797, -151.0206756591797, -144.66522216796875, -138.30975341796875, -131.95428466796875, -125.59881591796875, -119.24335479736328, -112.88789367675781, -106.53242492675781, -100.17695617675781, -93.82149505615234, -87.46603393554688, -81.11056518554688, -74.75509643554688, -68.3996353149414, -62.04417037963867, -55.68870544433594, -49.3332405090332, -42.97777557373047, -36.622310638427734, -30.266845703125, -23.911380767822266, -17.55591583251953, -11.200450897216797, -4.845001220703125, 1.5104637145996094, 7.865928649902344, 14.221393585205078, 20.576858520507812, 26.932323455810547, 33.28778839111328, 39.643253326416016, 45.99871826171875, 52.354183197021484, 58.70964813232422, 65.06510925292969, 71.42057800292969, 77.77604675292969, 84.13150787353516, 90.48696899414062, 96.84243774414062, 103.19790649414062, 109.5533676147461, 115.90882873535156, 122.26429748535156, 128.61976623535156, 134.9752197265625, 141.3306884765625, 147.6861572265625, 154.0416259765625, 160.3970947265625, 166.75254821777344, 173.10801696777344, 179.46348571777344, 185.81893920898438, 192.17440795898438, 198.52987670898438]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 7.0, 13.0, 12.0, 9.0, 14.0, 15.0, 18.0, 16.0, 24.0, 22.0, 28.0, 33.0, 35.0, 38.0, 44.0, 45.0, 47.0, 42.0, 38.0, 49.0, 38.0, 37.0, 30.0, 35.0, 38.0, 28.0, 31.0, 29.0, 34.0, 24.0, 21.0, 22.0, 15.0, 16.0, 13.0, 9.0, 6.0, 5.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.673431396484375, -39.45307540893555, -38.23271942138672, -37.012367248535156, -35.79201126098633, -34.5716552734375, -33.35130310058594, -32.13094711303711, -30.91059112548828, -29.690235137939453, -28.469881057739258, -27.249526977539062, -26.029170989990234, -24.808815002441406, -23.58846092224121, -22.368106842041016, -21.147750854492188, -19.92739486694336, -18.707040786743164, -17.48668670654297, -16.26633071899414, -15.045975685119629, -13.825620651245117, -12.605265617370605, -11.384910583496094, -10.164555549621582, -8.94420051574707, -7.723845481872559, -6.503490447998047, -5.283135414123535, -4.062780380249023, -2.8424253463745117, -1.6220703125, -0.4017152786254883, 0.8186397552490234, 2.038994789123535, 3.259349822998047, 4.479704856872559, 5.70005989074707, 6.920414924621582, 8.140769958496094, 9.361124992370605, 10.581480026245117, 11.801835060119629, 13.02219009399414, 14.242545127868652, 15.462900161743164, 16.68325424194336, 17.903610229492188, 19.123966217041016, 20.34432029724121, 21.564674377441406, 22.785030364990234, 24.005386352539062, 25.225740432739258, 26.446094512939453, 27.66645050048828, 28.88680648803711, 30.107160568237305, 31.3275146484375, 32.54787063598633, 33.768226623535156, 34.98857879638672, 36.20893478393555, 37.429290771484375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 12.0, 13.0, 13.0, 23.0, 22.0, 22.0, 33.0, 22.0, 22.0, 42.0, 32.0, 33.0, 45.0, 51.0, 44.0, 46.0, 43.0, 40.0, 39.0, 39.0, 44.0, 41.0, 37.0, 36.0, 28.0, 16.0, 25.0, 22.0, 21.0, 23.0, 14.0, 9.0, 10.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.907958984375, -5.71044921875, -5.512939453125, -5.3154296875, -5.117919921875, -4.92041015625, -4.722900390625, -4.525390625, -4.327880859375, -4.13037109375, -3.932861328125, -3.7353515625, -3.537841796875, -3.34033203125, -3.142822265625, -2.9453125, -2.747802734375, -2.55029296875, -2.352783203125, -2.1552734375, -1.957763671875, -1.76025390625, -1.562744140625, -1.365234375, -1.167724609375, -0.97021484375, -0.772705078125, -0.5751953125, -0.377685546875, -0.18017578125, 0.017333984375, 0.21484375, 0.412353515625, 0.60986328125, 0.807373046875, 1.0048828125, 1.202392578125, 1.39990234375, 1.597412109375, 1.794921875, 1.992431640625, 2.18994140625, 2.387451171875, 2.5849609375, 2.782470703125, 2.97998046875, 3.177490234375, 3.375, 3.572509765625, 3.77001953125, 3.967529296875, 4.1650390625, 4.362548828125, 4.56005859375, 4.757568359375, 4.955078125, 5.152587890625, 5.35009765625, 5.547607421875, 5.7451171875, 5.942626953125, 6.14013671875, 6.337646484375, 6.53515625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 8.0, 4.0, 9.0, 9.0, 12.0, 19.0, 25.0, 46.0, 81.0, 84.0, 145.0, 210.0, 309.0, 470.0, 761.0, 990.0, 1438.0, 2200.0, 3283.0, 4676.0, 6860.0, 10493.0, 15725.0, 22757.0, 33423.0, 49001.0, 69196.0, 96117.0, 122301.0, 140743.0, 127556.0, 101247.0, 73989.0, 52369.0, 36017.0, 24677.0, 16505.0, 11257.0, 7621.0, 5162.0, 3464.0, 2274.0, 1686.0, 1055.0, 703.0, 502.0, 344.0, 237.0, 176.0, 128.0, 68.0, 49.0, 27.0, 20.0, 10.0, 16.0, 7.0, 3.0, 4.0, 1.0, 2.0], "bins": [-0.6953125, -0.673980712890625, -0.65264892578125, -0.631317138671875, -0.6099853515625, -0.588653564453125, -0.56732177734375, -0.545989990234375, -0.524658203125, -0.503326416015625, -0.48199462890625, -0.460662841796875, -0.4393310546875, -0.417999267578125, -0.39666748046875, -0.375335693359375, -0.35400390625, -0.332672119140625, -0.31134033203125, -0.290008544921875, -0.2686767578125, -0.247344970703125, -0.22601318359375, -0.204681396484375, -0.183349609375, -0.162017822265625, -0.14068603515625, -0.119354248046875, -0.0980224609375, -0.076690673828125, -0.05535888671875, -0.034027099609375, -0.0126953125, 0.008636474609375, 0.02996826171875, 0.051300048828125, 0.0726318359375, 0.093963623046875, 0.11529541015625, 0.136627197265625, 0.157958984375, 0.179290771484375, 0.20062255859375, 0.221954345703125, 0.2432861328125, 0.264617919921875, 0.28594970703125, 0.307281494140625, 0.32861328125, 0.349945068359375, 0.37127685546875, 0.392608642578125, 0.4139404296875, 0.435272216796875, 0.45660400390625, 0.477935791015625, 0.499267578125, 0.520599365234375, 0.54193115234375, 0.563262939453125, 0.5845947265625, 0.605926513671875, 0.62725830078125, 0.648590087890625, 0.669921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 11.0, 4.0, 11.0, 11.0, 7.0, 14.0, 16.0, 21.0, 15.0, 21.0, 30.0, 25.0, 21.0, 34.0, 36.0, 19.0, 29.0, 35.0, 37.0, 43.0, 46.0, 1064.0, 36.0, 37.0, 34.0, 33.0, 34.0, 34.0, 28.0, 25.0, 20.0, 25.0, 21.0, 22.0, 25.0, 12.0, 15.0, 10.0, 11.0, 12.0, 5.0, 10.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.5703125, -3.4600830078125, -3.349853515625, -3.2396240234375, -3.12939453125, -3.0191650390625, -2.908935546875, -2.7987060546875, -2.6884765625, -2.5782470703125, -2.468017578125, -2.3577880859375, -2.24755859375, -2.1373291015625, -2.027099609375, -1.9168701171875, -1.806640625, -1.6964111328125, -1.586181640625, -1.4759521484375, -1.36572265625, -1.2554931640625, -1.145263671875, -1.0350341796875, -0.9248046875, -0.8145751953125, -0.704345703125, -0.5941162109375, -0.48388671875, -0.3736572265625, -0.263427734375, -0.1531982421875, -0.04296875, 0.0672607421875, 0.177490234375, 0.2877197265625, 0.39794921875, 0.5081787109375, 0.618408203125, 0.7286376953125, 0.8388671875, 0.9490966796875, 1.059326171875, 1.1695556640625, 1.27978515625, 1.3900146484375, 1.500244140625, 1.6104736328125, 1.720703125, 1.8309326171875, 1.941162109375, 2.0513916015625, 2.16162109375, 2.2718505859375, 2.382080078125, 2.4923095703125, 2.6025390625, 2.7127685546875, 2.822998046875, 2.9332275390625, 3.04345703125, 3.1536865234375, 3.263916015625, 3.3741455078125, 3.484375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 4.0, 14.0, 18.0, 30.0, 39.0, 71.0, 97.0, 129.0, 205.0, 283.0, 433.0, 628.0, 844.0, 1325.0, 2054.0, 3077.0, 4568.0, 6899.0, 10489.0, 15814.0, 23787.0, 35584.0, 53025.0, 76809.0, 107047.0, 136778.0, 1189898.0, 125479.0, 95795.0, 67158.0, 46627.0, 30920.0, 20940.0, 13537.0, 8924.0, 5997.0, 3882.0, 2482.0, 1720.0, 1223.0, 757.0, 600.0, 391.0, 229.0, 161.0, 121.0, 79.0, 52.0, 44.0, 27.0, 15.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0], "bins": [-0.4404296875, -0.4272117614746094, -0.41399383544921875, -0.4007759094238281, -0.3875579833984375, -0.3743400573730469, -0.36112213134765625, -0.3479042053222656, -0.334686279296875, -0.3214683532714844, -0.30825042724609375, -0.2950325012207031, -0.2818145751953125, -0.2685966491699219, -0.25537872314453125, -0.24216079711914062, -0.22894287109375, -0.21572494506835938, -0.20250701904296875, -0.18928909301757812, -0.1760711669921875, -0.16285324096679688, -0.14963531494140625, -0.13641738891601562, -0.123199462890625, -0.10998153686523438, -0.09676361083984375, -0.08354568481445312, -0.0703277587890625, -0.057109832763671875, -0.04389190673828125, -0.030673980712890625, -0.0174560546875, -0.004238128662109375, 0.00897979736328125, 0.022197723388671875, 0.0354156494140625, 0.048633575439453125, 0.06185150146484375, 0.07506942749023438, 0.088287353515625, 0.10150527954101562, 0.11472320556640625, 0.12794113159179688, 0.1411590576171875, 0.15437698364257812, 0.16759490966796875, 0.18081283569335938, 0.19403076171875, 0.20724868774414062, 0.22046661376953125, 0.23368453979492188, 0.2469024658203125, 0.2601203918457031, 0.27333831787109375, 0.2865562438964844, 0.299774169921875, 0.3129920959472656, 0.32621002197265625, 0.3394279479980469, 0.3526458740234375, 0.3658638000488281, 0.37908172607421875, 0.3922996520996094, 0.405517578125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 4.0, 12.0, 11.0, 16.0, 21.0, 19.0, 49.0, 86.0, 97.0, 123.0, 103.0, 113.0, 117.0, 67.0, 49.0, 24.0, 16.0, 12.0, 7.0, 6.0, 10.0, 9.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0104827880859375, -0.010088324546813965, -0.00969386100769043, -0.009299397468566895, -0.00890493392944336, -0.008510470390319824, -0.008116006851196289, -0.007721543312072754, -0.007327079772949219, -0.006932616233825684, -0.0065381526947021484, -0.006143689155578613, -0.005749225616455078, -0.005354762077331543, -0.004960298538208008, -0.004565834999084473, -0.0041713714599609375, -0.0037769079208374023, -0.003382444381713867, -0.002987980842590332, -0.002593517303466797, -0.0021990537643432617, -0.0018045902252197266, -0.0014101266860961914, -0.0010156631469726562, -0.0006211996078491211, -0.00022673606872558594, 0.00016772747039794922, 0.0005621910095214844, 0.0009566545486450195, 0.0013511180877685547, 0.0017455816268920898, 0.002140045166015625, 0.00253450870513916, 0.0029289722442626953, 0.0033234357833862305, 0.0037178993225097656, 0.004112362861633301, 0.004506826400756836, 0.004901289939880371, 0.005295753479003906, 0.005690217018127441, 0.0060846805572509766, 0.006479144096374512, 0.006873607635498047, 0.007268071174621582, 0.007662534713745117, 0.008056998252868652, 0.008451461791992188, 0.008845925331115723, 0.009240388870239258, 0.009634852409362793, 0.010029315948486328, 0.010423779487609863, 0.010818243026733398, 0.011212706565856934, 0.011607170104980469, 0.012001633644104004, 0.012396097183227539, 0.012790560722351074, 0.01318502426147461, 0.013579487800598145, 0.01397395133972168, 0.014368414878845215, 0.01476287841796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 1.0, 6.0, 10.0, 11.0, 11.0, 14.0, 26.0, 33.0, 42.0, 95.0, 255.0, 1535.0, 52622.0, 977327.0, 15291.0, 836.0, 191.0, 79.0, 46.0, 28.0, 25.0, 18.0, 13.0, 7.0, 2.0, 8.0, 8.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.301025390625, -0.2922630310058594, -0.28350067138671875, -0.2747383117675781, -0.2659759521484375, -0.2572135925292969, -0.24845123291015625, -0.23968887329101562, -0.230926513671875, -0.22216415405273438, -0.21340179443359375, -0.20463943481445312, -0.1958770751953125, -0.18711471557617188, -0.17835235595703125, -0.16958999633789062, -0.16082763671875, -0.15206527709960938, -0.14330291748046875, -0.13454055786132812, -0.1257781982421875, -0.11701583862304688, -0.10825347900390625, -0.09949111938476562, -0.090728759765625, -0.08196640014648438, -0.07320404052734375, -0.06444168090820312, -0.0556793212890625, -0.046916961669921875, -0.03815460205078125, -0.029392242431640625, -0.0206298828125, -0.011867523193359375, -0.00310516357421875, 0.005657196044921875, 0.0144195556640625, 0.023181915283203125, 0.03194427490234375, 0.040706634521484375, 0.049468994140625, 0.058231353759765625, 0.06699371337890625, 0.07575607299804688, 0.0845184326171875, 0.09328079223632812, 0.10204315185546875, 0.11080551147460938, 0.11956787109375, 0.12833023071289062, 0.13709259033203125, 0.14585494995117188, 0.1546173095703125, 0.16337966918945312, 0.17214202880859375, 0.18090438842773438, 0.189666748046875, 0.19842910766601562, 0.20719146728515625, 0.21595382690429688, 0.2247161865234375, 0.23347854614257812, 0.24224090576171875, 0.2510032653808594, 0.259765625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 8.0, 9.0, 12.0, 13.0, 28.0, 36.0, 86.0, 135.0, 261.0, 193.0, 81.0, 47.0, 39.0, 25.0, 12.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0780419185757637, -0.07640847563743591, -0.07477504014968872, -0.07314159721136093, -0.07150816172361374, -0.06987471878528595, -0.06824128329753876, -0.06660784035921097, -0.06497440487146378, -0.06334096193313599, -0.061707526445388794, -0.0600740872323513, -0.05844064801931381, -0.05680720880627632, -0.05517376959323883, -0.05354032665491104, -0.05190688744187355, -0.05027344822883606, -0.04864000901579857, -0.04700656980276108, -0.04537313058972359, -0.043739691376686096, -0.04210624843835831, -0.040472812950611115, -0.038839370012283325, -0.037205930799245834, -0.035572491586208344, -0.03393905237317085, -0.03230561316013336, -0.03067217394709587, -0.02903873287141323, -0.02740529365837574, -0.025771858170628548, -0.024138418957591057, -0.022504979744553566, -0.020871538668870926, -0.019238099455833435, -0.017604660242795944, -0.015971221029758453, -0.014337781816720963, -0.012704342603683472, -0.01107090339064598, -0.00943746417760849, -0.0078040240332484245, -0.006170584820210934, -0.004537145607173443, -0.0029037054628133774, -0.0012702662497758865, 0.0003631729632616043, 0.001996612409129739, 0.0036300518549978733, 0.0052634915336966515, 0.006896930746734142, 0.008530369959771633, 0.010163810104131699, 0.01179724931716919, 0.01343068853020668, 0.015064127743244171, 0.016697566956281662, 0.018331006169319153, 0.019964445382356644, 0.021597884595394135, 0.023231325671076775, 0.024864764884114265, 0.026498204097151756]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 2.0, 8.0, 6.0, 12.0, 8.0, 15.0, 9.0, 19.0, 17.0, 17.0, 19.0, 17.0, 28.0, 36.0, 36.0, 29.0, 40.0, 35.0, 39.0, 42.0, 51.0, 54.0, 28.0, 33.0, 40.0, 35.0, 27.0, 33.0, 29.0, 33.0, 23.0, 25.0, 22.0, 23.0, 11.0, 20.0, 15.0, 16.0, 7.0, 10.0, 9.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.006200432777404785, -0.006025218404829502, -0.005850004032254219, -0.005674789659678936, -0.005499575287103653, -0.00532436091452837, -0.005149146541953087, -0.004973932169377804, -0.004798717796802521, -0.004623503424227238, -0.004448289051651955, -0.004273074679076672, -0.0040978603065013885, -0.0039226459339261055, -0.0037474315613508224, -0.0035722171887755394, -0.0033970028162002563, -0.0032217884436249733, -0.0030465740710496902, -0.002871359698474407, -0.002696145325899124, -0.002520930953323841, -0.002345716580748558, -0.002170502208173275, -0.001995287835597992, -0.001820073463022709, -0.0016448590904474258, -0.0014696447178721428, -0.0012944303452968597, -0.0011192159727215767, -0.0009440016001462936, -0.0007687872275710106, -0.0005935728549957275, -0.0004183584824204445, -0.00024314410984516144, -6.792973726987839e-05, 0.00010728463530540466, 0.0002824990078806877, 0.00045771338045597076, 0.0006329277530312538, 0.0008081421256065369, 0.00098335649818182, 0.001158570870757103, 0.001333785243332386, 0.001508999615907669, 0.0016842139884829521, 0.0018594283610582352, 0.0020346427336335182, 0.0022098571062088013, 0.0023850714787840843, 0.0025602858513593674, 0.0027355002239346504, 0.0029107145965099335, 0.0030859289690852165, 0.0032611433416604996, 0.0034363577142357826, 0.0036115720868110657, 0.0037867864593863487, 0.003962000831961632, 0.004137215204536915, 0.004312429577112198, 0.004487643949687481, 0.004662858322262764, 0.004838072694838047, 0.00501328706741333]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 11.0, 12.0, 13.0, 13.0, 23.0, 22.0, 22.0, 33.0, 22.0, 22.0, 42.0, 32.0, 33.0, 45.0, 51.0, 44.0, 46.0, 43.0, 40.0, 39.0, 39.0, 44.0, 42.0, 36.0, 36.0, 28.0, 16.0, 25.0, 22.0, 21.0, 23.0, 14.0, 9.0, 10.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.10546875, -5.907958984375, -5.71044921875, -5.512939453125, -5.3154296875, -5.117919921875, -4.92041015625, -4.722900390625, -4.525390625, -4.327880859375, -4.13037109375, -3.932861328125, -3.7353515625, -3.537841796875, -3.34033203125, -3.142822265625, -2.9453125, -2.747802734375, -2.55029296875, -2.352783203125, -2.1552734375, -1.957763671875, -1.76025390625, -1.562744140625, -1.365234375, -1.167724609375, -0.97021484375, -0.772705078125, -0.5751953125, -0.377685546875, -0.18017578125, 0.017333984375, 0.21484375, 0.412353515625, 0.60986328125, 0.807373046875, 1.0048828125, 1.202392578125, 1.39990234375, 1.597412109375, 1.794921875, 1.992431640625, 2.18994140625, 2.387451171875, 2.5849609375, 2.782470703125, 2.97998046875, 3.177490234375, 3.375, 3.572509765625, 3.77001953125, 3.967529296875, 4.1650390625, 4.362548828125, 4.56005859375, 4.757568359375, 4.955078125, 5.152587890625, 5.35009765625, 5.547607421875, 5.7451171875, 5.942626953125, 6.14013671875, 6.337646484375, 6.53515625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 7.0, 13.0, 19.0, 24.0, 36.0, 63.0, 78.0, 157.0, 282.0, 510.0, 912.0, 1743.0, 3447.0, 6825.0, 13785.0, 28507.0, 65247.0, 176158.0, 382842.0, 221441.0, 80051.0, 33629.0, 16148.0, 8140.0, 4106.0, 2001.0, 1081.0, 529.0, 317.0, 159.0, 107.0, 78.0, 32.0, 24.0, 13.0, 10.0, 6.0, 10.0, 1.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.05859375, -5.872802734375, -5.68701171875, -5.501220703125, -5.3154296875, -5.129638671875, -4.94384765625, -4.758056640625, -4.572265625, -4.386474609375, -4.20068359375, -4.014892578125, -3.8291015625, -3.643310546875, -3.45751953125, -3.271728515625, -3.0859375, -2.900146484375, -2.71435546875, -2.528564453125, -2.3427734375, -2.156982421875, -1.97119140625, -1.785400390625, -1.599609375, -1.413818359375, -1.22802734375, -1.042236328125, -0.8564453125, -0.670654296875, -0.48486328125, -0.299072265625, -0.11328125, 0.072509765625, 0.25830078125, 0.444091796875, 0.6298828125, 0.815673828125, 1.00146484375, 1.187255859375, 1.373046875, 1.558837890625, 1.74462890625, 1.930419921875, 2.1162109375, 2.302001953125, 2.48779296875, 2.673583984375, 2.859375, 3.045166015625, 3.23095703125, 3.416748046875, 3.6025390625, 3.788330078125, 3.97412109375, 4.159912109375, 4.345703125, 4.531494140625, 4.71728515625, 4.903076171875, 5.0888671875, 5.274658203125, 5.46044921875, 5.646240234375, 5.83203125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 5.0, 8.0, 4.0, 9.0, 7.0, 13.0, 10.0, 23.0, 12.0, 14.0, 18.0, 22.0, 27.0, 24.0, 30.0, 33.0, 34.0, 38.0, 35.0, 54.0, 58.0, 96.0, 275.0, 1469.0, 204.0, 75.0, 60.0, 53.0, 37.0, 29.0, 29.0, 31.0, 16.0, 31.0, 21.0, 16.0, 23.0, 21.0, 9.0, 8.0, 12.0, 10.0, 9.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.984375, -17.4287109375, -16.873046875, -16.3173828125, -15.76171875, -15.2060546875, -14.650390625, -14.0947265625, -13.5390625, -12.9833984375, -12.427734375, -11.8720703125, -11.31640625, -10.7607421875, -10.205078125, -9.6494140625, -9.09375, -8.5380859375, -7.982421875, -7.4267578125, -6.87109375, -6.3154296875, -5.759765625, -5.2041015625, -4.6484375, -4.0927734375, -3.537109375, -2.9814453125, -2.42578125, -1.8701171875, -1.314453125, -0.7587890625, -0.203125, 0.3525390625, 0.908203125, 1.4638671875, 2.01953125, 2.5751953125, 3.130859375, 3.6865234375, 4.2421875, 4.7978515625, 5.353515625, 5.9091796875, 6.46484375, 7.0205078125, 7.576171875, 8.1318359375, 8.6875, 9.2431640625, 9.798828125, 10.3544921875, 10.91015625, 11.4658203125, 12.021484375, 12.5771484375, 13.1328125, 13.6884765625, 14.244140625, 14.7998046875, 15.35546875, 15.9111328125, 16.466796875, 17.0224609375, 17.578125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 8.0, 10.0, 11.0, 12.0, 12.0, 14.0, 15.0, 26.0, 26.0, 34.0, 44.0, 63.0, 77.0, 88.0, 122.0, 181.0, 297.0, 481.0, 1320.0, 6562.0, 121067.0, 2908225.0, 98373.0, 5727.0, 1313.0, 512.0, 272.0, 169.0, 129.0, 105.0, 70.0, 74.0, 51.0, 34.0, 40.0, 19.0, 28.0, 10.0, 16.0, 9.0, 14.0, 13.0, 6.0, 9.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-31.796875, -30.846923828125, -29.89697265625, -28.947021484375, -27.9970703125, -27.047119140625, -26.09716796875, -25.147216796875, -24.197265625, -23.247314453125, -22.29736328125, -21.347412109375, -20.3974609375, -19.447509765625, -18.49755859375, -17.547607421875, -16.59765625, -15.647705078125, -14.69775390625, -13.747802734375, -12.7978515625, -11.847900390625, -10.89794921875, -9.947998046875, -8.998046875, -8.048095703125, -7.09814453125, -6.148193359375, -5.1982421875, -4.248291015625, -3.29833984375, -2.348388671875, -1.3984375, -0.448486328125, 0.50146484375, 1.451416015625, 2.4013671875, 3.351318359375, 4.30126953125, 5.251220703125, 6.201171875, 7.151123046875, 8.10107421875, 9.051025390625, 10.0009765625, 10.950927734375, 11.90087890625, 12.850830078125, 13.80078125, 14.750732421875, 15.70068359375, 16.650634765625, 17.6005859375, 18.550537109375, 19.50048828125, 20.450439453125, 21.400390625, 22.350341796875, 23.30029296875, 24.250244140625, 25.2001953125, 26.150146484375, 27.10009765625, 28.050048828125, 29.0]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 37.0, 817.0, 161.0, 3.0, 0.0, 0.0, 1.0], "bins": [-490.7801208496094, -482.40802001953125, -474.035888671875, -465.6637878417969, -457.2916564941406, -448.9195556640625, -440.54742431640625, -432.1753234863281, -423.80322265625, -415.4311218261719, -407.0589904785156, -398.6868896484375, -390.31475830078125, -381.9426574707031, -373.570556640625, -365.19842529296875, -356.8262939453125, -348.4541931152344, -340.0820617675781, -331.7099609375, -323.33782958984375, -314.9657287597656, -306.5936279296875, -298.22149658203125, -289.8493957519531, -281.477294921875, -273.10516357421875, -264.7330627441406, -256.3609313964844, -247.98883056640625, -239.61671447753906, -231.24459838867188, -222.87249755859375, -214.50038146972656, -206.12826538085938, -197.75616455078125, -189.38404846191406, -181.01193237304688, -172.6398162841797, -164.2677001953125, -155.8955841064453, -147.52346801757812, -139.15135192871094, -130.77923583984375, -122.40713500976562, -114.03501892089844, -105.66290283203125, -97.29078674316406, -88.9186782836914, -80.54656219482422, -72.17445373535156, -63.802337646484375, -55.43022537231445, -47.05811309814453, -38.685997009277344, -30.313884735107422, -21.9417724609375, -13.569659233093262, -5.197546005249023, 3.1745681762695312, 11.546680450439453, 19.918792724609375, 28.290908813476562, 36.663021087646484, 45.035133361816406]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 11.0, 5.0, 11.0, 21.0, 20.0, 26.0, 27.0, 29.0, 36.0, 37.0, 38.0, 39.0, 58.0, 33.0, 28.0, 45.0, 42.0, 45.0, 44.0, 29.0, 44.0, 39.0, 32.0, 27.0, 26.0, 28.0, 25.0, 25.0, 31.0, 10.0, 19.0, 11.0, 12.0, 9.0, 8.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.85529327392578, -48.191490173339844, -46.52769088745117, -44.8638916015625, -43.20008850097656, -41.536285400390625, -39.87248611450195, -38.20868682861328, -36.544883728027344, -34.881080627441406, -33.217281341552734, -31.55348014831543, -29.889678955078125, -28.22587776184082, -26.562076568603516, -24.89827537536621, -23.234474182128906, -21.5706729888916, -19.906871795654297, -18.243070602416992, -16.579269409179688, -14.915468215942383, -13.251667022705078, -11.587865829467773, -9.924064636230469, -8.260263442993164, -6.596462249755859, -4.932661056518555, -3.26885986328125, -1.6050586700439453, 0.058742523193359375, 1.722543716430664, 3.3863449096679688, 5.050146102905273, 6.713947296142578, 8.377748489379883, 10.041549682617188, 11.705350875854492, 13.369152069091797, 15.032953262329102, 16.696754455566406, 18.36055564880371, 20.024356842041016, 21.68815803527832, 23.351959228515625, 25.01576042175293, 26.679561614990234, 28.34336280822754, 30.007164001464844, 31.67096519470215, 33.33476638793945, 34.998565673828125, 36.66236877441406, 38.326171875, 39.98997116088867, 41.653770446777344, 43.31757354736328, 44.98137664794922, 46.64517593383789, 48.30897521972656, 49.9727783203125, 51.63658142089844, 53.30038070678711, 54.96417999267578, 56.62798309326172]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 5.0, 8.0, 9.0, 11.0, 20.0, 24.0, 18.0, 23.0, 23.0, 48.0, 35.0, 35.0, 40.0, 54.0, 41.0, 47.0, 58.0, 45.0, 42.0, 50.0, 44.0, 51.0, 37.0, 38.0, 42.0, 26.0, 20.0, 22.0, 27.0, 12.0, 16.0, 10.0, 4.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.83416748046875, -6.6058349609375, -6.37750244140625, -6.149169921875, -5.92083740234375, -5.6925048828125, -5.46417236328125, -5.23583984375, -5.00750732421875, -4.7791748046875, -4.55084228515625, -4.322509765625, -4.09417724609375, -3.8658447265625, -3.63751220703125, -3.4091796875, -3.18084716796875, -2.9525146484375, -2.72418212890625, -2.495849609375, -2.26751708984375, -2.0391845703125, -1.81085205078125, -1.58251953125, -1.35418701171875, -1.1258544921875, -0.89752197265625, -0.669189453125, -0.44085693359375, -0.2125244140625, 0.01580810546875, 0.244140625, 0.47247314453125, 0.7008056640625, 0.92913818359375, 1.157470703125, 1.38580322265625, 1.6141357421875, 1.84246826171875, 2.07080078125, 2.29913330078125, 2.5274658203125, 2.75579833984375, 2.984130859375, 3.21246337890625, 3.4407958984375, 3.66912841796875, 3.8974609375, 4.12579345703125, 4.3541259765625, 4.58245849609375, 4.810791015625, 5.03912353515625, 5.2674560546875, 5.49578857421875, 5.72412109375, 5.95245361328125, 6.1807861328125, 6.40911865234375, 6.637451171875, 6.86578369140625, 7.0941162109375, 7.32244873046875, 7.55078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 15.0, 14.0, 18.0, 34.0, 53.0, 62.0, 115.0, 199.0, 529.0, 2258.0, 12897.0, 156399.0, 3099466.0, 878119.0, 37718.0, 4726.0, 942.0, 284.0, 145.0, 71.0, 51.0, 47.0, 25.0, 23.0, 12.0, 12.0, 5.0, 14.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -16.950927734375, -16.29248046875, -15.634033203125, -14.9755859375, -14.317138671875, -13.65869140625, -13.000244140625, -12.341796875, -11.683349609375, -11.02490234375, -10.366455078125, -9.7080078125, -9.049560546875, -8.39111328125, -7.732666015625, -7.07421875, -6.415771484375, -5.75732421875, -5.098876953125, -4.4404296875, -3.781982421875, -3.12353515625, -2.465087890625, -1.806640625, -1.148193359375, -0.48974609375, 0.168701171875, 0.8271484375, 1.485595703125, 2.14404296875, 2.802490234375, 3.4609375, 4.119384765625, 4.77783203125, 5.436279296875, 6.0947265625, 6.753173828125, 7.41162109375, 8.070068359375, 8.728515625, 9.386962890625, 10.04541015625, 10.703857421875, 11.3623046875, 12.020751953125, 12.67919921875, 13.337646484375, 13.99609375, 14.654541015625, 15.31298828125, 15.971435546875, 16.6298828125, 17.288330078125, 17.94677734375, 18.605224609375, 19.263671875, 19.922119140625, 20.58056640625, 21.239013671875, 21.8974609375, 22.555908203125, 23.21435546875, 23.872802734375, 24.53125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 9.0, 7.0, 6.0, 13.0, 20.0, 27.0, 20.0, 37.0, 43.0, 38.0, 71.0, 97.0, 148.0, 173.0, 257.0, 334.0, 423.0, 455.0, 400.0, 363.0, 288.0, 209.0, 161.0, 99.0, 89.0, 61.0, 49.0, 37.0, 26.0, 28.0, 20.0, 20.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.765625, -11.469970703125, -11.17431640625, -10.878662109375, -10.5830078125, -10.287353515625, -9.99169921875, -9.696044921875, -9.400390625, -9.104736328125, -8.80908203125, -8.513427734375, -8.2177734375, -7.922119140625, -7.62646484375, -7.330810546875, -7.03515625, -6.739501953125, -6.44384765625, -6.148193359375, -5.8525390625, -5.556884765625, -5.26123046875, -4.965576171875, -4.669921875, -4.374267578125, -4.07861328125, -3.782958984375, -3.4873046875, -3.191650390625, -2.89599609375, -2.600341796875, -2.3046875, -2.009033203125, -1.71337890625, -1.417724609375, -1.1220703125, -0.826416015625, -0.53076171875, -0.235107421875, 0.060546875, 0.356201171875, 0.65185546875, 0.947509765625, 1.2431640625, 1.538818359375, 1.83447265625, 2.130126953125, 2.42578125, 2.721435546875, 3.01708984375, 3.312744140625, 3.6083984375, 3.904052734375, 4.19970703125, 4.495361328125, 4.791015625, 5.086669921875, 5.38232421875, 5.677978515625, 5.9736328125, 6.269287109375, 6.56494140625, 6.860595703125, 7.15625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 16.0, 23.0, 27.0, 40.0, 43.0, 62.0, 89.0, 101.0, 137.0, 199.0, 302.0, 576.0, 2328.0, 24889.0, 868936.0, 3217032.0, 72652.0, 4632.0, 853.0, 410.0, 268.0, 171.0, 104.0, 81.0, 63.0, 55.0, 42.0, 31.0, 32.0, 22.0, 9.0, 11.0, 8.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.640625, -26.542724609375, -25.44482421875, -24.346923828125, -23.2490234375, -22.151123046875, -21.05322265625, -19.955322265625, -18.857421875, -17.759521484375, -16.66162109375, -15.563720703125, -14.4658203125, -13.367919921875, -12.27001953125, -11.172119140625, -10.07421875, -8.976318359375, -7.87841796875, -6.780517578125, -5.6826171875, -4.584716796875, -3.48681640625, -2.388916015625, -1.291015625, -0.193115234375, 0.90478515625, 2.002685546875, 3.1005859375, 4.198486328125, 5.29638671875, 6.394287109375, 7.4921875, 8.590087890625, 9.68798828125, 10.785888671875, 11.8837890625, 12.981689453125, 14.07958984375, 15.177490234375, 16.275390625, 17.373291015625, 18.47119140625, 19.569091796875, 20.6669921875, 21.764892578125, 22.86279296875, 23.960693359375, 25.05859375, 26.156494140625, 27.25439453125, 28.352294921875, 29.4501953125, 30.548095703125, 31.64599609375, 32.743896484375, 33.841796875, 34.939697265625, 36.03759765625, 37.135498046875, 38.2333984375, 39.331298828125, 40.42919921875, 41.527099609375, 42.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 15.0, 44.0, 99.0, 180.0, 242.0, 237.0, 113.0, 51.0, 15.0, 9.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.2986831665039, -81.35879516601562, -78.41890716552734, -75.47901916503906, -72.53913879394531, -69.59925079345703, -66.65936279296875, -63.71947479248047, -60.77958679199219, -57.839698791503906, -54.899810791015625, -51.95992660522461, -49.02003860473633, -46.08015060424805, -43.14026641845703, -40.20037841796875, -37.26049041748047, -34.32060241699219, -31.38071632385254, -28.44083023071289, -25.50094223022461, -22.561054229736328, -19.62116813659668, -16.68128204345703, -13.74139404296875, -10.801506996154785, -7.86161994934082, -4.9217329025268555, -1.9818458557128906, 0.9580411911010742, 3.897928237915039, 6.8378143310546875, 9.777702331542969, 12.717589378356934, 15.657476425170898, 18.597362518310547, 21.537250518798828, 24.47713851928711, 27.417024612426758, 30.356910705566406, 33.29679870605469, 36.23668670654297, 39.17657470703125, 42.116458892822266, 45.05634689331055, 47.99623489379883, 50.936119079589844, 53.876007080078125, 56.815895080566406, 59.75578308105469, 62.69567108154297, 65.63555908203125, 68.575439453125, 71.51532745361328, 74.45521545410156, 77.39510345458984, 80.33499145507812, 83.2748794555664, 86.21476745605469, 89.15465545654297, 92.09454345703125, 95.034423828125, 97.97431182861328, 100.91419982910156, 103.85408782958984]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 0.0, 4.0, 5.0, 4.0, 7.0, 4.0, 12.0, 10.0, 11.0, 11.0, 17.0, 24.0, 12.0, 31.0, 40.0, 26.0, 25.0, 36.0, 21.0, 30.0, 31.0, 41.0, 39.0, 37.0, 45.0, 29.0, 46.0, 40.0, 38.0, 32.0, 39.0, 26.0, 20.0, 27.0, 27.0, 24.0, 24.0, 21.0, 14.0, 11.0, 11.0, 12.0, 13.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.1907958984375, -31.15462875366211, -30.11846160888672, -29.082294464111328, -28.046127319335938, -27.009960174560547, -25.973791122436523, -24.937623977661133, -23.901456832885742, -22.86528968811035, -21.82912254333496, -20.79295539855957, -19.756786346435547, -18.720619201660156, -17.684452056884766, -16.648284912109375, -15.612117767333984, -14.575950622558594, -13.539783477783203, -12.503615379333496, -11.467448234558105, -10.431281089782715, -9.395112991333008, -8.358945846557617, -7.322778701782227, -6.286611557006836, -5.250443935394287, -4.214276313781738, -3.1781091690063477, -2.141942024230957, -1.1057744026184082, -0.06960678100585938, 0.9665603637695312, 2.002727746963501, 3.0388951301574707, 4.0750627517700195, 5.11122989654541, 6.147397041320801, 7.18356466293335, 8.219732284545898, 9.255899429321289, 10.29206657409668, 11.32823371887207, 12.364401817321777, 13.400568962097168, 14.436736106872559, 15.472904205322266, 16.509071350097656, 17.545238494873047, 18.581405639648438, 19.617572784423828, 20.65373992919922, 21.68990707397461, 22.72607421875, 23.762243270874023, 24.798410415649414, 25.834577560424805, 26.870744705200195, 27.906911849975586, 28.943078994750977, 29.979248046875, 31.01541519165039, 32.05158233642578, 33.08774948120117, 34.12391662597656]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 5.0, 10.0, 8.0, 10.0, 19.0, 17.0, 27.0, 13.0, 28.0, 31.0, 31.0, 27.0, 31.0, 53.0, 41.0, 43.0, 41.0, 51.0, 47.0, 53.0, 41.0, 29.0, 47.0, 37.0, 44.0, 27.0, 33.0, 23.0, 18.0, 33.0, 14.0, 18.0, 10.0, 10.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.29034423828125, -6.0806884765625, -5.87103271484375, -5.661376953125, -5.45172119140625, -5.2420654296875, -5.03240966796875, -4.82275390625, -4.61309814453125, -4.4034423828125, -4.19378662109375, -3.984130859375, -3.77447509765625, -3.5648193359375, -3.35516357421875, -3.1455078125, -2.93585205078125, -2.7261962890625, -2.51654052734375, -2.306884765625, -2.09722900390625, -1.8875732421875, -1.67791748046875, -1.46826171875, -1.25860595703125, -1.0489501953125, -0.83929443359375, -0.629638671875, -0.41998291015625, -0.2103271484375, -0.00067138671875, 0.208984375, 0.41864013671875, 0.6282958984375, 0.83795166015625, 1.047607421875, 1.25726318359375, 1.4669189453125, 1.67657470703125, 1.88623046875, 2.09588623046875, 2.3055419921875, 2.51519775390625, 2.724853515625, 2.93450927734375, 3.1441650390625, 3.35382080078125, 3.5634765625, 3.77313232421875, 3.9827880859375, 4.19244384765625, 4.402099609375, 4.61175537109375, 4.8214111328125, 5.03106689453125, 5.24072265625, 5.45037841796875, 5.6600341796875, 5.86968994140625, 6.079345703125, 6.28900146484375, 6.4986572265625, 6.70831298828125, 6.91796875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 8.0, 3.0, 12.0, 16.0, 29.0, 33.0, 48.0, 90.0, 120.0, 200.0, 298.0, 437.0, 698.0, 1052.0, 1652.0, 2579.0, 3983.0, 6463.0, 10073.0, 16139.0, 25116.0, 38807.0, 58866.0, 87374.0, 122264.0, 152149.0, 151965.0, 119865.0, 85522.0, 57679.0, 37761.0, 24380.0, 15658.0, 9903.0, 6362.0, 3959.0, 2517.0, 1621.0, 1030.0, 637.0, 402.0, 272.0, 173.0, 113.0, 86.0, 56.0, 30.0, 24.0, 18.0, 10.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.72119140625, -0.6971282958984375, -0.673065185546875, -0.6490020751953125, -0.62493896484375, -0.6008758544921875, -0.576812744140625, -0.5527496337890625, -0.5286865234375, -0.5046234130859375, -0.480560302734375, -0.4564971923828125, -0.43243408203125, -0.4083709716796875, -0.384307861328125, -0.3602447509765625, -0.336181640625, -0.3121185302734375, -0.288055419921875, -0.2639923095703125, -0.23992919921875, -0.2158660888671875, -0.191802978515625, -0.1677398681640625, -0.1436767578125, -0.1196136474609375, -0.095550537109375, -0.0714874267578125, -0.04742431640625, -0.0233612060546875, 0.000701904296875, 0.0247650146484375, 0.048828125, 0.0728912353515625, 0.096954345703125, 0.1210174560546875, 0.14508056640625, 0.1691436767578125, 0.193206787109375, 0.2172698974609375, 0.2413330078125, 0.2653961181640625, 0.289459228515625, 0.3135223388671875, 0.33758544921875, 0.3616485595703125, 0.385711669921875, 0.4097747802734375, 0.433837890625, 0.4579010009765625, 0.481964111328125, 0.5060272216796875, 0.53009033203125, 0.5541534423828125, 0.578216552734375, 0.6022796630859375, 0.6263427734375, 0.6504058837890625, 0.674468994140625, 0.6985321044921875, 0.72259521484375, 0.7466583251953125, 0.770721435546875, 0.7947845458984375, 0.81884765625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 6.0, 6.0, 12.0, 4.0, 13.0, 22.0, 14.0, 16.0, 31.0, 24.0, 29.0, 29.0, 34.0, 36.0, 30.0, 28.0, 32.0, 41.0, 51.0, 1086.0, 48.0, 36.0, 42.0, 29.0, 27.0, 26.0, 32.0, 31.0, 26.0, 20.0, 21.0, 12.0, 22.0, 19.0, 17.0, 10.0, 7.0, 7.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.771484375, -3.650726318359375, -3.52996826171875, -3.409210205078125, -3.2884521484375, -3.167694091796875, -3.04693603515625, -2.926177978515625, -2.805419921875, -2.684661865234375, -2.56390380859375, -2.443145751953125, -2.3223876953125, -2.201629638671875, -2.08087158203125, -1.960113525390625, -1.83935546875, -1.718597412109375, -1.59783935546875, -1.477081298828125, -1.3563232421875, -1.235565185546875, -1.11480712890625, -0.994049072265625, -0.873291015625, -0.752532958984375, -0.63177490234375, -0.511016845703125, -0.3902587890625, -0.269500732421875, -0.14874267578125, -0.027984619140625, 0.0927734375, 0.213531494140625, 0.33428955078125, 0.455047607421875, 0.5758056640625, 0.696563720703125, 0.81732177734375, 0.938079833984375, 1.058837890625, 1.179595947265625, 1.30035400390625, 1.421112060546875, 1.5418701171875, 1.662628173828125, 1.78338623046875, 1.904144287109375, 2.02490234375, 2.145660400390625, 2.26641845703125, 2.387176513671875, 2.5079345703125, 2.628692626953125, 2.74945068359375, 2.870208740234375, 2.990966796875, 3.111724853515625, 3.23248291015625, 3.353240966796875, 3.4739990234375, 3.594757080078125, 3.71551513671875, 3.836273193359375, 3.95703125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 9.0, 17.0, 16.0, 24.0, 39.0, 47.0, 85.0, 141.0, 208.0, 268.0, 430.0, 613.0, 930.0, 1386.0, 2092.0, 3166.0, 4666.0, 7290.0, 10707.0, 15934.0, 23755.0, 35051.0, 51258.0, 73947.0, 100875.0, 129934.0, 1185746.0, 126724.0, 97986.0, 70870.0, 49749.0, 34238.0, 22895.0, 15456.0, 10199.0, 6628.0, 4496.0, 3069.0, 1959.0, 1376.0, 962.0, 626.0, 388.0, 299.0, 182.0, 137.0, 87.0, 69.0, 37.0, 29.0, 22.0, 11.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.427001953125, -0.4138450622558594, -0.40068817138671875, -0.3875312805175781, -0.3743743896484375, -0.3612174987792969, -0.34806060791015625, -0.3349037170410156, -0.321746826171875, -0.3085899353027344, -0.29543304443359375, -0.2822761535644531, -0.2691192626953125, -0.2559623718261719, -0.24280548095703125, -0.22964859008789062, -0.21649169921875, -0.20333480834960938, -0.19017791748046875, -0.17702102661132812, -0.1638641357421875, -0.15070724487304688, -0.13755035400390625, -0.12439346313476562, -0.111236572265625, -0.09807968139648438, -0.08492279052734375, -0.07176589965820312, -0.0586090087890625, -0.045452117919921875, -0.03229522705078125, -0.019138336181640625, -0.0059814453125, 0.007175445556640625, 0.02033233642578125, 0.033489227294921875, 0.0466461181640625, 0.059803009033203125, 0.07295989990234375, 0.08611679077148438, 0.099273681640625, 0.11243057250976562, 0.12558746337890625, 0.13874435424804688, 0.1519012451171875, 0.16505813598632812, 0.17821502685546875, 0.19137191772460938, 0.20452880859375, 0.21768569946289062, 0.23084259033203125, 0.24399948120117188, 0.2571563720703125, 0.2703132629394531, 0.28347015380859375, 0.2966270446777344, 0.309783935546875, 0.3229408264160156, 0.33609771728515625, 0.3492546081542969, 0.3624114990234375, 0.3755683898925781, 0.38872528076171875, 0.4018821716308594, 0.4150390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 8.0, 6.0, 3.0, 4.0, 7.0, 6.0, 6.0, 10.0, 8.0, 12.0, 15.0, 31.0, 43.0, 64.0, 117.0, 186.0, 181.0, 102.0, 40.0, 37.0, 22.0, 14.0, 16.0, 12.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0202789306640625, -0.01969742774963379, -0.019115924835205078, -0.018534421920776367, -0.017952919006347656, -0.017371416091918945, -0.016789913177490234, -0.016208410263061523, -0.015626907348632812, -0.015045404434204102, -0.01446390151977539, -0.01388239860534668, -0.013300895690917969, -0.012719392776489258, -0.012137889862060547, -0.011556386947631836, -0.010974884033203125, -0.010393381118774414, -0.009811878204345703, -0.009230375289916992, -0.008648872375488281, -0.00806736946105957, -0.007485866546630859, -0.0069043636322021484, -0.0063228607177734375, -0.0057413578033447266, -0.005159854888916016, -0.004578351974487305, -0.003996849060058594, -0.003415346145629883, -0.002833843231201172, -0.002252340316772461, -0.00167083740234375, -0.001089334487915039, -0.0005078315734863281, 7.367134094238281e-05, 0.0006551742553710938, 0.0012366771697998047, 0.0018181800842285156, 0.0023996829986572266, 0.0029811859130859375, 0.0035626888275146484, 0.004144191741943359, 0.00472569465637207, 0.005307197570800781, 0.005888700485229492, 0.006470203399658203, 0.007051706314086914, 0.007633209228515625, 0.008214712142944336, 0.008796215057373047, 0.009377717971801758, 0.009959220886230469, 0.01054072380065918, 0.01112222671508789, 0.011703729629516602, 0.012285232543945312, 0.012866735458374023, 0.013448238372802734, 0.014029741287231445, 0.014611244201660156, 0.015192747116088867, 0.015774250030517578, 0.01635575294494629, 0.016937255859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 7.0, 7.0, 10.0, 12.0, 16.0, 15.0, 16.0, 30.0, 30.0, 72.0, 124.0, 200.0, 526.0, 87212.0, 958772.0, 886.0, 249.0, 130.0, 62.0, 42.0, 25.0, 22.0, 16.0, 12.0, 11.0, 11.0, 3.0, 3.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.365234375, -0.3526878356933594, -0.34014129638671875, -0.3275947570800781, -0.3150482177734375, -0.3025016784667969, -0.28995513916015625, -0.2774085998535156, -0.264862060546875, -0.2523155212402344, -0.23976898193359375, -0.22722244262695312, -0.2146759033203125, -0.20212936401367188, -0.18958282470703125, -0.17703628540039062, -0.16448974609375, -0.15194320678710938, -0.13939666748046875, -0.12685012817382812, -0.1143035888671875, -0.10175704956054688, -0.08921051025390625, -0.07666397094726562, -0.064117431640625, -0.051570892333984375, -0.03902435302734375, -0.026477813720703125, -0.0139312744140625, -0.001384735107421875, 0.01116180419921875, 0.023708343505859375, 0.0362548828125, 0.048801422119140625, 0.06134796142578125, 0.07389450073242188, 0.0864410400390625, 0.09898757934570312, 0.11153411865234375, 0.12408065795898438, 0.136627197265625, 0.14917373657226562, 0.16172027587890625, 0.17426681518554688, 0.1868133544921875, 0.19935989379882812, 0.21190643310546875, 0.22445297241210938, 0.23699951171875, 0.24954605102539062, 0.26209259033203125, 0.2746391296386719, 0.2871856689453125, 0.2997322082519531, 0.31227874755859375, 0.3248252868652344, 0.337371826171875, 0.3499183654785156, 0.36246490478515625, 0.3750114440917969, 0.3875579833984375, 0.4001045227050781, 0.41265106201171875, 0.4251976013183594, 0.437744140625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 82.0, 926.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49372944235801697, -0.4852680563926697, -0.4768066704273224, -0.4683452844619751, -0.4598838984966278, -0.4514225125312805, -0.4429611265659332, -0.43449974060058594, -0.42603835463523865, -0.41757696866989136, -0.40911558270454407, -0.4006541967391968, -0.3921928107738495, -0.3837314248085022, -0.3752700388431549, -0.3668086528778076, -0.3583472967147827, -0.3498859107494354, -0.34142452478408813, -0.33296313881874084, -0.32450175285339355, -0.31604036688804626, -0.307578980922699, -0.2991175949573517, -0.2906562089920044, -0.2821948230266571, -0.2737334370613098, -0.2652720510959625, -0.25681066513061523, -0.24834927916526794, -0.23988789319992065, -0.23142650723457336, -0.22296510636806488, -0.2145037204027176, -0.2060423344373703, -0.197580948472023, -0.18911956250667572, -0.18065817654132843, -0.17219680547714233, -0.16373541951179504, -0.15527403354644775, -0.14681264758110046, -0.13835126161575317, -0.12988987565040588, -0.1214284896850586, -0.1129671037197113, -0.10450572520494461, -0.09604433923959732, -0.08758294582366943, -0.07912155985832214, -0.07066017389297485, -0.06219879165291786, -0.05373740568757057, -0.04527601972222328, -0.03681463748216629, -0.028353251516819, -0.01989186555147171, -0.011430480517446995, -0.0029690954834222794, 0.0054922886192798615, 0.013953674584627151, 0.02241506054997444, 0.030876442790031433, 0.03933782875537872, 0.04779921472072601]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 6.0, 4.0, 3.0, 8.0, 8.0, 8.0, 11.0, 20.0, 28.0, 14.0, 37.0, 32.0, 33.0, 28.0, 38.0, 37.0, 55.0, 49.0, 48.0, 39.0, 48.0, 44.0, 35.0, 55.0, 46.0, 39.0, 40.0, 23.0, 26.0, 25.0, 29.0, 24.0, 16.0, 13.0, 5.0, 12.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017159700393676758, -0.01652485877275467, -0.01589001901447773, -0.015255178324878216, -0.014620337635278702, -0.013985496945679188, -0.013350656256079674, -0.01271581556648016, -0.012080974876880646, -0.011446134187281132, -0.010811293497681618, -0.010176452808082104, -0.00954161211848259, -0.008906771428883076, -0.008271930739283562, -0.007637090049684048, -0.007002249360084534, -0.00636740867048502, -0.005732567980885506, -0.005097727291285992, -0.004462886601686478, -0.0038280459120869637, -0.0031932052224874496, -0.0025583645328879356, -0.0019235238432884216, -0.0012886831536889076, -0.0006538424640893936, -1.9001774489879608e-05, 0.0006158389151096344, 0.0012506796047091484, 0.0018855202943086624, 0.0025203609839081764, 0.0031552016735076904, 0.0037900423631072044, 0.0044248830527067184, 0.0050597237423062325, 0.0056945644319057465, 0.0063294051215052605, 0.0069642458111047745, 0.0075990865007042885, 0.008233927190303802, 0.008868767879903316, 0.00950360856950283, 0.010138449259102345, 0.010773289948701859, 0.011408130638301373, 0.012042971327900887, 0.0126778120175004, 0.013312652707099915, 0.013947493396699429, 0.014582334086298943, 0.015217174775898457, 0.01585201546549797, 0.01648685708642006, 0.017121696844697, 0.017756536602973938, 0.018391378223896027, 0.019026219844818115, 0.019661059603095055, 0.020295899361371994, 0.020930740982294083, 0.02156558260321617, 0.02220042236149311, 0.02283526211977005, 0.02347010374069214]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 6.0, 9.0, 8.0, 10.0, 19.0, 17.0, 27.0, 13.0, 28.0, 31.0, 31.0, 27.0, 32.0, 52.0, 41.0, 43.0, 41.0, 51.0, 47.0, 53.0, 41.0, 29.0, 47.0, 37.0, 44.0, 27.0, 33.0, 23.0, 18.0, 33.0, 14.0, 18.0, 10.0, 10.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.29034423828125, -6.0806884765625, -5.87103271484375, -5.661376953125, -5.45172119140625, -5.2420654296875, -5.03240966796875, -4.82275390625, -4.61309814453125, -4.4034423828125, -4.19378662109375, -3.984130859375, -3.77447509765625, -3.5648193359375, -3.35516357421875, -3.1455078125, -2.93585205078125, -2.7261962890625, -2.51654052734375, -2.306884765625, -2.09722900390625, -1.8875732421875, -1.67791748046875, -1.46826171875, -1.25860595703125, -1.0489501953125, -0.83929443359375, -0.629638671875, -0.41998291015625, -0.2103271484375, -0.00067138671875, 0.208984375, 0.41864013671875, 0.6282958984375, 0.83795166015625, 1.047607421875, 1.25726318359375, 1.4669189453125, 1.67657470703125, 1.88623046875, 2.09588623046875, 2.3055419921875, 2.51519775390625, 2.724853515625, 2.93450927734375, 3.1441650390625, 3.35382080078125, 3.5634765625, 3.77313232421875, 3.9827880859375, 4.19244384765625, 4.402099609375, 4.61175537109375, 4.8214111328125, 5.03106689453125, 5.24072265625, 5.45037841796875, 5.6600341796875, 5.86968994140625, 6.079345703125, 6.28900146484375, 6.4986572265625, 6.70831298828125, 6.91796875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 11.0, 6.0, 10.0, 12.0, 10.0, 28.0, 30.0, 44.0, 32.0, 72.0, 94.0, 131.0, 170.0, 316.0, 790.0, 2491.0, 10549.0, 51058.0, 484211.0, 435882.0, 48504.0, 9978.0, 2439.0, 714.0, 322.0, 182.0, 114.0, 91.0, 61.0, 46.0, 47.0, 27.0, 28.0, 14.0, 11.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6171875, -12.2099609375, -11.802734375, -11.3955078125, -10.98828125, -10.5810546875, -10.173828125, -9.7666015625, -9.359375, -8.9521484375, -8.544921875, -8.1376953125, -7.73046875, -7.3232421875, -6.916015625, -6.5087890625, -6.1015625, -5.6943359375, -5.287109375, -4.8798828125, -4.47265625, -4.0654296875, -3.658203125, -3.2509765625, -2.84375, -2.4365234375, -2.029296875, -1.6220703125, -1.21484375, -0.8076171875, -0.400390625, 0.0068359375, 0.4140625, 0.8212890625, 1.228515625, 1.6357421875, 2.04296875, 2.4501953125, 2.857421875, 3.2646484375, 3.671875, 4.0791015625, 4.486328125, 4.8935546875, 5.30078125, 5.7080078125, 6.115234375, 6.5224609375, 6.9296875, 7.3369140625, 7.744140625, 8.1513671875, 8.55859375, 8.9658203125, 9.373046875, 9.7802734375, 10.1875, 10.5947265625, 11.001953125, 11.4091796875, 11.81640625, 12.2236328125, 12.630859375, 13.0380859375, 13.4453125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 7.0, 6.0, 4.0, 12.0, 15.0, 19.0, 16.0, 21.0, 13.0, 29.0, 25.0, 35.0, 32.0, 44.0, 43.0, 72.0, 97.0, 304.0, 1610.0, 152.0, 83.0, 59.0, 55.0, 47.0, 40.0, 29.0, 27.0, 29.0, 21.0, 11.0, 19.0, 15.0, 8.0, 15.0, 6.0, 4.0, 7.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.46875, -22.803466796875, -22.13818359375, -21.472900390625, -20.8076171875, -20.142333984375, -19.47705078125, -18.811767578125, -18.146484375, -17.481201171875, -16.81591796875, -16.150634765625, -15.4853515625, -14.820068359375, -14.15478515625, -13.489501953125, -12.82421875, -12.158935546875, -11.49365234375, -10.828369140625, -10.1630859375, -9.497802734375, -8.83251953125, -8.167236328125, -7.501953125, -6.836669921875, -6.17138671875, -5.506103515625, -4.8408203125, -4.175537109375, -3.51025390625, -2.844970703125, -2.1796875, -1.514404296875, -0.84912109375, -0.183837890625, 0.4814453125, 1.146728515625, 1.81201171875, 2.477294921875, 3.142578125, 3.807861328125, 4.47314453125, 5.138427734375, 5.8037109375, 6.468994140625, 7.13427734375, 7.799560546875, 8.46484375, 9.130126953125, 9.79541015625, 10.460693359375, 11.1259765625, 11.791259765625, 12.45654296875, 13.121826171875, 13.787109375, 14.452392578125, 15.11767578125, 15.782958984375, 16.4482421875, 17.113525390625, 17.77880859375, 18.444091796875, 19.109375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 10.0, 9.0, 9.0, 18.0, 18.0, 10.0, 31.0, 34.0, 49.0, 57.0, 75.0, 131.0, 185.0, 347.0, 813.0, 6751.0, 2692352.0, 439757.0, 3499.0, 667.0, 298.0, 158.0, 92.0, 76.0, 58.0, 35.0, 27.0, 23.0, 28.0, 10.0, 14.0, 15.0, 7.0, 4.0, 10.0, 8.0, 1.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.9375, -39.47021484375, -38.0029296875, -36.53564453125, -35.068359375, -33.60107421875, -32.1337890625, -30.66650390625, -29.19921875, -27.73193359375, -26.2646484375, -24.79736328125, -23.330078125, -21.86279296875, -20.3955078125, -18.92822265625, -17.4609375, -15.99365234375, -14.5263671875, -13.05908203125, -11.591796875, -10.12451171875, -8.6572265625, -7.18994140625, -5.72265625, -4.25537109375, -2.7880859375, -1.32080078125, 0.146484375, 1.61376953125, 3.0810546875, 4.54833984375, 6.015625, 7.48291015625, 8.9501953125, 10.41748046875, 11.884765625, 13.35205078125, 14.8193359375, 16.28662109375, 17.75390625, 19.22119140625, 20.6884765625, 22.15576171875, 23.623046875, 25.09033203125, 26.5576171875, 28.02490234375, 29.4921875, 30.95947265625, 32.4267578125, 33.89404296875, 35.361328125, 36.82861328125, 38.2958984375, 39.76318359375, 41.23046875, 42.69775390625, 44.1650390625, 45.63232421875, 47.099609375, 48.56689453125, 50.0341796875, 51.50146484375, 52.96875]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 57.0, 495.0, 425.0, 35.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.36098098754883, -47.38888168334961, -43.41678237915039, -39.44468307495117, -35.47258377075195, -31.500486373901367, -27.52838706970215, -23.55628776550293, -19.58418846130371, -15.612089157104492, -11.639989852905273, -7.667891502380371, -3.6957921981811523, 0.27630615234375, 4.248405456542969, 8.220504760742188, 12.192604064941406, 16.164703369140625, 20.136802673339844, 24.108901977539062, 28.08100128173828, 32.0531005859375, 36.02519989013672, 39.99729919433594, 43.969398498535156, 47.941497802734375, 51.913597106933594, 55.88569641113281, 59.85779571533203, 63.82989501953125, 67.80199432373047, 71.77409362792969, 75.7461929321289, 79.71829223632812, 83.69039154052734, 87.66249084472656, 91.63459014892578, 95.606689453125, 99.57878875732422, 103.55088806152344, 107.52298736572266, 111.49508666992188, 115.4671859741211, 119.43928527832031, 123.41138458251953, 127.38348388671875, 131.35557556152344, 135.3276824951172, 139.29977416992188, 143.27186584472656, 147.2439727783203, 151.216064453125, 155.18817138671875, 159.16026306152344, 163.1323699951172, 167.10446166992188, 171.07656860351562, 175.0486602783203, 179.02076721191406, 182.99285888671875, 186.9649658203125, 190.9370574951172, 194.90916442871094, 198.88125610351562, 202.85336303710938]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 2.0, 8.0, 6.0, 5.0, 6.0, 12.0, 10.0, 11.0, 11.0, 20.0, 30.0, 20.0, 27.0, 24.0, 32.0, 33.0, 32.0, 42.0, 45.0, 34.0, 50.0, 40.0, 39.0, 35.0, 36.0, 42.0, 37.0, 33.0, 43.0, 24.0, 23.0, 28.0, 24.0, 25.0, 21.0, 13.0, 16.0, 16.0, 15.0, 4.0, 7.0, 4.0, 4.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.683082580566406, -35.27186965942383, -33.86065673828125, -32.449440002441406, -31.038227081298828, -29.62701416015625, -28.215801239013672, -26.804588317871094, -25.393373489379883, -23.982160568237305, -22.570945739746094, -21.159732818603516, -19.748519897460938, -18.337305068969727, -16.92609214782715, -15.514878273010254, -14.10366439819336, -12.692450523376465, -11.28123664855957, -9.870023727416992, -8.458809852600098, -7.047595977783203, -5.636383056640625, -4.2251691818237305, -2.813955307006836, -1.4027416706085205, 0.008471965789794922, 1.4196853637695312, 2.830899238586426, 4.24211311340332, 5.653326034545898, 7.064539909362793, 8.475753784179688, 9.886967658996582, 11.298181533813477, 12.709394454956055, 14.12060832977295, 15.531822204589844, 16.943035125732422, 18.354248046875, 19.76546287536621, 21.17667579650879, 22.587890625, 23.999103546142578, 25.410316467285156, 26.821531295776367, 28.232744216918945, 29.643959045410156, 31.055171966552734, 32.46638488769531, 33.87759780883789, 35.28881072998047, 36.70002746582031, 38.11124038696289, 39.52245330810547, 40.93366622924805, 42.344879150390625, 43.7560920715332, 45.16730499267578, 46.578521728515625, 47.9897346496582, 49.40094757080078, 50.81216049194336, 52.22337341308594, 53.63459014892578]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 14.0, 10.0, 11.0, 5.0, 17.0, 15.0, 23.0, 18.0, 28.0, 26.0, 17.0, 30.0, 31.0, 45.0, 25.0, 32.0, 37.0, 31.0, 43.0, 44.0, 47.0, 32.0, 31.0, 50.0, 40.0, 30.0, 37.0, 28.0, 30.0, 24.0, 19.0, 29.0, 14.0, 15.0, 14.0, 17.0, 6.0, 11.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.38671875, -6.1954345703125, -6.004150390625, -5.8128662109375, -5.62158203125, -5.4302978515625, -5.239013671875, -5.0477294921875, -4.8564453125, -4.6651611328125, -4.473876953125, -4.2825927734375, -4.09130859375, -3.9000244140625, -3.708740234375, -3.5174560546875, -3.326171875, -3.1348876953125, -2.943603515625, -2.7523193359375, -2.56103515625, -2.3697509765625, -2.178466796875, -1.9871826171875, -1.7958984375, -1.6046142578125, -1.413330078125, -1.2220458984375, -1.03076171875, -0.8394775390625, -0.648193359375, -0.4569091796875, -0.265625, -0.0743408203125, 0.116943359375, 0.3082275390625, 0.49951171875, 0.6907958984375, 0.882080078125, 1.0733642578125, 1.2646484375, 1.4559326171875, 1.647216796875, 1.8385009765625, 2.02978515625, 2.2210693359375, 2.412353515625, 2.6036376953125, 2.794921875, 2.9862060546875, 3.177490234375, 3.3687744140625, 3.56005859375, 3.7513427734375, 3.942626953125, 4.1339111328125, 4.3251953125, 4.5164794921875, 4.707763671875, 4.8990478515625, 5.09033203125, 5.2816162109375, 5.472900390625, 5.6641845703125, 5.85546875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 5.0, 11.0, 11.0, 9.0, 12.0, 17.0, 17.0, 28.0, 43.0, 76.0, 104.0, 196.0, 439.0, 1122.0, 3011.0, 9364.0, 35119.0, 209817.0, 1832809.0, 1841241.0, 212487.0, 34391.0, 9024.0, 2876.0, 1056.0, 451.0, 198.0, 94.0, 62.0, 44.0, 28.0, 24.0, 15.0, 13.0, 14.0, 12.0, 13.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.581787109375, -12.14794921875, -11.714111328125, -11.2802734375, -10.846435546875, -10.41259765625, -9.978759765625, -9.544921875, -9.111083984375, -8.67724609375, -8.243408203125, -7.8095703125, -7.375732421875, -6.94189453125, -6.508056640625, -6.07421875, -5.640380859375, -5.20654296875, -4.772705078125, -4.3388671875, -3.905029296875, -3.47119140625, -3.037353515625, -2.603515625, -2.169677734375, -1.73583984375, -1.302001953125, -0.8681640625, -0.434326171875, -0.00048828125, 0.433349609375, 0.8671875, 1.301025390625, 1.73486328125, 2.168701171875, 2.6025390625, 3.036376953125, 3.47021484375, 3.904052734375, 4.337890625, 4.771728515625, 5.20556640625, 5.639404296875, 6.0732421875, 6.507080078125, 6.94091796875, 7.374755859375, 7.80859375, 8.242431640625, 8.67626953125, 9.110107421875, 9.5439453125, 9.977783203125, 10.41162109375, 10.845458984375, 11.279296875, 11.713134765625, 12.14697265625, 12.580810546875, 13.0146484375, 13.448486328125, 13.88232421875, 14.316162109375, 14.75]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 7.0, 16.0, 22.0, 19.0, 27.0, 43.0, 48.0, 46.0, 75.0, 75.0, 108.0, 167.0, 243.0, 339.0, 374.0, 462.0, 424.0, 413.0, 271.0, 239.0, 139.0, 128.0, 92.0, 49.0, 47.0, 39.0, 34.0, 24.0, 14.0, 19.0, 9.0, 12.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.921875, -8.6234130859375, -8.324951171875, -8.0264892578125, -7.72802734375, -7.4295654296875, -7.131103515625, -6.8326416015625, -6.5341796875, -6.2357177734375, -5.937255859375, -5.6387939453125, -5.34033203125, -5.0418701171875, -4.743408203125, -4.4449462890625, -4.146484375, -3.8480224609375, -3.549560546875, -3.2510986328125, -2.95263671875, -2.6541748046875, -2.355712890625, -2.0572509765625, -1.7587890625, -1.4603271484375, -1.161865234375, -0.8634033203125, -0.56494140625, -0.2664794921875, 0.031982421875, 0.3304443359375, 0.62890625, 0.9273681640625, 1.225830078125, 1.5242919921875, 1.82275390625, 2.1212158203125, 2.419677734375, 2.7181396484375, 3.0166015625, 3.3150634765625, 3.613525390625, 3.9119873046875, 4.21044921875, 4.5089111328125, 4.807373046875, 5.1058349609375, 5.404296875, 5.7027587890625, 6.001220703125, 6.2996826171875, 6.59814453125, 6.8966064453125, 7.195068359375, 7.4935302734375, 7.7919921875, 8.0904541015625, 8.388916015625, 8.6873779296875, 8.98583984375, 9.2843017578125, 9.582763671875, 9.8812255859375, 10.1796875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 8.0, 10.0, 8.0, 19.0, 10.0, 35.0, 43.0, 41.0, 67.0, 91.0, 138.0, 211.0, 332.0, 669.0, 2191.0, 12092.0, 138231.0, 3302799.0, 695351.0, 34846.0, 4588.0, 1206.0, 445.0, 245.0, 151.0, 129.0, 91.0, 59.0, 63.0, 30.0, 20.0, 19.0, 9.0, 8.0, 6.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.475341796875, -23.56005859375, -22.644775390625, -21.7294921875, -20.814208984375, -19.89892578125, -18.983642578125, -18.068359375, -17.153076171875, -16.23779296875, -15.322509765625, -14.4072265625, -13.491943359375, -12.57666015625, -11.661376953125, -10.74609375, -9.830810546875, -8.91552734375, -8.000244140625, -7.0849609375, -6.169677734375, -5.25439453125, -4.339111328125, -3.423828125, -2.508544921875, -1.59326171875, -0.677978515625, 0.2373046875, 1.152587890625, 2.06787109375, 2.983154296875, 3.8984375, 4.813720703125, 5.72900390625, 6.644287109375, 7.5595703125, 8.474853515625, 9.39013671875, 10.305419921875, 11.220703125, 12.135986328125, 13.05126953125, 13.966552734375, 14.8818359375, 15.797119140625, 16.71240234375, 17.627685546875, 18.54296875, 19.458251953125, 20.37353515625, 21.288818359375, 22.2041015625, 23.119384765625, 24.03466796875, 24.949951171875, 25.865234375, 26.780517578125, 27.69580078125, 28.611083984375, 29.5263671875, 30.441650390625, 31.35693359375, 32.272216796875, 33.1875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 12.0, 34.0, 96.0, 136.0, 196.0, 202.0, 191.0, 75.0, 40.0, 11.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.16215515136719, -86.55191802978516, -83.94168090820312, -81.3314437866211, -78.72120666503906, -76.11097717285156, -73.50074005126953, -70.8905029296875, -68.28026580810547, -65.67002868652344, -63.059791564941406, -60.44955825805664, -57.83932113647461, -55.22908401489258, -52.61885070800781, -50.00861358642578, -47.39837646484375, -44.78813934326172, -42.17790222167969, -39.56766891479492, -36.95743179321289, -34.34719467163086, -31.73695945739746, -29.126724243164062, -26.51648712158203, -23.90625, -21.2960147857666, -18.685779571533203, -16.075542449951172, -13.465306282043457, -10.855070114135742, -8.244834899902344, -5.634605407714844, -3.024369239807129, -0.41413307189941406, 2.196103096008301, 4.806339263916016, 7.4165754318237305, 10.026811599731445, 12.637046813964844, 15.247283935546875, 17.857521057128906, 20.467756271362305, 23.077991485595703, 25.688228607177734, 28.298465728759766, 30.908700942993164, 33.51893615722656, 36.129173278808594, 38.739410400390625, 41.349647521972656, 43.95988082885742, 46.57011795043945, 49.180355072021484, 51.79058837890625, 54.40082550048828, 57.01106262207031, 59.621299743652344, 62.231536865234375, 64.8417739868164, 67.45201110839844, 70.06224060058594, 72.67247772216797, 75.28271484375, 77.89295196533203]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 6.0, 9.0, 11.0, 2.0, 12.0, 10.0, 13.0, 9.0, 18.0, 20.0, 25.0, 26.0, 29.0, 42.0, 28.0, 48.0, 35.0, 35.0, 41.0, 37.0, 33.0, 42.0, 29.0, 42.0, 39.0, 38.0, 39.0, 39.0, 22.0, 22.0, 35.0, 31.0, 17.0, 22.0, 12.0, 13.0, 14.0, 6.0, 8.0, 8.0, 11.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.678070068359375, -29.61299705505371, -28.547924041748047, -27.48284912109375, -26.417776107788086, -25.352703094482422, -24.287630081176758, -23.222557067871094, -22.157482147216797, -21.092409133911133, -20.02733612060547, -18.962261199951172, -17.897188186645508, -16.832115173339844, -15.76704216003418, -14.701969146728516, -13.636896133422852, -12.571823120117188, -11.506749153137207, -10.441676139831543, -9.376602172851562, -8.311529159545898, -7.246456146240234, -6.181382656097412, -5.11630916595459, -4.051235675811768, -2.9861624240875244, -1.9210891723632812, -0.856015682220459, 0.20905780792236328, 1.2741308212280273, 2.3392043113708496, 3.404277801513672, 4.469351291656494, 5.534424781799316, 6.5994977951049805, 7.664571285247803, 8.729644775390625, 9.794717788696289, 10.859790802001953, 11.924864768981934, 12.989937782287598, 14.055011749267578, 15.120084762573242, 16.185157775878906, 17.250232696533203, 18.315303802490234, 19.38037872314453, 20.445451736450195, 21.51052474975586, 22.575597763061523, 23.640670776367188, 24.705745697021484, 25.77081871032715, 26.835891723632812, 27.900964736938477, 28.96603775024414, 30.031110763549805, 31.09618377685547, 32.161258697509766, 33.2263298034668, 34.291404724121094, 35.356475830078125, 36.42155075073242, 37.48662567138672]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 10.0, 8.0, 10.0, 13.0, 11.0, 18.0, 21.0, 14.0, 27.0, 29.0, 29.0, 33.0, 35.0, 47.0, 40.0, 40.0, 54.0, 45.0, 42.0, 39.0, 41.0, 46.0, 31.0, 35.0, 32.0, 39.0, 31.0, 25.0, 25.0, 20.0, 20.0, 20.0, 11.0, 9.0, 10.0, 7.0, 5.0, 5.0, 10.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.81640625, -7.607177734375, -7.39794921875, -7.188720703125, -6.9794921875, -6.770263671875, -6.56103515625, -6.351806640625, -6.142578125, -5.933349609375, -5.72412109375, -5.514892578125, -5.3056640625, -5.096435546875, -4.88720703125, -4.677978515625, -4.46875, -4.259521484375, -4.05029296875, -3.841064453125, -3.6318359375, -3.422607421875, -3.21337890625, -3.004150390625, -2.794921875, -2.585693359375, -2.37646484375, -2.167236328125, -1.9580078125, -1.748779296875, -1.53955078125, -1.330322265625, -1.12109375, -0.911865234375, -0.70263671875, -0.493408203125, -0.2841796875, -0.074951171875, 0.13427734375, 0.343505859375, 0.552734375, 0.761962890625, 0.97119140625, 1.180419921875, 1.3896484375, 1.598876953125, 1.80810546875, 2.017333984375, 2.2265625, 2.435791015625, 2.64501953125, 2.854248046875, 3.0634765625, 3.272705078125, 3.48193359375, 3.691162109375, 3.900390625, 4.109619140625, 4.31884765625, 4.528076171875, 4.7373046875, 4.946533203125, 5.15576171875, 5.364990234375, 5.57421875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 11.0, 15.0, 36.0, 54.0, 93.0, 162.0, 217.0, 381.0, 573.0, 853.0, 1377.0, 2060.0, 3192.0, 4748.0, 7289.0, 10927.0, 16725.0, 25090.0, 37508.0, 54251.0, 77746.0, 105630.0, 133966.0, 144077.0, 122418.0, 93490.0, 66917.0, 45881.0, 31124.0, 20869.0, 13997.0, 9417.0, 6100.0, 4070.0, 2589.0, 1639.0, 1037.0, 732.0, 492.0, 292.0, 202.0, 112.0, 83.0, 52.0, 28.0, 13.0, 15.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.763671875, -0.74139404296875, -0.7191162109375, -0.69683837890625, -0.674560546875, -0.65228271484375, -0.6300048828125, -0.60772705078125, -0.58544921875, -0.56317138671875, -0.5408935546875, -0.51861572265625, -0.496337890625, -0.47406005859375, -0.4517822265625, -0.42950439453125, -0.4072265625, -0.38494873046875, -0.3626708984375, -0.34039306640625, -0.318115234375, -0.29583740234375, -0.2735595703125, -0.25128173828125, -0.22900390625, -0.20672607421875, -0.1844482421875, -0.16217041015625, -0.139892578125, -0.11761474609375, -0.0953369140625, -0.07305908203125, -0.05078125, -0.02850341796875, -0.0062255859375, 0.01605224609375, 0.038330078125, 0.06060791015625, 0.0828857421875, 0.10516357421875, 0.12744140625, 0.14971923828125, 0.1719970703125, 0.19427490234375, 0.216552734375, 0.23883056640625, 0.2611083984375, 0.28338623046875, 0.3056640625, 0.32794189453125, 0.3502197265625, 0.37249755859375, 0.394775390625, 0.41705322265625, 0.4393310546875, 0.46160888671875, 0.48388671875, 0.50616455078125, 0.5284423828125, 0.55072021484375, 0.572998046875, 0.59527587890625, 0.6175537109375, 0.63983154296875, 0.662109375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 5.0, 2.0, 4.0, 7.0, 12.0, 9.0, 7.0, 14.0, 15.0, 16.0, 15.0, 17.0, 19.0, 28.0, 24.0, 25.0, 28.0, 26.0, 33.0, 26.0, 44.0, 32.0, 37.0, 50.0, 1065.0, 33.0, 33.0, 38.0, 32.0, 41.0, 33.0, 25.0, 28.0, 23.0, 30.0, 25.0, 15.0, 27.0, 13.0, 10.0, 16.0, 12.0, 3.0, 5.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-4.4921875, -4.361572265625, -4.23095703125, -4.100341796875, -3.9697265625, -3.839111328125, -3.70849609375, -3.577880859375, -3.447265625, -3.316650390625, -3.18603515625, -3.055419921875, -2.9248046875, -2.794189453125, -2.66357421875, -2.532958984375, -2.40234375, -2.271728515625, -2.14111328125, -2.010498046875, -1.8798828125, -1.749267578125, -1.61865234375, -1.488037109375, -1.357421875, -1.226806640625, -1.09619140625, -0.965576171875, -0.8349609375, -0.704345703125, -0.57373046875, -0.443115234375, -0.3125, -0.181884765625, -0.05126953125, 0.079345703125, 0.2099609375, 0.340576171875, 0.47119140625, 0.601806640625, 0.732421875, 0.863037109375, 0.99365234375, 1.124267578125, 1.2548828125, 1.385498046875, 1.51611328125, 1.646728515625, 1.77734375, 1.907958984375, 2.03857421875, 2.169189453125, 2.2998046875, 2.430419921875, 2.56103515625, 2.691650390625, 2.822265625, 2.952880859375, 3.08349609375, 3.214111328125, 3.3447265625, 3.475341796875, 3.60595703125, 3.736572265625, 3.8671875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 18.0, 12.0, 24.0, 41.0, 68.0, 109.0, 143.0, 261.0, 386.0, 577.0, 911.0, 1461.0, 2237.0, 3661.0, 5850.0, 9584.0, 15647.0, 25150.0, 41276.0, 64356.0, 98196.0, 141138.0, 1220245.0, 154649.0, 111542.0, 74453.0, 47359.0, 29400.0, 18554.0, 11292.0, 7006.0, 4257.0, 2746.0, 1648.0, 1049.0, 616.0, 430.0, 253.0, 194.0, 119.0, 72.0, 54.0, 34.0, 21.0, 12.0, 8.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5791015625, -0.561370849609375, -0.54364013671875, -0.525909423828125, -0.5081787109375, -0.490447998046875, -0.47271728515625, -0.454986572265625, -0.437255859375, -0.419525146484375, -0.40179443359375, -0.384063720703125, -0.3663330078125, -0.348602294921875, -0.33087158203125, -0.313140869140625, -0.29541015625, -0.277679443359375, -0.25994873046875, -0.242218017578125, -0.2244873046875, -0.206756591796875, -0.18902587890625, -0.171295166015625, -0.153564453125, -0.135833740234375, -0.11810302734375, -0.100372314453125, -0.0826416015625, -0.064910888671875, -0.04718017578125, -0.029449462890625, -0.01171875, 0.006011962890625, 0.02374267578125, 0.041473388671875, 0.0592041015625, 0.076934814453125, 0.09466552734375, 0.112396240234375, 0.130126953125, 0.147857666015625, 0.16558837890625, 0.183319091796875, 0.2010498046875, 0.218780517578125, 0.23651123046875, 0.254241943359375, 0.27197265625, 0.289703369140625, 0.30743408203125, 0.325164794921875, 0.3428955078125, 0.360626220703125, 0.37835693359375, 0.396087646484375, 0.413818359375, 0.431549072265625, 0.44927978515625, 0.467010498046875, 0.4847412109375, 0.502471923828125, 0.52020263671875, 0.537933349609375, 0.5556640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 9.0, 3.0, 9.0, 10.0, 16.0, 17.0, 18.0, 25.0, 24.0, 37.0, 36.0, 70.0, 76.0, 95.0, 85.0, 103.0, 69.0, 56.0, 47.0, 55.0, 25.0, 27.0, 16.0, 9.0, 14.0, 7.0, 6.0, 15.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01422882080078125, -0.01381528377532959, -0.01340174674987793, -0.01298820972442627, -0.01257467269897461, -0.01216113567352295, -0.011747598648071289, -0.011334061622619629, -0.010920524597167969, -0.010506987571716309, -0.010093450546264648, -0.009679913520812988, -0.009266376495361328, -0.008852839469909668, -0.008439302444458008, -0.008025765419006348, -0.0076122283935546875, -0.007198691368103027, -0.006785154342651367, -0.006371617317199707, -0.005958080291748047, -0.005544543266296387, -0.0051310062408447266, -0.004717469215393066, -0.004303932189941406, -0.003890395164489746, -0.003476858139038086, -0.0030633211135864258, -0.0026497840881347656, -0.0022362470626831055, -0.0018227100372314453, -0.0014091730117797852, -0.000995635986328125, -0.0005820989608764648, -0.0001685619354248047, 0.00024497509002685547, 0.0006585121154785156, 0.0010720491409301758, 0.001485586166381836, 0.001899123191833496, 0.0023126602172851562, 0.0027261972427368164, 0.0031397342681884766, 0.0035532712936401367, 0.003966808319091797, 0.004380345344543457, 0.004793882369995117, 0.005207419395446777, 0.0056209564208984375, 0.006034493446350098, 0.006448030471801758, 0.006861567497253418, 0.007275104522705078, 0.007688641548156738, 0.008102178573608398, 0.008515715599060059, 0.008929252624511719, 0.009342789649963379, 0.009756326675415039, 0.0101698637008667, 0.01058340072631836, 0.01099693775177002, 0.01141047477722168, 0.01182401180267334, 0.012237548828125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 9.0, 10.0, 12.0, 7.0, 14.0, 28.0, 20.0, 40.0, 43.0, 72.0, 84.0, 133.0, 242.0, 477.0, 2925.0, 1033562.0, 9537.0, 603.0, 255.0, 142.0, 71.0, 53.0, 48.0, 39.0, 23.0, 29.0, 19.0, 15.0, 6.0, 7.0, 10.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.249420166015625, -0.24127197265625, -0.233123779296875, -0.2249755859375, -0.216827392578125, -0.20867919921875, -0.200531005859375, -0.1923828125, -0.184234619140625, -0.17608642578125, -0.167938232421875, -0.1597900390625, -0.151641845703125, -0.14349365234375, -0.135345458984375, -0.127197265625, -0.119049072265625, -0.11090087890625, -0.102752685546875, -0.0946044921875, -0.086456298828125, -0.07830810546875, -0.070159912109375, -0.06201171875, -0.053863525390625, -0.04571533203125, -0.037567138671875, -0.0294189453125, -0.021270751953125, -0.01312255859375, -0.004974365234375, 0.003173828125, 0.011322021484375, 0.01947021484375, 0.027618408203125, 0.0357666015625, 0.043914794921875, 0.05206298828125, 0.060211181640625, 0.068359375, 0.076507568359375, 0.08465576171875, 0.092803955078125, 0.1009521484375, 0.109100341796875, 0.11724853515625, 0.125396728515625, 0.133544921875, 0.141693115234375, 0.14984130859375, 0.157989501953125, 0.1661376953125, 0.174285888671875, 0.18243408203125, 0.190582275390625, 0.19873046875, 0.206878662109375, 0.21502685546875, 0.223175048828125, 0.2313232421875, 0.239471435546875, 0.24761962890625, 0.255767822265625, 0.263916015625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1000.0, 16.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39930278062820435, -0.3915659189224243, -0.3838290274143219, -0.37609216570854187, -0.36835530400276184, -0.3606184422969818, -0.3528815507888794, -0.34514468908309937, -0.33740782737731934, -0.3296709656715393, -0.3219340741634369, -0.31419721245765686, -0.30646035075187683, -0.2987234890460968, -0.2909865975379944, -0.28324973583221436, -0.2755128741264343, -0.2677760124206543, -0.2600391209125519, -0.25230225920677185, -0.24456539750099182, -0.2368285208940506, -0.22909165918827057, -0.22135478258132935, -0.21361790597438812, -0.2058810293674469, -0.19814416766166687, -0.19040729105472565, -0.18267042934894562, -0.1749335527420044, -0.16719669103622437, -0.15945981442928314, -0.1517229676246643, -0.14398609101772308, -0.13624922931194305, -0.12851235270500183, -0.1207754909992218, -0.11303861439228058, -0.10530175268650055, -0.09756487607955933, -0.0898279994726181, -0.08209113031625748, -0.07435426115989685, -0.06661739200353622, -0.0588805228471756, -0.05114364996552467, -0.04340678080916405, -0.03566991165280342, -0.027933046221733093, -0.020196177065372467, -0.012459306977689266, -0.004722436890006065, 0.003014432266354561, 0.010751303285360336, 0.018488172441720963, 0.02622504159808159, 0.033961910754442215, 0.04169877991080284, 0.04943564906716347, 0.05717252194881439, 0.06490939110517502, 0.07264626026153564, 0.08038312941789627, 0.0881199985742569, 0.09585686773061752]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 14.0, 10.0, 11.0, 17.0, 21.0, 27.0, 29.0, 36.0, 43.0, 45.0, 50.0, 35.0, 47.0, 52.0, 65.0, 51.0, 49.0, 54.0, 56.0, 50.0, 42.0, 40.0, 28.0, 24.0, 18.0, 23.0, 16.0, 12.0, 8.0, 12.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012001514434814453, -0.011492517776787281, -0.010983521118760109, -0.010474524460732937, -0.009965527802705765, -0.009456531144678593, -0.00894753448665142, -0.008438537828624249, -0.007929541170597076, -0.007420544512569904, -0.006911547854542732, -0.00640255119651556, -0.005893554538488388, -0.005384557880461216, -0.004875561222434044, -0.004366564564406872, -0.0038575679063796997, -0.0033485712483525276, -0.0028395745903253555, -0.0023305779322981834, -0.0018215812742710114, -0.0013125846162438393, -0.0008035879582166672, -0.0002945913001894951, 0.000214405357837677, 0.0007234020158648491, 0.0012323986738920212, 0.0017413953319191933, 0.0022503919899463654, 0.0027593886479735374, 0.0032683853060007095, 0.0037773819640278816, 0.004286378622055054, 0.004795375280082226, 0.005304371938109398, 0.00581336859613657, 0.006322365254163742, 0.006831361912190914, 0.007340358570218086, 0.007849355228245258, 0.00835835188627243, 0.008867348544299603, 0.009376345202326775, 0.009885341860353947, 0.010394338518381119, 0.01090333517640829, 0.011412331834435463, 0.011921328492462635, 0.012430325150489807, 0.01293932180851698, 0.013448318466544151, 0.013957315124571323, 0.014466311782598495, 0.014975308440625668, 0.01548430509865284, 0.015993300825357437, 0.016502298414707184, 0.01701129600405693, 0.017520291730761528, 0.018029287457466125, 0.018538285046815872, 0.01904728263616562, 0.019556278362870216, 0.020065274089574814, 0.02057427167892456]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 10.0, 8.0, 10.0, 13.0, 11.0, 18.0, 21.0, 14.0, 27.0, 29.0, 29.0, 33.0, 34.0, 48.0, 40.0, 40.0, 54.0, 45.0, 42.0, 39.0, 41.0, 45.0, 32.0, 35.0, 32.0, 39.0, 31.0, 25.0, 25.0, 20.0, 20.0, 20.0, 11.0, 9.0, 10.0, 7.0, 5.0, 5.0, 10.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0], "bins": [-7.81640625, -7.607177734375, -7.39794921875, -7.188720703125, -6.9794921875, -6.770263671875, -6.56103515625, -6.351806640625, -6.142578125, -5.933349609375, -5.72412109375, -5.514892578125, -5.3056640625, -5.096435546875, -4.88720703125, -4.677978515625, -4.46875, -4.259521484375, -4.05029296875, -3.841064453125, -3.6318359375, -3.422607421875, -3.21337890625, -3.004150390625, -2.794921875, -2.585693359375, -2.37646484375, -2.167236328125, -1.9580078125, -1.748779296875, -1.53955078125, -1.330322265625, -1.12109375, -0.911865234375, -0.70263671875, -0.493408203125, -0.2841796875, -0.074951171875, 0.13427734375, 0.343505859375, 0.552734375, 0.761962890625, 0.97119140625, 1.180419921875, 1.3896484375, 1.598876953125, 1.80810546875, 2.017333984375, 2.2265625, 2.435791015625, 2.64501953125, 2.854248046875, 3.0634765625, 3.272705078125, 3.48193359375, 3.691162109375, 3.900390625, 4.109619140625, 4.31884765625, 4.528076171875, 4.7373046875, 4.946533203125, 5.15576171875, 5.364990234375, 5.57421875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 11.0, 8.0, 22.0, 22.0, 27.0, 28.0, 39.0, 50.0, 91.0, 95.0, 130.0, 183.0, 246.0, 378.0, 577.0, 1180.0, 2598.0, 7476.0, 24430.0, 134084.0, 777829.0, 72142.0, 16696.0, 5514.0, 2045.0, 919.0, 470.0, 334.0, 234.0, 179.0, 124.0, 87.0, 69.0, 69.0, 41.0, 22.0, 25.0, 15.0, 20.0, 10.0, 15.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0], "bins": [-18.203125, -17.7158203125, -17.228515625, -16.7412109375, -16.25390625, -15.7666015625, -15.279296875, -14.7919921875, -14.3046875, -13.8173828125, -13.330078125, -12.8427734375, -12.35546875, -11.8681640625, -11.380859375, -10.8935546875, -10.40625, -9.9189453125, -9.431640625, -8.9443359375, -8.45703125, -7.9697265625, -7.482421875, -6.9951171875, -6.5078125, -6.0205078125, -5.533203125, -5.0458984375, -4.55859375, -4.0712890625, -3.583984375, -3.0966796875, -2.609375, -2.1220703125, -1.634765625, -1.1474609375, -0.66015625, -0.1728515625, 0.314453125, 0.8017578125, 1.2890625, 1.7763671875, 2.263671875, 2.7509765625, 3.23828125, 3.7255859375, 4.212890625, 4.7001953125, 5.1875, 5.6748046875, 6.162109375, 6.6494140625, 7.13671875, 7.6240234375, 8.111328125, 8.5986328125, 9.0859375, 9.5732421875, 10.060546875, 10.5478515625, 11.03515625, 11.5224609375, 12.009765625, 12.4970703125, 12.984375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 2.0, 11.0, 6.0, 9.0, 7.0, 10.0, 14.0, 11.0, 16.0, 8.0, 14.0, 24.0, 25.0, 28.0, 32.0, 41.0, 44.0, 39.0, 45.0, 68.0, 117.0, 322.0, 1534.0, 135.0, 63.0, 47.0, 51.0, 36.0, 42.0, 38.0, 30.0, 23.0, 29.0, 27.0, 21.0, 14.0, 10.0, 8.0, 11.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.482666015625, -16.90283203125, -16.322998046875, -15.7431640625, -15.163330078125, -14.58349609375, -14.003662109375, -13.423828125, -12.843994140625, -12.26416015625, -11.684326171875, -11.1044921875, -10.524658203125, -9.94482421875, -9.364990234375, -8.78515625, -8.205322265625, -7.62548828125, -7.045654296875, -6.4658203125, -5.885986328125, -5.30615234375, -4.726318359375, -4.146484375, -3.566650390625, -2.98681640625, -2.406982421875, -1.8271484375, -1.247314453125, -0.66748046875, -0.087646484375, 0.4921875, 1.072021484375, 1.65185546875, 2.231689453125, 2.8115234375, 3.391357421875, 3.97119140625, 4.551025390625, 5.130859375, 5.710693359375, 6.29052734375, 6.870361328125, 7.4501953125, 8.030029296875, 8.60986328125, 9.189697265625, 9.76953125, 10.349365234375, 10.92919921875, 11.509033203125, 12.0888671875, 12.668701171875, 13.24853515625, 13.828369140625, 14.408203125, 14.988037109375, 15.56787109375, 16.147705078125, 16.7275390625, 17.307373046875, 17.88720703125, 18.467041015625, 19.046875]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 3.0, 2.0, 6.0, 9.0, 6.0, 11.0, 10.0, 13.0, 7.0, 22.0, 20.0, 26.0, 40.0, 34.0, 44.0, 62.0, 82.0, 111.0, 178.0, 333.0, 870.0, 5535.0, 312157.0, 2812079.0, 11675.0, 1224.0, 399.0, 208.0, 119.0, 86.0, 60.0, 45.0, 42.0, 31.0, 23.0, 18.0, 13.0, 21.0, 9.0, 14.0, 11.0, 12.0, 6.0, 5.0, 11.0, 4.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-46.375, -44.931640625, -43.48828125, -42.044921875, -40.6015625, -39.158203125, -37.71484375, -36.271484375, -34.828125, -33.384765625, -31.94140625, -30.498046875, -29.0546875, -27.611328125, -26.16796875, -24.724609375, -23.28125, -21.837890625, -20.39453125, -18.951171875, -17.5078125, -16.064453125, -14.62109375, -13.177734375, -11.734375, -10.291015625, -8.84765625, -7.404296875, -5.9609375, -4.517578125, -3.07421875, -1.630859375, -0.1875, 1.255859375, 2.69921875, 4.142578125, 5.5859375, 7.029296875, 8.47265625, 9.916015625, 11.359375, 12.802734375, 14.24609375, 15.689453125, 17.1328125, 18.576171875, 20.01953125, 21.462890625, 22.90625, 24.349609375, 25.79296875, 27.236328125, 28.6796875, 30.123046875, 31.56640625, 33.009765625, 34.453125, 35.896484375, 37.33984375, 38.783203125, 40.2265625, 41.669921875, 43.11328125, 44.556640625, 46.0]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 287.0, 720.0, 11.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.47290802001953, -92.93209838867188, -86.39128875732422, -79.85047912597656, -73.30967712402344, -66.76885986328125, -60.228057861328125, -53.68724822998047, -47.14643859863281, -40.605628967285156, -34.0648193359375, -27.52401351928711, -20.983203887939453, -14.442394256591797, -7.901588439941406, -1.36077880859375, 5.180030822753906, 11.720839500427246, 18.261648178100586, 24.80245590209961, 31.343265533447266, 37.88407516479492, 44.42488098144531, 50.96569061279297, 57.506500244140625, 64.04730987548828, 70.58811950683594, 77.12892150878906, 83.66973876953125, 90.21054077148438, 96.75135040283203, 103.29216003417969, 109.83297729492188, 116.37378692626953, 122.91459655761719, 129.4553985595703, 135.9962158203125, 142.53701782226562, 149.07781982421875, 155.61863708496094, 162.15945434570312, 168.70025634765625, 175.24107360839844, 181.78187561035156, 188.32269287109375, 194.86349487304688, 201.404296875, 207.9451141357422, 214.4859161376953, 221.02671813964844, 227.56753540039062, 234.10833740234375, 240.64915466308594, 247.18995666503906, 253.73077392578125, 260.2715759277344, 266.8123779296875, 273.3531799316406, 279.89398193359375, 286.434814453125, 292.9756164550781, 299.51641845703125, 306.0572204589844, 312.5980224609375, 319.13885498046875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 4.0, 5.0, 7.0, 10.0, 12.0, 16.0, 8.0, 16.0, 20.0, 35.0, 20.0, 26.0, 29.0, 24.0, 35.0, 36.0, 34.0, 44.0, 51.0, 44.0, 41.0, 46.0, 43.0, 45.0, 35.0, 47.0, 41.0, 39.0, 21.0, 19.0, 19.0, 22.0, 14.0, 17.0, 14.0, 11.0, 7.0, 10.0, 8.0, 2.0, 6.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.92170333862305, -50.31410217285156, -48.70650100708008, -47.098899841308594, -45.49129867553711, -43.883697509765625, -42.27609634399414, -40.668495178222656, -39.06089401245117, -37.45329284667969, -35.8456916809082, -34.23809051513672, -32.630489349365234, -31.02288818359375, -29.415287017822266, -27.80768585205078, -26.20008659362793, -24.592485427856445, -22.98488426208496, -21.377283096313477, -19.769681930541992, -18.16208267211914, -16.554481506347656, -14.946879386901855, -13.339278221130371, -11.731677055358887, -10.124075889587402, -8.516475677490234, -6.908874034881592, -5.301273345947266, -3.6936721801757812, -2.086071014404297, -0.4784698486328125, 1.1291311979293823, 2.736732244491577, 4.344333171844482, 5.951934337615967, 7.559535026550293, 9.167136192321777, 10.774737358093262, 12.382338523864746, 13.98993968963623, 15.597540855407715, 17.205141067504883, 18.812742233276367, 20.42034339904785, 22.027944564819336, 23.63554573059082, 25.243146896362305, 26.85074806213379, 28.458349227905273, 30.065950393676758, 31.673551559448242, 33.281150817871094, 34.88875198364258, 36.49635314941406, 38.10395431518555, 39.71155548095703, 41.319156646728516, 42.9267578125, 44.534358978271484, 46.14196014404297, 47.74956130981445, 49.35716247558594, 50.96476364135742]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 10.0, 13.0, 16.0, 8.0, 16.0, 17.0, 22.0, 28.0, 31.0, 48.0, 22.0, 43.0, 30.0, 47.0, 55.0, 57.0, 42.0, 52.0, 45.0, 39.0, 37.0, 42.0, 32.0, 39.0, 30.0, 25.0, 24.0, 27.0, 15.0, 17.0, 13.0, 13.0, 9.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 3.0], "bins": [-8.796875, -8.569580078125, -8.34228515625, -8.114990234375, -7.8876953125, -7.660400390625, -7.43310546875, -7.205810546875, -6.978515625, -6.751220703125, -6.52392578125, -6.296630859375, -6.0693359375, -5.842041015625, -5.61474609375, -5.387451171875, -5.16015625, -4.932861328125, -4.70556640625, -4.478271484375, -4.2509765625, -4.023681640625, -3.79638671875, -3.569091796875, -3.341796875, -3.114501953125, -2.88720703125, -2.659912109375, -2.4326171875, -2.205322265625, -1.97802734375, -1.750732421875, -1.5234375, -1.296142578125, -1.06884765625, -0.841552734375, -0.6142578125, -0.386962890625, -0.15966796875, 0.067626953125, 0.294921875, 0.522216796875, 0.74951171875, 0.976806640625, 1.2041015625, 1.431396484375, 1.65869140625, 1.885986328125, 2.11328125, 2.340576171875, 2.56787109375, 2.795166015625, 3.0224609375, 3.249755859375, 3.47705078125, 3.704345703125, 3.931640625, 4.158935546875, 4.38623046875, 4.613525390625, 4.8408203125, 5.068115234375, 5.29541015625, 5.522705078125, 5.75]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 4.0, 8.0, 6.0, 15.0, 25.0, 41.0, 42.0, 61.0, 86.0, 159.0, 225.0, 370.0, 632.0, 1093.0, 2191.0, 4789.0, 12589.0, 37698.0, 161111.0, 950943.0, 2214042.0, 647452.0, 112278.0, 29304.0, 10205.0, 4351.0, 1971.0, 1020.0, 564.0, 340.0, 206.0, 136.0, 95.0, 65.0, 46.0, 33.0, 19.0, 25.0, 8.0, 8.0, 9.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-12.625, -12.278076171875, -11.93115234375, -11.584228515625, -11.2373046875, -10.890380859375, -10.54345703125, -10.196533203125, -9.849609375, -9.502685546875, -9.15576171875, -8.808837890625, -8.4619140625, -8.114990234375, -7.76806640625, -7.421142578125, -7.07421875, -6.727294921875, -6.38037109375, -6.033447265625, -5.6865234375, -5.339599609375, -4.99267578125, -4.645751953125, -4.298828125, -3.951904296875, -3.60498046875, -3.258056640625, -2.9111328125, -2.564208984375, -2.21728515625, -1.870361328125, -1.5234375, -1.176513671875, -0.82958984375, -0.482666015625, -0.1357421875, 0.211181640625, 0.55810546875, 0.905029296875, 1.251953125, 1.598876953125, 1.94580078125, 2.292724609375, 2.6396484375, 2.986572265625, 3.33349609375, 3.680419921875, 4.02734375, 4.374267578125, 4.72119140625, 5.068115234375, 5.4150390625, 5.761962890625, 6.10888671875, 6.455810546875, 6.802734375, 7.149658203125, 7.49658203125, 7.843505859375, 8.1904296875, 8.537353515625, 8.88427734375, 9.231201171875, 9.578125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 11.0, 14.0, 8.0, 18.0, 30.0, 33.0, 49.0, 65.0, 94.0, 118.0, 156.0, 230.0, 319.0, 425.0, 487.0, 470.0, 376.0, 268.0, 185.0, 171.0, 141.0, 95.0, 67.0, 47.0, 44.0, 31.0, 26.0, 15.0, 15.0, 19.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4288330078125, -8.115478515625, -7.8021240234375, -7.48876953125, -7.1754150390625, -6.862060546875, -6.5487060546875, -6.2353515625, -5.9219970703125, -5.608642578125, -5.2952880859375, -4.98193359375, -4.6685791015625, -4.355224609375, -4.0418701171875, -3.728515625, -3.4151611328125, -3.101806640625, -2.7884521484375, -2.47509765625, -2.1617431640625, -1.848388671875, -1.5350341796875, -1.2216796875, -0.9083251953125, -0.594970703125, -0.2816162109375, 0.03173828125, 0.3450927734375, 0.658447265625, 0.9718017578125, 1.28515625, 1.5985107421875, 1.911865234375, 2.2252197265625, 2.53857421875, 2.8519287109375, 3.165283203125, 3.4786376953125, 3.7919921875, 4.1053466796875, 4.418701171875, 4.7320556640625, 5.04541015625, 5.3587646484375, 5.672119140625, 5.9854736328125, 6.298828125, 6.6121826171875, 6.925537109375, 7.2388916015625, 7.55224609375, 7.8656005859375, 8.178955078125, 8.4923095703125, 8.8056640625, 9.1190185546875, 9.432373046875, 9.7457275390625, 10.05908203125, 10.3724365234375, 10.685791015625, 10.9991455078125, 11.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 8.0, 10.0, 8.0, 24.0, 27.0, 29.0, 40.0, 54.0, 75.0, 116.0, 177.0, 277.0, 472.0, 1148.0, 5514.0, 48905.0, 1282601.0, 2754530.0, 88908.0, 8337.0, 1587.0, 574.0, 282.0, 195.0, 125.0, 75.0, 61.0, 37.0, 14.0, 15.0, 18.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.53125, -34.598876953125, -33.66650390625, -32.734130859375, -31.8017578125, -30.869384765625, -29.93701171875, -29.004638671875, -28.072265625, -27.139892578125, -26.20751953125, -25.275146484375, -24.3427734375, -23.410400390625, -22.47802734375, -21.545654296875, -20.61328125, -19.680908203125, -18.74853515625, -17.816162109375, -16.8837890625, -15.951416015625, -15.01904296875, -14.086669921875, -13.154296875, -12.221923828125, -11.28955078125, -10.357177734375, -9.4248046875, -8.492431640625, -7.56005859375, -6.627685546875, -5.6953125, -4.762939453125, -3.83056640625, -2.898193359375, -1.9658203125, -1.033447265625, -0.10107421875, 0.831298828125, 1.763671875, 2.696044921875, 3.62841796875, 4.560791015625, 5.4931640625, 6.425537109375, 7.35791015625, 8.290283203125, 9.22265625, 10.155029296875, 11.08740234375, 12.019775390625, 12.9521484375, 13.884521484375, 14.81689453125, 15.749267578125, 16.681640625, 17.614013671875, 18.54638671875, 19.478759765625, 20.4111328125, 21.343505859375, 22.27587890625, 23.208251953125, 24.140625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 61.0, 488.0, 420.0, 41.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.49292755126953, -118.51420593261719, -110.53548431396484, -102.5567626953125, -94.57804107666016, -86.59931945800781, -78.62059020996094, -70.64187622070312, -62.663150787353516, -54.68442916870117, -46.70570755004883, -38.72698211669922, -30.748262405395508, -22.76953887939453, -14.790817260742188, -6.812095642089844, 1.1666259765625, 9.145347595214844, 17.124069213867188, 25.102792739868164, 33.081512451171875, 41.060237884521484, 49.03895950317383, 57.01768112182617, 64.99639892578125, 72.9751205444336, 80.95384216308594, 88.93256378173828, 96.91128540039062, 104.8900146484375, 112.86872863769531, 120.84745788574219, 128.82618713378906, 136.80491638183594, 144.78363037109375, 152.76235961914062, 160.74107360839844, 168.7198028564453, 176.69851684570312, 184.67724609375, 192.6559600830078, 200.6346893310547, 208.6134033203125, 216.59213256835938, 224.5708465576172, 232.54957580566406, 240.52828979492188, 248.50701904296875, 256.4857482910156, 264.4644775390625, 272.4432067871094, 280.4219055175781, 288.400634765625, 296.3793640136719, 304.35809326171875, 312.3367919921875, 320.3155212402344, 328.29425048828125, 336.2729797363281, 344.2516784667969, 352.23040771484375, 360.2091369628906, 368.1878662109375, 376.16656494140625, 384.1452941894531]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 6.0, 12.0, 11.0, 17.0, 8.0, 9.0, 16.0, 21.0, 21.0, 22.0, 29.0, 26.0, 24.0, 42.0, 34.0, 39.0, 30.0, 45.0, 54.0, 35.0, 36.0, 42.0, 45.0, 29.0, 21.0, 39.0, 41.0, 31.0, 28.0, 30.0, 20.0, 19.0, 16.0, 17.0, 17.0, 11.0, 9.0, 6.0, 8.0, 8.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-36.29107666015625, -35.27434158325195, -34.25760269165039, -33.240867614746094, -32.22412872314453, -31.207393646240234, -30.190656661987305, -29.173919677734375, -28.157184600830078, -27.14044761657715, -26.12371063232422, -25.106975555419922, -24.090238571166992, -23.073501586914062, -22.056764602661133, -21.040027618408203, -20.023290634155273, -19.006553649902344, -17.989816665649414, -16.973079681396484, -15.956344604492188, -14.939607620239258, -13.922870635986328, -12.906133651733398, -11.889397621154785, -10.872660636901855, -9.855924606323242, -8.839187622070312, -7.822451114654541, -6.8057146072387695, -5.78897762298584, -4.772241115570068, -3.755504608154297, -2.7387681007385254, -1.7220313549041748, -0.7052946090698242, 0.31144189834594727, 1.3281784057617188, 2.3449153900146484, 3.36165189743042, 4.378388404846191, 5.395124912261963, 6.411861419677734, 7.428598403930664, 8.445335388183594, 9.462071418762207, 10.478808403015137, 11.49554443359375, 12.51228141784668, 13.52901840209961, 14.545754432678223, 15.562491416931152, 16.579227447509766, 17.595964431762695, 18.612701416015625, 19.629438400268555, 20.646175384521484, 21.662912368774414, 22.679649353027344, 23.69638442993164, 24.71312141418457, 25.7298583984375, 26.74659538269043, 27.76333236694336, 28.780067443847656]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 2.0, 5.0, 11.0, 5.0, 11.0, 12.0, 16.0, 16.0, 20.0, 20.0, 26.0, 28.0, 26.0, 18.0, 36.0, 35.0, 39.0, 30.0, 35.0, 39.0, 38.0, 39.0, 37.0, 53.0, 38.0, 37.0, 36.0, 28.0, 30.0, 24.0, 29.0, 26.0, 27.0, 20.0, 15.0, 11.0, 16.0, 14.0, 15.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.7890625, -6.5859375, -6.3828125, -6.1796875, -5.9765625, -5.7734375, -5.5703125, -5.3671875, -5.1640625, -4.9609375, -4.7578125, -4.5546875, -4.3515625, -4.1484375, -3.9453125, -3.7421875, -3.5390625, -3.3359375, -3.1328125, -2.9296875, -2.7265625, -2.5234375, -2.3203125, -2.1171875, -1.9140625, -1.7109375, -1.5078125, -1.3046875, -1.1015625, -0.8984375, -0.6953125, -0.4921875, -0.2890625, -0.0859375, 0.1171875, 0.3203125, 0.5234375, 0.7265625, 0.9296875, 1.1328125, 1.3359375, 1.5390625, 1.7421875, 1.9453125, 2.1484375, 2.3515625, 2.5546875, 2.7578125, 2.9609375, 3.1640625, 3.3671875, 3.5703125, 3.7734375, 3.9765625, 4.1796875, 4.3828125, 4.5859375, 4.7890625, 4.9921875, 5.1953125, 5.3984375, 5.6015625, 5.8046875, 6.0078125, 6.2109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 13.0, 24.0, 37.0, 49.0, 76.0, 128.0, 193.0, 295.0, 468.0, 740.0, 1139.0, 1715.0, 2615.0, 3896.0, 5860.0, 8965.0, 13553.0, 20777.0, 31267.0, 46063.0, 66694.0, 93178.0, 121479.0, 143435.0, 133858.0, 106863.0, 78316.0, 55630.0, 37470.0, 25124.0, 16779.0, 10971.0, 7218.0, 4670.0, 3049.0, 2008.0, 1384.0, 872.0, 575.0, 392.0, 242.0, 165.0, 110.0, 70.0, 40.0, 31.0, 22.0, 11.0, 6.0, 11.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.7587890625, -0.736297607421875, -0.71380615234375, -0.691314697265625, -0.6688232421875, -0.646331787109375, -0.62384033203125, -0.601348876953125, -0.578857421875, -0.556365966796875, -0.53387451171875, -0.511383056640625, -0.4888916015625, -0.466400146484375, -0.44390869140625, -0.421417236328125, -0.39892578125, -0.376434326171875, -0.35394287109375, -0.331451416015625, -0.3089599609375, -0.286468505859375, -0.26397705078125, -0.241485595703125, -0.218994140625, -0.196502685546875, -0.17401123046875, -0.151519775390625, -0.1290283203125, -0.106536865234375, -0.08404541015625, -0.061553955078125, -0.0390625, -0.016571044921875, 0.00592041015625, 0.028411865234375, 0.0509033203125, 0.073394775390625, 0.09588623046875, 0.118377685546875, 0.140869140625, 0.163360595703125, 0.18585205078125, 0.208343505859375, 0.2308349609375, 0.253326416015625, 0.27581787109375, 0.298309326171875, 0.32080078125, 0.343292236328125, 0.36578369140625, 0.388275146484375, 0.4107666015625, 0.433258056640625, 0.45574951171875, 0.478240966796875, 0.500732421875, 0.523223876953125, 0.54571533203125, 0.568206787109375, 0.5906982421875, 0.613189697265625, 0.63568115234375, 0.658172607421875, 0.6806640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 9.0, 11.0, 14.0, 21.0, 13.0, 21.0, 18.0, 22.0, 26.0, 34.0, 25.0, 36.0, 40.0, 45.0, 39.0, 44.0, 43.0, 1061.0, 36.0, 41.0, 33.0, 25.0, 42.0, 29.0, 33.0, 35.0, 21.0, 33.0, 22.0, 20.0, 11.0, 12.0, 16.0, 13.0, 9.0, 6.0, 11.0, 9.0, 4.0, 2.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.515625, -4.382965087890625, -4.25030517578125, -4.117645263671875, -3.9849853515625, -3.852325439453125, -3.71966552734375, -3.587005615234375, -3.454345703125, -3.321685791015625, -3.18902587890625, -3.056365966796875, -2.9237060546875, -2.791046142578125, -2.65838623046875, -2.525726318359375, -2.39306640625, -2.260406494140625, -2.12774658203125, -1.995086669921875, -1.8624267578125, -1.729766845703125, -1.59710693359375, -1.464447021484375, -1.331787109375, -1.199127197265625, -1.06646728515625, -0.933807373046875, -0.8011474609375, -0.668487548828125, -0.53582763671875, -0.403167724609375, -0.2705078125, -0.137847900390625, -0.00518798828125, 0.127471923828125, 0.2601318359375, 0.392791748046875, 0.52545166015625, 0.658111572265625, 0.790771484375, 0.923431396484375, 1.05609130859375, 1.188751220703125, 1.3214111328125, 1.454071044921875, 1.58673095703125, 1.719390869140625, 1.85205078125, 1.984710693359375, 2.11737060546875, 2.250030517578125, 2.3826904296875, 2.515350341796875, 2.64801025390625, 2.780670166015625, 2.913330078125, 3.045989990234375, 3.17864990234375, 3.311309814453125, 3.4439697265625, 3.576629638671875, 3.70928955078125, 3.841949462890625, 3.974609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 10.0, 15.0, 34.0, 37.0, 40.0, 83.0, 97.0, 170.0, 231.0, 329.0, 467.0, 672.0, 1003.0, 1414.0, 2212.0, 3073.0, 4719.0, 6959.0, 10129.0, 15092.0, 22503.0, 32714.0, 47271.0, 66999.0, 91256.0, 118086.0, 1181075.0, 131636.0, 103993.0, 77584.0, 55409.0, 38982.0, 26800.0, 18151.0, 12214.0, 8305.0, 5519.0, 3708.0, 2688.0, 1678.0, 1152.0, 848.0, 590.0, 386.0, 234.0, 176.0, 133.0, 92.0, 53.0, 36.0, 32.0, 16.0, 12.0, 8.0, 6.0, 3.0], "bins": [-0.48876953125, -0.4746971130371094, -0.46062469482421875, -0.4465522766113281, -0.4324798583984375, -0.4184074401855469, -0.40433502197265625, -0.3902626037597656, -0.376190185546875, -0.3621177673339844, -0.34804534912109375, -0.3339729309082031, -0.3199005126953125, -0.3058280944824219, -0.29175567626953125, -0.2776832580566406, -0.26361083984375, -0.24953842163085938, -0.23546600341796875, -0.22139358520507812, -0.2073211669921875, -0.19324874877929688, -0.17917633056640625, -0.16510391235351562, -0.151031494140625, -0.13695907592773438, -0.12288665771484375, -0.10881423950195312, -0.0947418212890625, -0.08066940307617188, -0.06659698486328125, -0.052524566650390625, -0.0384521484375, -0.024379730224609375, -0.01030731201171875, 0.003765106201171875, 0.0178375244140625, 0.031909942626953125, 0.04598236083984375, 0.060054779052734375, 0.074127197265625, 0.08819961547851562, 0.10227203369140625, 0.11634445190429688, 0.1304168701171875, 0.14448928833007812, 0.15856170654296875, 0.17263412475585938, 0.18670654296875, 0.20077896118164062, 0.21485137939453125, 0.22892379760742188, 0.2429962158203125, 0.2570686340332031, 0.27114105224609375, 0.2852134704589844, 0.299285888671875, 0.3133583068847656, 0.32743072509765625, 0.3415031433105469, 0.3555755615234375, 0.3696479797363281, 0.38372039794921875, 0.3977928161621094, 0.411865234375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 3.0, 7.0, 9.0, 4.0, 9.0, 6.0, 5.0, 11.0, 13.0, 11.0, 19.0, 30.0, 28.0, 42.0, 43.0, 67.0, 101.0, 113.0, 105.0, 85.0, 59.0, 63.0, 32.0, 20.0, 25.0, 17.0, 10.0, 6.0, 5.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0081939697265625, -0.007952392101287842, -0.007710814476013184, -0.007469236850738525, -0.007227659225463867, -0.006986081600189209, -0.006744503974914551, -0.006502926349639893, -0.006261348724365234, -0.006019771099090576, -0.005778193473815918, -0.00553661584854126, -0.0052950382232666016, -0.005053460597991943, -0.004811882972717285, -0.004570305347442627, -0.004328727722167969, -0.0040871500968933105, -0.0038455724716186523, -0.003603994846343994, -0.003362417221069336, -0.0031208395957946777, -0.0028792619705200195, -0.0026376843452453613, -0.002396106719970703, -0.002154529094696045, -0.0019129514694213867, -0.0016713738441467285, -0.0014297962188720703, -0.0011882185935974121, -0.0009466409683227539, -0.0007050633430480957, -0.0004634857177734375, -0.0002219080924987793, 1.9669532775878906e-05, 0.0002612471580505371, 0.0005028247833251953, 0.0007444024085998535, 0.0009859800338745117, 0.00122755765914917, 0.0014691352844238281, 0.0017107129096984863, 0.0019522905349731445, 0.0021938681602478027, 0.002435445785522461, 0.002677023410797119, 0.0029186010360717773, 0.0031601786613464355, 0.0034017562866210938, 0.003643333911895752, 0.00388491153717041, 0.004126489162445068, 0.0043680667877197266, 0.004609644412994385, 0.004851222038269043, 0.005092799663543701, 0.005334377288818359, 0.005575954914093018, 0.005817532539367676, 0.006059110164642334, 0.006300687789916992, 0.00654226541519165, 0.006783843040466309, 0.007025420665740967, 0.007266998291015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 4.0, 8.0, 10.0, 14.0, 8.0, 13.0, 24.0, 27.0, 24.0, 59.0, 89.0, 128.0, 209.0, 395.0, 2126.0, 993118.0, 50650.0, 723.0, 285.0, 172.0, 114.0, 78.0, 57.0, 42.0, 29.0, 18.0, 17.0, 18.0, 8.0, 16.0, 17.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15022850036621094, -0.14518356323242188, -0.1401386260986328, -0.13509368896484375, -0.1300487518310547, -0.12500381469726562, -0.11995887756347656, -0.1149139404296875, -0.10986900329589844, -0.10482406616210938, -0.09977912902832031, -0.09473419189453125, -0.08968925476074219, -0.08464431762695312, -0.07959938049316406, -0.074554443359375, -0.06950950622558594, -0.06446456909179688, -0.05941963195800781, -0.05437469482421875, -0.04932975769042969, -0.044284820556640625, -0.03923988342285156, -0.0341949462890625, -0.029150009155273438, -0.024105072021484375, -0.019060134887695312, -0.01401519775390625, -0.008970260620117188, -0.003925323486328125, 0.0011196136474609375, 0.00616455078125, 0.011209487915039062, 0.016254425048828125, 0.021299362182617188, 0.02634429931640625, 0.03138923645019531, 0.036434173583984375, 0.04147911071777344, 0.0465240478515625, 0.05156898498535156, 0.056613922119140625, 0.06165885925292969, 0.06670379638671875, 0.07174873352050781, 0.07679367065429688, 0.08183860778808594, 0.086883544921875, 0.09192848205566406, 0.09697341918945312, 0.10201835632324219, 0.10706329345703125, 0.11210823059082031, 0.11715316772460938, 0.12219810485839844, 0.1272430419921875, 0.13228797912597656, 0.13733291625976562, 0.1423778533935547, 0.14742279052734375, 0.1524677276611328, 0.15751266479492188, 0.16255760192871094, 0.1676025390625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 240.0, 770.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13831637799739838, -0.13538292050361633, -0.1324494481086731, -0.12951599061489105, -0.12658251821994781, -0.12364906072616577, -0.12071559578180313, -0.11778213083744049, -0.11484867334365845, -0.1119152083992958, -0.10898174345493317, -0.10604828596115112, -0.10311482101678848, -0.10018135607242584, -0.0972478911280632, -0.09431442618370056, -0.09138096868991852, -0.08844750374555588, -0.08551403880119324, -0.0825805813074112, -0.07964711636304855, -0.07671365141868591, -0.07378018647432327, -0.07084672152996063, -0.06791325658559799, -0.06497979164123535, -0.06204633042216301, -0.05911286547780037, -0.05617940425872803, -0.05324593931436539, -0.05031247437000275, -0.047379013150930405, -0.04444555193185806, -0.04151208698749542, -0.03857862576842308, -0.03564516082406044, -0.0327116996049881, -0.029778234660625458, -0.026844771578907967, -0.023911308497190475, -0.020977845415472984, -0.018044382333755493, -0.015110919252038002, -0.012177455238997936, -0.009243992157280445, -0.006310529075562954, -0.003377065062522888, -0.00044360198080539703, 0.002489861100912094, 0.005423324182629585, 0.008356787264347076, 0.011290251277387142, 0.014223714359104633, 0.0171571783721447, 0.02009064145386219, 0.02302410453557968, 0.025957567617297173, 0.028891030699014664, 0.031824495643377304, 0.034757956862449646, 0.037691421806812286, 0.04062488302588463, 0.04355834797024727, 0.04649180918931961, 0.04942527413368225]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 6.0, 15.0, 11.0, 14.0, 15.0, 21.0, 26.0, 24.0, 49.0, 31.0, 41.0, 40.0, 55.0, 50.0, 52.0, 59.0, 50.0, 48.0, 47.0, 49.0, 40.0, 35.0, 28.0, 32.0, 27.0, 20.0, 30.0, 18.0, 20.0, 5.0, 11.0, 8.0, 7.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00505983829498291, -0.00487139355391264, -0.004682948812842369, -0.0044945040717720985, -0.004306059330701828, -0.0041176145896315575, -0.003929169848561287, -0.0037407251074910164, -0.003552280366420746, -0.0033638356253504753, -0.0031753908842802048, -0.0029869461432099342, -0.0027985014021396637, -0.002610056661069393, -0.0024216119199991226, -0.002233167178928852, -0.0020447224378585815, -0.001856277696788311, -0.0016678329557180405, -0.00147938821464777, -0.0012909434735774994, -0.0011024987325072289, -0.0009140539914369583, -0.0007256092503666878, -0.0005371645092964172, -0.0003487197682261467, -0.00016027502715587616, 2.816971391439438e-05, 0.00021661445498466492, 0.00040505919605493546, 0.000593503937125206, 0.0007819486781954765, 0.0009703934192657471, 0.0011588381603360176, 0.0013472829014062881, 0.0015357276424765587, 0.0017241723835468292, 0.0019126171246170998, 0.0021010618656873703, 0.002289506606757641, 0.0024779513478279114, 0.002666396088898182, 0.0028548408299684525, 0.003043285571038723, 0.0032317303121089935, 0.003420175053179264, 0.0036086197942495346, 0.003797064535319805, 0.003985509276390076, 0.004173954017460346, 0.004362398758530617, 0.004550843499600887, 0.004739288240671158, 0.004927732981741428, 0.005116177722811699, 0.0053046224638819695, 0.00549306720495224, 0.0056815119460225105, 0.005869956687092781, 0.006058401428163052, 0.006246846169233322, 0.006435290910303593, 0.006623735651373863, 0.006812180392444134, 0.007000625133514404]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 9.0, 2.0, 5.0, 11.0, 5.0, 11.0, 12.0, 16.0, 16.0, 20.0, 20.0, 26.0, 28.0, 26.0, 18.0, 36.0, 35.0, 39.0, 30.0, 35.0, 39.0, 38.0, 39.0, 37.0, 53.0, 38.0, 37.0, 36.0, 28.0, 30.0, 24.0, 28.0, 27.0, 27.0, 20.0, 15.0, 11.0, 16.0, 13.0, 16.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.7890625, -6.5859375, -6.3828125, -6.1796875, -5.9765625, -5.7734375, -5.5703125, -5.3671875, -5.1640625, -4.9609375, -4.7578125, -4.5546875, -4.3515625, -4.1484375, -3.9453125, -3.7421875, -3.5390625, -3.3359375, -3.1328125, -2.9296875, -2.7265625, -2.5234375, -2.3203125, -2.1171875, -1.9140625, -1.7109375, -1.5078125, -1.3046875, -1.1015625, -0.8984375, -0.6953125, -0.4921875, -0.2890625, -0.0859375, 0.1171875, 0.3203125, 0.5234375, 0.7265625, 0.9296875, 1.1328125, 1.3359375, 1.5390625, 1.7421875, 1.9453125, 2.1484375, 2.3515625, 2.5546875, 2.7578125, 2.9609375, 3.1640625, 3.3671875, 3.5703125, 3.7734375, 3.9765625, 4.1796875, 4.3828125, 4.5859375, 4.7890625, 4.9921875, 5.1953125, 5.3984375, 5.6015625, 5.8046875, 6.0078125, 6.2109375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 7.0, 7.0, 18.0, 21.0, 27.0, 34.0, 50.0, 68.0, 97.0, 128.0, 227.0, 334.0, 524.0, 892.0, 1481.0, 2631.0, 4586.0, 8621.0, 16851.0, 34984.0, 79921.0, 210423.0, 406995.0, 157703.0, 62884.0, 28287.0, 13807.0, 7292.0, 3983.0, 2232.0, 1299.0, 800.0, 438.0, 278.0, 181.0, 125.0, 87.0, 61.0, 41.0, 37.0, 15.0, 24.0, 14.0, 8.0, 6.0, 5.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.2734375, -8.02545166015625, -7.7774658203125, -7.52947998046875, -7.281494140625, -7.03350830078125, -6.7855224609375, -6.53753662109375, -6.28955078125, -6.04156494140625, -5.7935791015625, -5.54559326171875, -5.297607421875, -5.04962158203125, -4.8016357421875, -4.55364990234375, -4.3056640625, -4.05767822265625, -3.8096923828125, -3.56170654296875, -3.313720703125, -3.06573486328125, -2.8177490234375, -2.56976318359375, -2.32177734375, -2.07379150390625, -1.8258056640625, -1.57781982421875, -1.329833984375, -1.08184814453125, -0.8338623046875, -0.58587646484375, -0.337890625, -0.08990478515625, 0.1580810546875, 0.40606689453125, 0.654052734375, 0.90203857421875, 1.1500244140625, 1.39801025390625, 1.64599609375, 1.89398193359375, 2.1419677734375, 2.38995361328125, 2.637939453125, 2.88592529296875, 3.1339111328125, 3.38189697265625, 3.6298828125, 3.87786865234375, 4.1258544921875, 4.37384033203125, 4.621826171875, 4.86981201171875, 5.1177978515625, 5.36578369140625, 5.61376953125, 5.86175537109375, 6.1097412109375, 6.35772705078125, 6.605712890625, 6.85369873046875, 7.1016845703125, 7.34967041015625, 7.59765625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 12.0, 17.0, 21.0, 17.0, 31.0, 20.0, 28.0, 26.0, 35.0, 33.0, 42.0, 63.0, 89.0, 98.0, 230.0, 1507.0, 158.0, 85.0, 96.0, 52.0, 59.0, 50.0, 33.0, 29.0, 28.0, 22.0, 22.0, 21.0, 18.0, 10.0, 11.0, 12.0, 8.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.671875, -19.062744140625, -18.45361328125, -17.844482421875, -17.2353515625, -16.626220703125, -16.01708984375, -15.407958984375, -14.798828125, -14.189697265625, -13.58056640625, -12.971435546875, -12.3623046875, -11.753173828125, -11.14404296875, -10.534912109375, -9.92578125, -9.316650390625, -8.70751953125, -8.098388671875, -7.4892578125, -6.880126953125, -6.27099609375, -5.661865234375, -5.052734375, -4.443603515625, -3.83447265625, -3.225341796875, -2.6162109375, -2.007080078125, -1.39794921875, -0.788818359375, -0.1796875, 0.429443359375, 1.03857421875, 1.647705078125, 2.2568359375, 2.865966796875, 3.47509765625, 4.084228515625, 4.693359375, 5.302490234375, 5.91162109375, 6.520751953125, 7.1298828125, 7.739013671875, 8.34814453125, 8.957275390625, 9.56640625, 10.175537109375, 10.78466796875, 11.393798828125, 12.0029296875, 12.612060546875, 13.22119140625, 13.830322265625, 14.439453125, 15.048583984375, 15.65771484375, 16.266845703125, 16.8759765625, 17.485107421875, 18.09423828125, 18.703369140625, 19.3125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 5.0, 7.0, 5.0, 12.0, 18.0, 22.0, 23.0, 36.0, 49.0, 45.0, 83.0, 106.0, 143.0, 192.0, 297.0, 673.0, 2755.0, 32923.0, 1222219.0, 1842467.0, 38746.0, 3190.0, 683.0, 277.0, 177.0, 159.0, 110.0, 72.0, 61.0, 37.0, 31.0, 25.0, 12.0, 10.0, 11.0, 5.0, 7.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.75, -23.866943359375, -22.98388671875, -22.100830078125, -21.2177734375, -20.334716796875, -19.45166015625, -18.568603515625, -17.685546875, -16.802490234375, -15.91943359375, -15.036376953125, -14.1533203125, -13.270263671875, -12.38720703125, -11.504150390625, -10.62109375, -9.738037109375, -8.85498046875, -7.971923828125, -7.0888671875, -6.205810546875, -5.32275390625, -4.439697265625, -3.556640625, -2.673583984375, -1.79052734375, -0.907470703125, -0.0244140625, 0.858642578125, 1.74169921875, 2.624755859375, 3.5078125, 4.390869140625, 5.27392578125, 6.156982421875, 7.0400390625, 7.923095703125, 8.80615234375, 9.689208984375, 10.572265625, 11.455322265625, 12.33837890625, 13.221435546875, 14.1044921875, 14.987548828125, 15.87060546875, 16.753662109375, 17.63671875, 18.519775390625, 19.40283203125, 20.285888671875, 21.1689453125, 22.052001953125, 22.93505859375, 23.818115234375, 24.701171875, 25.584228515625, 26.46728515625, 27.350341796875, 28.2333984375, 29.116455078125, 29.99951171875, 30.882568359375, 31.765625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 48.0, 505.0, 421.0, 40.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.5990219116211, -97.46178436279297, -92.32453918457031, -87.18730163574219, -82.05006408691406, -76.91282653808594, -71.77558135986328, -66.63834381103516, -61.501102447509766, -56.363861083984375, -51.22662353515625, -46.08938217163086, -40.95214080810547, -35.814903259277344, -30.677661895751953, -25.540424346923828, -20.403182983398438, -15.26594352722168, -10.128703117370605, -4.991462707519531, 0.14577674865722656, 5.283016204833984, 10.420257568359375, 15.5574951171875, 20.69473648071289, 25.83197593688965, 30.969215393066406, 36.1064567565918, 41.24369812011719, 46.38093566894531, 51.5181770324707, 56.65541458129883, 61.79266357421875, 66.92990112304688, 72.06714630126953, 77.20438385009766, 82.34162139892578, 87.47886657714844, 92.61610412597656, 97.75334167480469, 102.89057922363281, 108.02781677246094, 113.1650619506836, 118.30229949951172, 123.43953704833984, 128.5767822265625, 133.71401977539062, 138.85125732421875, 143.98849487304688, 149.125732421875, 154.26296997070312, 159.40020751953125, 164.53746032714844, 169.67469787597656, 174.8119354248047, 179.9491729736328, 185.08642578125, 190.22366333007812, 195.36090087890625, 200.49813842773438, 205.63539123535156, 210.7726287841797, 215.9098663330078, 221.04710388183594, 226.18434143066406]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 6.0, 11.0, 7.0, 12.0, 16.0, 21.0, 27.0, 25.0, 34.0, 40.0, 40.0, 42.0, 42.0, 48.0, 44.0, 35.0, 39.0, 51.0, 46.0, 41.0, 44.0, 45.0, 37.0, 38.0, 31.0, 35.0, 17.0, 25.0, 19.0, 16.0, 13.0, 13.0, 5.0, 7.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-63.679962158203125, -62.05965805053711, -60.439353942871094, -58.81904983520508, -57.19874572753906, -55.57844161987305, -53.95813751220703, -52.33782958984375, -50.717529296875, -49.097225189208984, -47.47692108154297, -45.85661697387695, -44.23631286621094, -42.61600875854492, -40.995704650878906, -39.375396728515625, -37.75509262084961, -36.134788513183594, -34.51448440551758, -32.89418029785156, -31.273876190185547, -29.65357208251953, -28.033266067504883, -26.412961959838867, -24.79265785217285, -23.172353744506836, -21.55204963684082, -19.931743621826172, -18.311439514160156, -16.69113540649414, -15.070831298828125, -13.45052719116211, -11.83022689819336, -10.209922790527344, -8.589618682861328, -6.969313621520996, -5.3490095138549805, -3.728705406188965, -2.108400344848633, -0.4880962371826172, 1.1322078704833984, 2.752512216567993, 4.372816562652588, 5.993121147155762, 7.613425254821777, 9.233729362487793, 10.854034423828125, 12.47433853149414, 14.094642639160156, 15.714946746826172, 17.335250854492188, 18.955554962158203, 20.57585906982422, 22.196163177490234, 23.816469192504883, 25.4367733001709, 27.057077407836914, 28.67738151550293, 30.297685623168945, 31.917991638183594, 33.53829574584961, 35.158599853515625, 36.77890396118164, 38.399208068847656, 40.01951217651367]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 10.0, 6.0, 8.0, 11.0, 21.0, 14.0, 16.0, 15.0, 29.0, 27.0, 21.0, 28.0, 34.0, 35.0, 39.0, 33.0, 44.0, 51.0, 49.0, 43.0, 44.0, 50.0, 28.0, 26.0, 34.0, 28.0, 29.0, 24.0, 24.0, 27.0, 19.0, 24.0, 26.0, 14.0, 13.0, 13.0, 9.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -7.0284423828125, -6.810791015625, -6.5931396484375, -6.37548828125, -6.1578369140625, -5.940185546875, -5.7225341796875, -5.5048828125, -5.2872314453125, -5.069580078125, -4.8519287109375, -4.63427734375, -4.4166259765625, -4.198974609375, -3.9813232421875, -3.763671875, -3.5460205078125, -3.328369140625, -3.1107177734375, -2.89306640625, -2.6754150390625, -2.457763671875, -2.2401123046875, -2.0224609375, -1.8048095703125, -1.587158203125, -1.3695068359375, -1.15185546875, -0.9342041015625, -0.716552734375, -0.4989013671875, -0.28125, -0.0635986328125, 0.154052734375, 0.3717041015625, 0.58935546875, 0.8070068359375, 1.024658203125, 1.2423095703125, 1.4599609375, 1.6776123046875, 1.895263671875, 2.1129150390625, 2.33056640625, 2.5482177734375, 2.765869140625, 2.9835205078125, 3.201171875, 3.4188232421875, 3.636474609375, 3.8541259765625, 4.07177734375, 4.2894287109375, 4.507080078125, 4.7247314453125, 4.9423828125, 5.1600341796875, 5.377685546875, 5.5953369140625, 5.81298828125, 6.0306396484375, 6.248291015625, 6.4659423828125, 6.68359375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 19.0, 22.0, 34.0, 58.0, 103.0, 181.0, 303.0, 676.0, 1304.0, 3164.0, 8600.0, 27826.0, 134819.0, 1077231.0, 2388049.0, 457576.0, 66908.0, 17211.0, 5855.0, 2211.0, 1014.0, 500.0, 279.0, 136.0, 81.0, 38.0, 30.0, 16.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7249755859375, -10.317138671875, -9.9093017578125, -9.50146484375, -9.0936279296875, -8.685791015625, -8.2779541015625, -7.8701171875, -7.4622802734375, -7.054443359375, -6.6466064453125, -6.23876953125, -5.8309326171875, -5.423095703125, -5.0152587890625, -4.607421875, -4.1995849609375, -3.791748046875, -3.3839111328125, -2.97607421875, -2.5682373046875, -2.160400390625, -1.7525634765625, -1.3447265625, -0.9368896484375, -0.529052734375, -0.1212158203125, 0.28662109375, 0.6944580078125, 1.102294921875, 1.5101318359375, 1.91796875, 2.3258056640625, 2.733642578125, 3.1414794921875, 3.54931640625, 3.9571533203125, 4.364990234375, 4.7728271484375, 5.1806640625, 5.5885009765625, 5.996337890625, 6.4041748046875, 6.81201171875, 7.2198486328125, 7.627685546875, 8.0355224609375, 8.443359375, 8.8511962890625, 9.259033203125, 9.6668701171875, 10.07470703125, 10.4825439453125, 10.890380859375, 11.2982177734375, 11.7060546875, 12.1138916015625, 12.521728515625, 12.9295654296875, 13.33740234375, 13.7452392578125, 14.153076171875, 14.5609130859375, 14.96875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 10.0, 3.0, 13.0, 9.0, 9.0, 17.0, 18.0, 19.0, 36.0, 40.0, 70.0, 79.0, 84.0, 120.0, 199.0, 240.0, 316.0, 397.0, 452.0, 466.0, 338.0, 290.0, 196.0, 148.0, 100.0, 99.0, 65.0, 51.0, 31.0, 30.0, 31.0, 18.0, 12.0, 14.0, 8.0, 5.0, 8.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.453125, -9.18731689453125, -8.9215087890625, -8.65570068359375, -8.389892578125, -8.12408447265625, -7.8582763671875, -7.59246826171875, -7.32666015625, -7.06085205078125, -6.7950439453125, -6.52923583984375, -6.263427734375, -5.99761962890625, -5.7318115234375, -5.46600341796875, -5.2001953125, -4.93438720703125, -4.6685791015625, -4.40277099609375, -4.136962890625, -3.87115478515625, -3.6053466796875, -3.33953857421875, -3.07373046875, -2.80792236328125, -2.5421142578125, -2.27630615234375, -2.010498046875, -1.74468994140625, -1.4788818359375, -1.21307373046875, -0.947265625, -0.68145751953125, -0.4156494140625, -0.14984130859375, 0.115966796875, 0.38177490234375, 0.6475830078125, 0.91339111328125, 1.17919921875, 1.44500732421875, 1.7108154296875, 1.97662353515625, 2.242431640625, 2.50823974609375, 2.7740478515625, 3.03985595703125, 3.3056640625, 3.57147216796875, 3.8372802734375, 4.10308837890625, 4.368896484375, 4.63470458984375, 4.9005126953125, 5.16632080078125, 5.43212890625, 5.69793701171875, 5.9637451171875, 6.22955322265625, 6.495361328125, 6.76116943359375, 7.0269775390625, 7.29278564453125, 7.55859375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 5.0, 4.0, 8.0, 22.0, 23.0, 40.0, 45.0, 73.0, 101.0, 143.0, 266.0, 547.0, 1208.0, 3103.0, 9445.0, 32981.0, 140897.0, 1024531.0, 2564029.0, 327664.0, 63788.0, 16601.0, 5151.0, 1855.0, 776.0, 357.0, 217.0, 110.0, 77.0, 57.0, 46.0, 31.0, 12.0, 9.0, 17.0, 10.0, 4.0, 7.0, 4.0, 5.0, 1.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.4420166015625, -10.969970703125, -10.4979248046875, -10.02587890625, -9.5538330078125, -9.081787109375, -8.6097412109375, -8.1376953125, -7.6656494140625, -7.193603515625, -6.7215576171875, -6.24951171875, -5.7774658203125, -5.305419921875, -4.8333740234375, -4.361328125, -3.8892822265625, -3.417236328125, -2.9451904296875, -2.47314453125, -2.0010986328125, -1.529052734375, -1.0570068359375, -0.5849609375, -0.1129150390625, 0.359130859375, 0.8311767578125, 1.30322265625, 1.7752685546875, 2.247314453125, 2.7193603515625, 3.19140625, 3.6634521484375, 4.135498046875, 4.6075439453125, 5.07958984375, 5.5516357421875, 6.023681640625, 6.4957275390625, 6.9677734375, 7.4398193359375, 7.911865234375, 8.3839111328125, 8.85595703125, 9.3280029296875, 9.800048828125, 10.2720947265625, 10.744140625, 11.2161865234375, 11.688232421875, 12.1602783203125, 12.63232421875, 13.1043701171875, 13.576416015625, 14.0484619140625, 14.5205078125, 14.9925537109375, 15.464599609375, 15.9366455078125, 16.40869140625, 16.8807373046875, 17.352783203125, 17.8248291015625, 18.296875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 14.0, 69.0, 155.0, 303.0, 291.0, 134.0, 42.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-177.25592041015625, -173.464599609375, -169.6732635498047, -165.88194274902344, -162.09060668945312, -158.29928588867188, -154.50794982910156, -150.7166290283203, -146.92529296875, -143.13397216796875, -139.34263610839844, -135.5513153076172, -131.75997924804688, -127.96865844726562, -124.17733001708984, -120.38600158691406, -116.59468078613281, -112.80335235595703, -109.01202392578125, -105.22069549560547, -101.42936706542969, -97.63804626464844, -93.84671783447266, -90.05538940429688, -86.2640609741211, -82.47273254394531, -78.68140411376953, -74.89007568359375, -71.0987548828125, -67.30741882324219, -63.51609802246094, -59.724769592285156, -55.933433532714844, -52.14210510253906, -48.35077667236328, -44.559452056884766, -40.768123626708984, -36.9767951965332, -33.18547058105469, -29.394142150878906, -25.602813720703125, -21.811485290527344, -18.020158767700195, -14.22883129119873, -10.437503814697266, -6.646175384521484, -2.854848861694336, 0.9364776611328125, 4.727806091308594, 8.519133567810059, 12.310461044311523, 16.101787567138672, 19.893115997314453, 23.684444427490234, 27.475770950317383, 31.26709747314453, 35.05842590332031, 38.849754333496094, 42.641082763671875, 46.43240737915039, 50.22373580932617, 54.01506423950195, 57.80638885498047, 61.59771728515625, 65.38904571533203]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 3.0, 8.0, 7.0, 7.0, 11.0, 5.0, 14.0, 10.0, 17.0, 25.0, 25.0, 16.0, 27.0, 24.0, 32.0, 25.0, 29.0, 35.0, 57.0, 39.0, 39.0, 45.0, 52.0, 53.0, 40.0, 31.0, 31.0, 36.0, 27.0, 33.0, 38.0, 28.0, 23.0, 18.0, 17.0, 12.0, 14.0, 14.0, 10.0, 8.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.863357543945312, -29.7106876373291, -28.558019638061523, -27.405349731445312, -26.252681732177734, -25.100011825561523, -23.947341918945312, -22.794673919677734, -21.642004013061523, -20.489334106445312, -19.336666107177734, -18.183996200561523, -17.031326293945312, -15.878658294677734, -14.725988388061523, -13.573319435119629, -12.420650482177734, -11.26798152923584, -10.115312576293945, -8.962642669677734, -7.80997371673584, -6.657304763793945, -5.504635334014893, -4.35196590423584, -3.1992969512939453, -2.0466277599334717, -0.893958568572998, 0.2587106227874756, 1.4113798141479492, 2.5640487670898438, 3.7167181968688965, 4.869387626647949, 6.022056579589844, 7.174725532531738, 8.327394485473633, 9.480064392089844, 10.632733345031738, 11.785402297973633, 12.938072204589844, 14.090741157531738, 15.243410110473633, 16.396080017089844, 17.548748016357422, 18.701417922973633, 19.854087829589844, 21.006755828857422, 22.159425735473633, 23.312095642089844, 24.464763641357422, 25.617433547973633, 26.77010154724121, 27.922771453857422, 29.075439453125, 30.22810935974121, 31.380779266357422, 32.533447265625, 33.686119079589844, 34.83878707885742, 35.991458892822266, 37.144126892089844, 38.29679489135742, 39.449462890625, 40.602134704589844, 41.75480270385742, 42.907470703125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 12.0, 15.0, 11.0, 11.0, 11.0, 6.0, 15.0, 16.0, 27.0, 29.0, 28.0, 25.0, 34.0, 32.0, 40.0, 38.0, 48.0, 36.0, 38.0, 32.0, 38.0, 39.0, 38.0, 30.0, 29.0, 32.0, 29.0, 29.0, 26.0, 26.0, 25.0, 20.0, 26.0, 13.0, 16.0, 5.0, 8.0, 7.0, 5.0, 6.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.3359375, -6.133544921875, -5.93115234375, -5.728759765625, -5.5263671875, -5.323974609375, -5.12158203125, -4.919189453125, -4.716796875, -4.514404296875, -4.31201171875, -4.109619140625, -3.9072265625, -3.704833984375, -3.50244140625, -3.300048828125, -3.09765625, -2.895263671875, -2.69287109375, -2.490478515625, -2.2880859375, -2.085693359375, -1.88330078125, -1.680908203125, -1.478515625, -1.276123046875, -1.07373046875, -0.871337890625, -0.6689453125, -0.466552734375, -0.26416015625, -0.061767578125, 0.140625, 0.343017578125, 0.54541015625, 0.747802734375, 0.9501953125, 1.152587890625, 1.35498046875, 1.557373046875, 1.759765625, 1.962158203125, 2.16455078125, 2.366943359375, 2.5693359375, 2.771728515625, 2.97412109375, 3.176513671875, 3.37890625, 3.581298828125, 3.78369140625, 3.986083984375, 4.1884765625, 4.390869140625, 4.59326171875, 4.795654296875, 4.998046875, 5.200439453125, 5.40283203125, 5.605224609375, 5.8076171875, 6.010009765625, 6.21240234375, 6.414794921875, 6.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 4.0, 5.0, 13.0, 24.0, 46.0, 58.0, 102.0, 135.0, 238.0, 344.0, 543.0, 932.0, 1447.0, 2380.0, 3876.0, 6308.0, 9960.0, 15891.0, 25865.0, 40709.0, 63095.0, 95757.0, 138375.0, 171510.0, 154023.0, 111260.0, 74743.0, 48636.0, 31086.0, 19583.0, 12087.0, 7498.0, 4532.0, 2844.0, 1728.0, 1118.0, 651.0, 401.0, 306.0, 155.0, 98.0, 65.0, 59.0, 28.0, 19.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82763671875, -0.8006744384765625, -0.773712158203125, -0.7467498779296875, -0.71978759765625, -0.6928253173828125, -0.665863037109375, -0.6389007568359375, -0.6119384765625, -0.5849761962890625, -0.558013916015625, -0.5310516357421875, -0.50408935546875, -0.4771270751953125, -0.450164794921875, -0.4232025146484375, -0.396240234375, -0.3692779541015625, -0.342315673828125, -0.3153533935546875, -0.28839111328125, -0.2614288330078125, -0.234466552734375, -0.2075042724609375, -0.1805419921875, -0.1535797119140625, -0.126617431640625, -0.0996551513671875, -0.07269287109375, -0.0457305908203125, -0.018768310546875, 0.0081939697265625, 0.03515625, 0.0621185302734375, 0.089080810546875, 0.1160430908203125, 0.14300537109375, 0.1699676513671875, 0.196929931640625, 0.2238922119140625, 0.2508544921875, 0.2778167724609375, 0.304779052734375, 0.3317413330078125, 0.35870361328125, 0.3856658935546875, 0.412628173828125, 0.4395904541015625, 0.466552734375, 0.4935150146484375, 0.520477294921875, 0.5474395751953125, 0.57440185546875, 0.6013641357421875, 0.628326416015625, 0.6552886962890625, 0.6822509765625, 0.7092132568359375, 0.736175537109375, 0.7631378173828125, 0.79010009765625, 0.8170623779296875, 0.844024658203125, 0.8709869384765625, 0.89794921875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 9.0, 7.0, 11.0, 13.0, 11.0, 18.0, 19.0, 17.0, 19.0, 30.0, 34.0, 27.0, 38.0, 42.0, 39.0, 30.0, 41.0, 31.0, 1066.0, 47.0, 35.0, 42.0, 32.0, 46.0, 27.0, 30.0, 26.0, 30.0, 23.0, 19.0, 20.0, 23.0, 20.0, 12.0, 15.0, 9.0, 9.0, 8.0, 8.0, 3.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0], "bins": [-5.0078125, -4.864013671875, -4.72021484375, -4.576416015625, -4.4326171875, -4.288818359375, -4.14501953125, -4.001220703125, -3.857421875, -3.713623046875, -3.56982421875, -3.426025390625, -3.2822265625, -3.138427734375, -2.99462890625, -2.850830078125, -2.70703125, -2.563232421875, -2.41943359375, -2.275634765625, -2.1318359375, -1.988037109375, -1.84423828125, -1.700439453125, -1.556640625, -1.412841796875, -1.26904296875, -1.125244140625, -0.9814453125, -0.837646484375, -0.69384765625, -0.550048828125, -0.40625, -0.262451171875, -0.11865234375, 0.025146484375, 0.1689453125, 0.312744140625, 0.45654296875, 0.600341796875, 0.744140625, 0.887939453125, 1.03173828125, 1.175537109375, 1.3193359375, 1.463134765625, 1.60693359375, 1.750732421875, 1.89453125, 2.038330078125, 2.18212890625, 2.325927734375, 2.4697265625, 2.613525390625, 2.75732421875, 2.901123046875, 3.044921875, 3.188720703125, 3.33251953125, 3.476318359375, 3.6201171875, 3.763916015625, 3.90771484375, 4.051513671875, 4.1953125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 12.0, 9.0, 17.0, 25.0, 38.0, 47.0, 70.0, 122.0, 183.0, 267.0, 394.0, 598.0, 927.0, 1471.0, 2177.0, 3460.0, 5466.0, 8529.0, 13471.0, 21432.0, 33223.0, 51462.0, 78590.0, 114058.0, 148397.0, 1204543.0, 132328.0, 95965.0, 64640.0, 41726.0, 26819.0, 16916.0, 10597.0, 6863.0, 4344.0, 2750.0, 1772.0, 1160.0, 782.0, 469.0, 338.0, 220.0, 143.0, 106.0, 64.0, 46.0, 32.0, 21.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0], "bins": [-0.61572265625, -0.597747802734375, -0.57977294921875, -0.561798095703125, -0.5438232421875, -0.525848388671875, -0.50787353515625, -0.489898681640625, -0.471923828125, -0.453948974609375, -0.43597412109375, -0.417999267578125, -0.4000244140625, -0.382049560546875, -0.36407470703125, -0.346099853515625, -0.328125, -0.310150146484375, -0.29217529296875, -0.274200439453125, -0.2562255859375, -0.238250732421875, -0.22027587890625, -0.202301025390625, -0.184326171875, -0.166351318359375, -0.14837646484375, -0.130401611328125, -0.1124267578125, -0.094451904296875, -0.07647705078125, -0.058502197265625, -0.04052734375, -0.022552490234375, -0.00457763671875, 0.013397216796875, 0.0313720703125, 0.049346923828125, 0.06732177734375, 0.085296630859375, 0.103271484375, 0.121246337890625, 0.13922119140625, 0.157196044921875, 0.1751708984375, 0.193145751953125, 0.21112060546875, 0.229095458984375, 0.2470703125, 0.265045166015625, 0.28302001953125, 0.300994873046875, 0.3189697265625, 0.336944580078125, 0.35491943359375, 0.372894287109375, 0.390869140625, 0.408843994140625, 0.42681884765625, 0.444793701171875, 0.4627685546875, 0.480743408203125, 0.49871826171875, 0.516693115234375, 0.53466796875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 9.0, 12.0, 21.0, 16.0, 32.0, 43.0, 62.0, 94.0, 139.0, 153.0, 122.0, 74.0, 44.0, 31.0, 32.0, 15.0, 14.0, 11.0, 12.0, 4.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01031494140625, -0.009949445724487305, -0.00958395004272461, -0.009218454360961914, -0.008852958679199219, -0.008487462997436523, -0.008121967315673828, -0.007756471633911133, -0.0073909759521484375, -0.007025480270385742, -0.006659984588623047, -0.0062944889068603516, -0.005928993225097656, -0.005563497543334961, -0.005198001861572266, -0.00483250617980957, -0.004467010498046875, -0.00410151481628418, -0.0037360191345214844, -0.003370523452758789, -0.0030050277709960938, -0.0026395320892333984, -0.002274036407470703, -0.0019085407257080078, -0.0015430450439453125, -0.0011775493621826172, -0.0008120536804199219, -0.00044655799865722656, -8.106231689453125e-05, 0.00028443336486816406, 0.0006499290466308594, 0.0010154247283935547, 0.00138092041015625, 0.0017464160919189453, 0.0021119117736816406, 0.002477407455444336, 0.0028429031372070312, 0.0032083988189697266, 0.003573894500732422, 0.003939390182495117, 0.0043048858642578125, 0.004670381546020508, 0.005035877227783203, 0.0054013729095458984, 0.005766868591308594, 0.006132364273071289, 0.006497859954833984, 0.00686335563659668, 0.007228851318359375, 0.00759434700012207, 0.007959842681884766, 0.008325338363647461, 0.008690834045410156, 0.009056329727172852, 0.009421825408935547, 0.009787321090698242, 0.010152816772460938, 0.010518312454223633, 0.010883808135986328, 0.011249303817749023, 0.011614799499511719, 0.011980295181274414, 0.01234579086303711, 0.012711286544799805, 0.0130767822265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 5.0, 0.0, 2.0, 7.0, 5.0, 7.0, 4.0, 11.0, 14.0, 18.0, 22.0, 32.0, 39.0, 75.0, 98.0, 178.0, 383.0, 3481.0, 1009110.0, 33573.0, 851.0, 235.0, 127.0, 77.0, 57.0, 43.0, 29.0, 11.0, 15.0, 10.0, 8.0, 6.0, 4.0, 7.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.28076171875, -0.2729072570800781, -0.26505279541015625, -0.2571983337402344, -0.2493438720703125, -0.24148941040039062, -0.23363494873046875, -0.22578048706054688, -0.217926025390625, -0.21007156372070312, -0.20221710205078125, -0.19436264038085938, -0.1865081787109375, -0.17865371704101562, -0.17079925537109375, -0.16294479370117188, -0.15509033203125, -0.14723587036132812, -0.13938140869140625, -0.13152694702148438, -0.1236724853515625, -0.11581802368164062, -0.10796356201171875, -0.10010910034179688, -0.092254638671875, -0.08440017700195312, -0.07654571533203125, -0.06869125366210938, -0.0608367919921875, -0.052982330322265625, -0.04512786865234375, -0.037273406982421875, -0.0294189453125, -0.021564483642578125, -0.01371002197265625, -0.005855560302734375, 0.0019989013671875, 0.009853363037109375, 0.01770782470703125, 0.025562286376953125, 0.033416748046875, 0.041271209716796875, 0.04912567138671875, 0.056980133056640625, 0.0648345947265625, 0.07268905639648438, 0.08054351806640625, 0.08839797973632812, 0.09625244140625, 0.10410690307617188, 0.11196136474609375, 0.11981582641601562, 0.1276702880859375, 0.13552474975585938, 0.14337921142578125, 0.15123367309570312, 0.159088134765625, 0.16694259643554688, 0.17479705810546875, 0.18265151977539062, 0.1905059814453125, 0.19836044311523438, 0.20621490478515625, 0.21406936645507812, 0.221923828125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 34.0, 286.0, 606.0, 81.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00883872527629137, -0.00674484483897686, -0.004650963936001062, -0.0025570830330252647, -0.0004632025957107544, 0.001630677841603756, 0.003724559210240841, 0.005818439647555351, 0.007912320084869862, 0.010006200522184372, 0.012100081890821457, 0.014193962328135967, 0.016287842765450478, 0.018381722271442413, 0.0204756036400795, 0.022569485008716583, 0.024663366377353668, 0.026757247745990753, 0.02885112725198269, 0.030945008620619774, 0.03303888812661171, 0.035132769495248795, 0.03722665086388588, 0.039320532232522964, 0.04141440987586975, 0.043508291244506836, 0.04560217261314392, 0.047696053981781006, 0.04978993162512779, 0.05188381299376488, 0.05397769436240196, 0.05607157573103905, 0.058165453374385834, 0.06025933474302292, 0.062353216111660004, 0.06444709748029709, 0.06654097884893417, 0.06863485276699066, 0.07072873413562775, 0.07282261550426483, 0.07491649687290192, 0.077010378241539, 0.07910425961017609, 0.08119814097881317, 0.08329202234745026, 0.08538590371608734, 0.08747978508472443, 0.08957365900278091, 0.0916675478219986, 0.09376142919063568, 0.09585531055927277, 0.09794919192790985, 0.10004307329654694, 0.10213695466518402, 0.1042308360338211, 0.1063247099518776, 0.10841859132051468, 0.11051247268915176, 0.11260635405778885, 0.11470023542642593, 0.11679411679506302, 0.1188879907131195, 0.12098187208175659, 0.12307575345039368, 0.12516963481903076]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 10.0, 4.0, 10.0, 9.0, 8.0, 12.0, 18.0, 20.0, 23.0, 21.0, 17.0, 35.0, 26.0, 34.0, 37.0, 36.0, 41.0, 31.0, 53.0, 48.0, 50.0, 43.0, 33.0, 41.0, 25.0, 32.0, 31.0, 33.0, 34.0, 27.0, 10.0, 22.0, 15.0, 26.0, 10.0, 15.0, 13.0, 11.0, 7.0, 7.0, 8.0, 8.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006030440330505371, -0.005854674614965916, -0.00567890889942646, -0.005503143183887005, -0.0053273774683475494, -0.005151611752808094, -0.004975846037268639, -0.004800080321729183, -0.004624314606189728, -0.004448548890650272, -0.004272783175110817, -0.0040970174595713615, -0.003921251744031906, -0.0037454860284924507, -0.0035697203129529953, -0.00339395459741354, -0.0032181888818740845, -0.003042423166334629, -0.0028666574507951736, -0.0026908917352557182, -0.002515126019716263, -0.0023393603041768074, -0.002163594588637352, -0.0019878288730978966, -0.0018120631575584412, -0.0016362974420189857, -0.0014605317264795303, -0.001284766010940075, -0.0011090002954006195, -0.0009332345798611641, -0.0007574688643217087, -0.0005817031487822533, -0.00040593743324279785, -0.00023017171770334244, -5.4406002163887024e-05, 0.00012135971337556839, 0.0002971254289150238, 0.0004728911444544792, 0.0006486568599939346, 0.00082442257553339, 0.0010001882910728455, 0.0011759540066123009, 0.0013517197221517563, 0.0015274854376912117, 0.0017032511532306671, 0.0018790168687701225, 0.002054782584309578, 0.0022305482998490334, 0.0024063140153884888, 0.002582079730927944, 0.0027578454464673996, 0.002933611162006855, 0.0031093768775463104, 0.003285142593085766, 0.0034609083086252213, 0.0036366740241646767, 0.003812439739704132, 0.0039882054552435875, 0.004163971170783043, 0.004339736886322498, 0.004515502601861954, 0.004691268317401409, 0.0048670340329408646, 0.00504279974848032, 0.005218565464019775]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 6.0, 12.0, 15.0, 11.0, 11.0, 11.0, 6.0, 15.0, 16.0, 27.0, 29.0, 28.0, 25.0, 34.0, 32.0, 40.0, 38.0, 47.0, 37.0, 38.0, 32.0, 38.0, 39.0, 38.0, 31.0, 28.0, 32.0, 29.0, 29.0, 26.0, 26.0, 25.0, 20.0, 26.0, 13.0, 16.0, 5.0, 8.0, 6.0, 6.0, 6.0, 10.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-6.3359375, -6.133544921875, -5.93115234375, -5.728759765625, -5.5263671875, -5.323974609375, -5.12158203125, -4.919189453125, -4.716796875, -4.514404296875, -4.31201171875, -4.109619140625, -3.9072265625, -3.704833984375, -3.50244140625, -3.300048828125, -3.09765625, -2.895263671875, -2.69287109375, -2.490478515625, -2.2880859375, -2.085693359375, -1.88330078125, -1.680908203125, -1.478515625, -1.276123046875, -1.07373046875, -0.871337890625, -0.6689453125, -0.466552734375, -0.26416015625, -0.061767578125, 0.140625, 0.343017578125, 0.54541015625, 0.747802734375, 0.9501953125, 1.152587890625, 1.35498046875, 1.557373046875, 1.759765625, 1.962158203125, 2.16455078125, 2.366943359375, 2.5693359375, 2.771728515625, 2.97412109375, 3.176513671875, 3.37890625, 3.581298828125, 3.78369140625, 3.986083984375, 4.1884765625, 4.390869140625, 4.59326171875, 4.795654296875, 4.998046875, 5.200439453125, 5.40283203125, 5.605224609375, 5.8076171875, 6.010009765625, 6.21240234375, 6.414794921875, 6.6171875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 10.0, 7.0, 8.0, 18.0, 19.0, 16.0, 34.0, 42.0, 56.0, 69.0, 120.0, 151.0, 226.0, 354.0, 543.0, 962.0, 1827.0, 3404.0, 7218.0, 15661.0, 35507.0, 87883.0, 295242.0, 399833.0, 117166.0, 44830.0, 19206.0, 8750.0, 4267.0, 2075.0, 1119.0, 633.0, 402.0, 276.0, 191.0, 100.0, 78.0, 58.0, 57.0, 35.0, 22.0, 12.0, 19.0, 9.0, 15.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.4140625, -9.1116943359375, -8.809326171875, -8.5069580078125, -8.20458984375, -7.9022216796875, -7.599853515625, -7.2974853515625, -6.9951171875, -6.6927490234375, -6.390380859375, -6.0880126953125, -5.78564453125, -5.4832763671875, -5.180908203125, -4.8785400390625, -4.576171875, -4.2738037109375, -3.971435546875, -3.6690673828125, -3.36669921875, -3.0643310546875, -2.761962890625, -2.4595947265625, -2.1572265625, -1.8548583984375, -1.552490234375, -1.2501220703125, -0.94775390625, -0.6453857421875, -0.343017578125, -0.0406494140625, 0.26171875, 0.5640869140625, 0.866455078125, 1.1688232421875, 1.47119140625, 1.7735595703125, 2.075927734375, 2.3782958984375, 2.6806640625, 2.9830322265625, 3.285400390625, 3.5877685546875, 3.89013671875, 4.1925048828125, 4.494873046875, 4.7972412109375, 5.099609375, 5.4019775390625, 5.704345703125, 6.0067138671875, 6.30908203125, 6.6114501953125, 6.913818359375, 7.2161865234375, 7.5185546875, 7.8209228515625, 8.123291015625, 8.4256591796875, 8.72802734375, 9.0303955078125, 9.332763671875, 9.6351318359375, 9.9375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 6.0, 5.0, 6.0, 12.0, 9.0, 21.0, 20.0, 18.0, 14.0, 24.0, 19.0, 32.0, 39.0, 48.0, 58.0, 60.0, 75.0, 104.0, 169.0, 1408.0, 243.0, 135.0, 87.0, 56.0, 44.0, 32.0, 31.0, 35.0, 43.0, 36.0, 25.0, 21.0, 27.0, 12.0, 18.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.176025390625, -16.61767578125, -16.059326171875, -15.5009765625, -14.942626953125, -14.38427734375, -13.825927734375, -13.267578125, -12.709228515625, -12.15087890625, -11.592529296875, -11.0341796875, -10.475830078125, -9.91748046875, -9.359130859375, -8.80078125, -8.242431640625, -7.68408203125, -7.125732421875, -6.5673828125, -6.009033203125, -5.45068359375, -4.892333984375, -4.333984375, -3.775634765625, -3.21728515625, -2.658935546875, -2.1005859375, -1.542236328125, -0.98388671875, -0.425537109375, 0.1328125, 0.691162109375, 1.24951171875, 1.807861328125, 2.3662109375, 2.924560546875, 3.48291015625, 4.041259765625, 4.599609375, 5.157958984375, 5.71630859375, 6.274658203125, 6.8330078125, 7.391357421875, 7.94970703125, 8.508056640625, 9.06640625, 9.624755859375, 10.18310546875, 10.741455078125, 11.2998046875, 11.858154296875, 12.41650390625, 12.974853515625, 13.533203125, 14.091552734375, 14.64990234375, 15.208251953125, 15.7666015625, 16.324951171875, 16.88330078125, 17.441650390625, 18.0]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 8.0, 7.0, 12.0, 9.0, 27.0, 23.0, 32.0, 50.0, 60.0, 113.0, 146.0, 188.0, 313.0, 577.0, 2160.0, 37812.0, 2831532.0, 262989.0, 7493.0, 955.0, 377.0, 239.0, 143.0, 97.0, 94.0, 70.0, 50.0, 27.0, 27.0, 19.0, 12.0, 10.0, 9.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.34765625, -32.2265625, -31.10546875, -29.984375, -28.86328125, -27.7421875, -26.62109375, -25.5, -24.37890625, -23.2578125, -22.13671875, -21.015625, -19.89453125, -18.7734375, -17.65234375, -16.53125, -15.41015625, -14.2890625, -13.16796875, -12.046875, -10.92578125, -9.8046875, -8.68359375, -7.5625, -6.44140625, -5.3203125, -4.19921875, -3.078125, -1.95703125, -0.8359375, 0.28515625, 1.40625, 2.52734375, 3.6484375, 4.76953125, 5.890625, 7.01171875, 8.1328125, 9.25390625, 10.375, 11.49609375, 12.6171875, 13.73828125, 14.859375, 15.98046875, 17.1015625, 18.22265625, 19.34375, 20.46484375, 21.5859375, 22.70703125, 23.828125, 24.94921875, 26.0703125, 27.19140625, 28.3125, 29.43359375, 30.5546875, 31.67578125, 32.796875, 33.91796875, 35.0390625, 36.16015625, 37.28125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 67.0, 820.0, 125.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.2432861328125, -338.2997131347656, -330.35614013671875, -322.4125671386719, -314.468994140625, -306.52545166015625, -298.58184814453125, -290.6383056640625, -282.6947326660156, -274.75115966796875, -266.8075866699219, -258.864013671875, -250.9204559326172, -242.9768829345703, -235.03330993652344, -227.08973693847656, -219.1461639404297, -211.2025909423828, -203.25901794433594, -195.31546020507812, -187.37188720703125, -179.42831420898438, -171.4847412109375, -163.54116821289062, -155.59759521484375, -147.65402221679688, -139.71044921875, -131.76687622070312, -123.82331848144531, -115.87974548339844, -107.93617248535156, -99.99259948730469, -92.04905700683594, -84.10548400878906, -76.16191864013672, -68.21834564208984, -60.274776458740234, -52.331207275390625, -44.38763427734375, -36.44406509399414, -28.50049591064453, -20.556926727294922, -12.61335563659668, -4.6697845458984375, 3.273784637451172, 11.217353820800781, 19.160926818847656, 27.104496002197266, 35.048065185546875, 42.991634368896484, 50.935203552246094, 58.87877655029297, 66.82234191894531, 74.76591491699219, 82.70948791503906, 90.65306091308594, 98.59662628173828, 106.54019927978516, 114.4837646484375, 122.42733764648438, 130.37091064453125, 138.31448364257812, 146.258056640625, 154.2016143798828, 162.1451873779297]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 6.0, 4.0, 4.0, 7.0, 5.0, 12.0, 13.0, 6.0, 18.0, 20.0, 23.0, 26.0, 20.0, 24.0, 26.0, 27.0, 37.0, 45.0, 41.0, 41.0, 40.0, 39.0, 33.0, 41.0, 48.0, 40.0, 50.0, 31.0, 33.0, 23.0, 26.0, 24.0, 23.0, 25.0, 24.0, 18.0, 12.0, 9.0, 13.0, 4.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-46.47265625, -45.122901916503906, -43.77314758300781, -42.42338943481445, -41.07363510131836, -39.723880767822266, -38.374122619628906, -37.02436828613281, -35.67461395263672, -34.324859619140625, -32.97510528564453, -31.625347137451172, -30.275592803955078, -28.925838470458984, -27.576082229614258, -26.22632598876953, -24.876571655273438, -23.526817321777344, -22.177061080932617, -20.82730484008789, -19.477550506591797, -18.127796173095703, -16.778039932250977, -15.428284645080566, -14.078529357910156, -12.728774070739746, -11.379018783569336, -10.029263496398926, -8.679508209228516, -7.3297529220581055, -5.979997634887695, -4.630242347717285, -3.280487060546875, -1.9307317733764648, -0.5809764862060547, 0.7687788009643555, 2.1185340881347656, 3.468289375305176, 4.818044662475586, 6.167799949645996, 7.517555236816406, 8.867310523986816, 10.217065811157227, 11.566821098327637, 12.916576385498047, 14.266331672668457, 15.616086959838867, 16.965843200683594, 18.315597534179688, 19.66535186767578, 21.015108108520508, 22.364864349365234, 23.714618682861328, 25.064373016357422, 26.41412925720215, 27.763885498046875, 29.11363983154297, 30.463394165039062, 31.81315040588379, 33.162906646728516, 34.51266098022461, 35.8624153137207, 37.21217346191406, 38.561927795410156, 39.91168212890625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 9.0, 4.0, 4.0, 10.0, 9.0, 5.0, 14.0, 21.0, 20.0, 17.0, 15.0, 21.0, 31.0, 18.0, 25.0, 32.0, 45.0, 44.0, 34.0, 25.0, 54.0, 37.0, 37.0, 29.0, 38.0, 22.0, 30.0, 40.0, 40.0, 27.0, 34.0, 32.0, 23.0, 17.0, 21.0, 16.0, 17.0, 9.0, 12.0, 8.0, 6.0, 10.0, 8.0, 6.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.421875, -6.21624755859375, -6.0106201171875, -5.80499267578125, -5.599365234375, -5.39373779296875, -5.1881103515625, -4.98248291015625, -4.77685546875, -4.57122802734375, -4.3656005859375, -4.15997314453125, -3.954345703125, -3.74871826171875, -3.5430908203125, -3.33746337890625, -3.1318359375, -2.92620849609375, -2.7205810546875, -2.51495361328125, -2.309326171875, -2.10369873046875, -1.8980712890625, -1.69244384765625, -1.48681640625, -1.28118896484375, -1.0755615234375, -0.86993408203125, -0.664306640625, -0.45867919921875, -0.2530517578125, -0.04742431640625, 0.158203125, 0.36383056640625, 0.5694580078125, 0.77508544921875, 0.980712890625, 1.18634033203125, 1.3919677734375, 1.59759521484375, 1.80322265625, 2.00885009765625, 2.2144775390625, 2.42010498046875, 2.625732421875, 2.83135986328125, 3.0369873046875, 3.24261474609375, 3.4482421875, 3.65386962890625, 3.8594970703125, 4.06512451171875, 4.270751953125, 4.47637939453125, 4.6820068359375, 4.88763427734375, 5.09326171875, 5.29888916015625, 5.5045166015625, 5.71014404296875, 5.915771484375, 6.12139892578125, 6.3270263671875, 6.53265380859375, 6.73828125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 14.0, 17.0, 17.0, 23.0, 43.0, 50.0, 61.0, 98.0, 144.0, 223.0, 342.0, 536.0, 4059.0, 4176062.0, 10884.0, 586.0, 339.0, 246.0, 144.0, 115.0, 68.0, 49.0, 39.0, 27.0, 21.0, 18.0, 16.0, 5.0, 11.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.0, -91.5556640625, -88.111328125, -84.6669921875, -81.22265625, -77.7783203125, -74.333984375, -70.8896484375, -67.4453125, -64.0009765625, -60.556640625, -57.1123046875, -53.66796875, -50.2236328125, -46.779296875, -43.3349609375, -39.890625, -36.4462890625, -33.001953125, -29.5576171875, -26.11328125, -22.6689453125, -19.224609375, -15.7802734375, -12.3359375, -8.8916015625, -5.447265625, -2.0029296875, 1.44140625, 4.8857421875, 8.330078125, 11.7744140625, 15.21875, 18.6630859375, 22.107421875, 25.5517578125, 28.99609375, 32.4404296875, 35.884765625, 39.3291015625, 42.7734375, 46.2177734375, 49.662109375, 53.1064453125, 56.55078125, 59.9951171875, 63.439453125, 66.8837890625, 70.328125, 73.7724609375, 77.216796875, 80.6611328125, 84.10546875, 87.5498046875, 90.994140625, 94.4384765625, 97.8828125, 101.3271484375, 104.771484375, 108.2158203125, 111.66015625, 115.1044921875, 118.548828125, 121.9931640625, 125.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 9.0, 3.0, 4.0, 6.0, 10.0, 7.0, 16.0, 21.0, 18.0, 27.0, 31.0, 31.0, 53.0, 57.0, 88.0, 132.0, 183.0, 266.0, 367.0, 554.0, 590.0, 515.0, 350.0, 205.0, 146.0, 107.0, 67.0, 46.0, 30.0, 32.0, 24.0, 22.0, 19.0, 8.0, 7.0, 11.0, 6.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.1038818359375, -9.770263671875, -9.4366455078125, -9.10302734375, -8.7694091796875, -8.435791015625, -8.1021728515625, -7.7685546875, -7.4349365234375, -7.101318359375, -6.7677001953125, -6.43408203125, -6.1004638671875, -5.766845703125, -5.4332275390625, -5.099609375, -4.7659912109375, -4.432373046875, -4.0987548828125, -3.76513671875, -3.4315185546875, -3.097900390625, -2.7642822265625, -2.4306640625, -2.0970458984375, -1.763427734375, -1.4298095703125, -1.09619140625, -0.7625732421875, -0.428955078125, -0.0953369140625, 0.23828125, 0.5718994140625, 0.905517578125, 1.2391357421875, 1.57275390625, 1.9063720703125, 2.239990234375, 2.5736083984375, 2.9072265625, 3.2408447265625, 3.574462890625, 3.9080810546875, 4.24169921875, 4.5753173828125, 4.908935546875, 5.2425537109375, 5.576171875, 5.9097900390625, 6.243408203125, 6.5770263671875, 6.91064453125, 7.2442626953125, 7.577880859375, 7.9114990234375, 8.2451171875, 8.5787353515625, 8.912353515625, 9.2459716796875, 9.57958984375, 9.9132080078125, 10.246826171875, 10.5804443359375, 10.9140625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 8.0, 5.0, 3.0, 8.0, 11.0, 12.0, 21.0, 19.0, 21.0, 32.0, 40.0, 50.0, 78.0, 120.0, 294.0, 984.0, 11419.0, 738924.0, 3410465.0, 29193.0, 1664.0, 389.0, 165.0, 97.0, 65.0, 34.0, 33.0, 25.0, 20.0, 18.0, 11.0, 7.0, 6.0, 14.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.40625, -41.04443359375, -39.6826171875, -38.32080078125, -36.958984375, -35.59716796875, -34.2353515625, -32.87353515625, -31.51171875, -30.14990234375, -28.7880859375, -27.42626953125, -26.064453125, -24.70263671875, -23.3408203125, -21.97900390625, -20.6171875, -19.25537109375, -17.8935546875, -16.53173828125, -15.169921875, -13.80810546875, -12.4462890625, -11.08447265625, -9.72265625, -8.36083984375, -6.9990234375, -5.63720703125, -4.275390625, -2.91357421875, -1.5517578125, -0.18994140625, 1.171875, 2.53369140625, 3.8955078125, 5.25732421875, 6.619140625, 7.98095703125, 9.3427734375, 10.70458984375, 12.06640625, 13.42822265625, 14.7900390625, 16.15185546875, 17.513671875, 18.87548828125, 20.2373046875, 21.59912109375, 22.9609375, 24.32275390625, 25.6845703125, 27.04638671875, 28.408203125, 29.77001953125, 31.1318359375, 32.49365234375, 33.85546875, 35.21728515625, 36.5791015625, 37.94091796875, 39.302734375, 40.66455078125, 42.0263671875, 43.38818359375, 44.75]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 10.0, 42.0, 84.0, 155.0, 195.0, 210.0, 152.0, 89.0, 47.0, 18.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.4842300415039, -68.35020446777344, -66.2161865234375, -64.08216094970703, -61.94813537597656, -59.81411361694336, -57.680091857910156, -55.54606628417969, -53.412044525146484, -51.27802276611328, -49.14399719238281, -47.00997543334961, -44.875953674316406, -42.74192810058594, -40.607906341552734, -38.47388458251953, -36.33985900878906, -34.20583724975586, -32.07181167602539, -29.937789916992188, -27.80376625061035, -25.669742584228516, -23.535720825195312, -21.401697158813477, -19.26767349243164, -17.133649826049805, -14.999627113342285, -12.865604400634766, -10.73158073425293, -8.597557067871094, -6.463534355163574, -4.329511642456055, -2.1954803466796875, -0.061457157135009766, 2.072566032409668, 4.206589221954346, 6.340612411499023, 8.47463607788086, 10.608658790588379, 12.742681503295898, 14.876705169677734, 17.01072883605957, 19.144752502441406, 21.27877426147461, 23.412797927856445, 25.54682159423828, 27.680843353271484, 29.81486701965332, 31.948890686035156, 34.08291244506836, 36.21693801879883, 38.35095977783203, 40.4849853515625, 42.6190071105957, 44.753028869628906, 46.887054443359375, 49.02107620239258, 51.15509796142578, 53.28912353515625, 55.42314529418945, 57.557167053222656, 59.691192626953125, 61.82521438598633, 63.95923614501953, 66.09326171875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 11.0, 8.0, 13.0, 15.0, 13.0, 24.0, 18.0, 21.0, 40.0, 27.0, 17.0, 43.0, 35.0, 43.0, 45.0, 38.0, 44.0, 49.0, 41.0, 42.0, 50.0, 42.0, 37.0, 33.0, 44.0, 32.0, 16.0, 24.0, 19.0, 18.0, 13.0, 18.0, 10.0, 16.0, 5.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.228668212890625, -33.13459014892578, -32.04050827026367, -30.946430206298828, -29.85235023498535, -28.758270263671875, -27.66419219970703, -26.570112228393555, -25.476032257080078, -24.3819522857666, -23.287872314453125, -22.19379425048828, -21.099714279174805, -20.005634307861328, -18.911556243896484, -17.817476272583008, -16.72339630126953, -15.629316329956055, -14.535237312316895, -13.441158294677734, -12.347078323364258, -11.252998352050781, -10.158919334411621, -9.064840316772461, -7.970760345458984, -6.876680850982666, -5.782601356506348, -4.688521862030029, -3.594442367553711, -2.5003628730773926, -1.4062833786010742, -0.31220388412475586, 0.7818756103515625, 1.8759551048278809, 2.970034599304199, 4.064114093780518, 5.158193588256836, 6.252273082733154, 7.346352577209473, 8.440431594848633, 9.53451156616211, 10.628591537475586, 11.722670555114746, 12.816749572753906, 13.910829544067383, 15.00490951538086, 16.098987579345703, 17.19306755065918, 18.287147521972656, 19.381227493286133, 20.47530746459961, 21.569385528564453, 22.66346549987793, 23.757545471191406, 24.85162353515625, 25.945703506469727, 27.039783477783203, 28.13386344909668, 29.227943420410156, 30.322021484375, 31.416101455688477, 32.51018142700195, 33.6042594909668, 34.698341369628906, 35.79241943359375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 5.0, 11.0, 14.0, 19.0, 17.0, 22.0, 15.0, 20.0, 28.0, 39.0, 30.0, 28.0, 47.0, 36.0, 36.0, 47.0, 40.0, 36.0, 45.0, 43.0, 32.0, 38.0, 40.0, 37.0, 24.0, 34.0, 30.0, 24.0, 26.0, 22.0, 20.0, 17.0, 16.0, 4.0, 13.0, 6.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.30706787109375, -6.0946044921875, -5.88214111328125, -5.669677734375, -5.45721435546875, -5.2447509765625, -5.03228759765625, -4.81982421875, -4.60736083984375, -4.3948974609375, -4.18243408203125, -3.969970703125, -3.75750732421875, -3.5450439453125, -3.33258056640625, -3.1201171875, -2.90765380859375, -2.6951904296875, -2.48272705078125, -2.270263671875, -2.05780029296875, -1.8453369140625, -1.63287353515625, -1.42041015625, -1.20794677734375, -0.9954833984375, -0.78302001953125, -0.570556640625, -0.35809326171875, -0.1456298828125, 0.06683349609375, 0.279296875, 0.49176025390625, 0.7042236328125, 0.91668701171875, 1.129150390625, 1.34161376953125, 1.5540771484375, 1.76654052734375, 1.97900390625, 2.19146728515625, 2.4039306640625, 2.61639404296875, 2.828857421875, 3.04132080078125, 3.2537841796875, 3.46624755859375, 3.6787109375, 3.89117431640625, 4.1036376953125, 4.31610107421875, 4.528564453125, 4.74102783203125, 4.9534912109375, 5.16595458984375, 5.37841796875, 5.59088134765625, 5.8033447265625, 6.01580810546875, 6.228271484375, 6.44073486328125, 6.6531982421875, 6.86566162109375, 7.078125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 5.0, 14.0, 21.0, 41.0, 50.0, 75.0, 113.0, 173.0, 240.0, 332.0, 484.0, 757.0, 1158.0, 1569.0, 2237.0, 3276.0, 4611.0, 6565.0, 9481.0, 13646.0, 19496.0, 27334.0, 38839.0, 54003.0, 73089.0, 96919.0, 118557.0, 127875.0, 114857.0, 91682.0, 69306.0, 50214.0, 36334.0, 25402.0, 18099.0, 12587.0, 8963.0, 6171.0, 4377.0, 2970.0, 2088.0, 1437.0, 959.0, 701.0, 465.0, 317.0, 228.0, 143.0, 101.0, 82.0, 47.0, 23.0, 19.0, 15.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.60986328125, -0.5904388427734375, -0.571014404296875, -0.5515899658203125, -0.53216552734375, -0.5127410888671875, -0.493316650390625, -0.4738922119140625, -0.4544677734375, -0.4350433349609375, -0.415618896484375, -0.3961944580078125, -0.37677001953125, -0.3573455810546875, -0.337921142578125, -0.3184967041015625, -0.299072265625, -0.2796478271484375, -0.260223388671875, -0.2407989501953125, -0.22137451171875, -0.2019500732421875, -0.182525634765625, -0.1631011962890625, -0.1436767578125, -0.1242523193359375, -0.104827880859375, -0.0854034423828125, -0.06597900390625, -0.0465545654296875, -0.027130126953125, -0.0077056884765625, 0.01171875, 0.0311431884765625, 0.050567626953125, 0.0699920654296875, 0.08941650390625, 0.1088409423828125, 0.128265380859375, 0.1476898193359375, 0.1671142578125, 0.1865386962890625, 0.205963134765625, 0.2253875732421875, 0.24481201171875, 0.2642364501953125, 0.283660888671875, 0.3030853271484375, 0.322509765625, 0.3419342041015625, 0.361358642578125, 0.3807830810546875, 0.40020751953125, 0.4196319580078125, 0.439056396484375, 0.4584808349609375, 0.4779052734375, 0.4973297119140625, 0.516754150390625, 0.5361785888671875, 0.55560302734375, 0.5750274658203125, 0.594451904296875, 0.6138763427734375, 0.63330078125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 9.0, 2.0, 4.0, 13.0, 7.0, 12.0, 8.0, 13.0, 22.0, 24.0, 22.0, 27.0, 28.0, 31.0, 32.0, 46.0, 37.0, 45.0, 44.0, 39.0, 35.0, 1070.0, 37.0, 37.0, 35.0, 43.0, 38.0, 30.0, 29.0, 28.0, 24.0, 20.0, 18.0, 20.0, 24.0, 16.0, 16.0, 12.0, 7.0, 2.0, 4.0, 4.0, 8.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.6343994140625, -4.491455078125, -4.3485107421875, -4.20556640625, -4.0626220703125, -3.919677734375, -3.7767333984375, -3.6337890625, -3.4908447265625, -3.347900390625, -3.2049560546875, -3.06201171875, -2.9190673828125, -2.776123046875, -2.6331787109375, -2.490234375, -2.3472900390625, -2.204345703125, -2.0614013671875, -1.91845703125, -1.7755126953125, -1.632568359375, -1.4896240234375, -1.3466796875, -1.2037353515625, -1.060791015625, -0.9178466796875, -0.77490234375, -0.6319580078125, -0.489013671875, -0.3460693359375, -0.203125, -0.0601806640625, 0.082763671875, 0.2257080078125, 0.36865234375, 0.5115966796875, 0.654541015625, 0.7974853515625, 0.9404296875, 1.0833740234375, 1.226318359375, 1.3692626953125, 1.51220703125, 1.6551513671875, 1.798095703125, 1.9410400390625, 2.083984375, 2.2269287109375, 2.369873046875, 2.5128173828125, 2.65576171875, 2.7987060546875, 2.941650390625, 3.0845947265625, 3.2275390625, 3.3704833984375, 3.513427734375, 3.6563720703125, 3.79931640625, 3.9422607421875, 4.085205078125, 4.2281494140625, 4.37109375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 16.0, 37.0, 45.0, 58.0, 109.0, 147.0, 198.0, 310.0, 487.0, 679.0, 1104.0, 1617.0, 2418.0, 3634.0, 5570.0, 8566.0, 13073.0, 20065.0, 30821.0, 46424.0, 68391.0, 99783.0, 132663.0, 1200410.0, 136932.0, 105310.0, 73314.0, 49589.0, 32985.0, 21612.0, 14081.0, 9098.0, 5959.0, 3811.0, 2646.0, 1653.0, 1137.0, 728.0, 548.0, 351.0, 233.0, 170.0, 91.0, 82.0, 51.0, 39.0, 31.0, 13.0, 8.0, 6.0, 7.0, 5.0, 1.0, 1.0], "bins": [-0.546875, -0.5305900573730469, -0.5143051147460938, -0.4980201721191406, -0.4817352294921875, -0.4654502868652344, -0.44916534423828125, -0.4328804016113281, -0.416595458984375, -0.4003105163574219, -0.38402557373046875, -0.3677406311035156, -0.3514556884765625, -0.3351707458496094, -0.31888580322265625, -0.3026008605957031, -0.28631591796875, -0.2700309753417969, -0.25374603271484375, -0.23746109008789062, -0.2211761474609375, -0.20489120483398438, -0.18860626220703125, -0.17232131958007812, -0.156036376953125, -0.13975143432617188, -0.12346649169921875, -0.10718154907226562, -0.0908966064453125, -0.07461166381835938, -0.05832672119140625, -0.042041778564453125, -0.0257568359375, -0.009471893310546875, 0.00681304931640625, 0.023097991943359375, 0.0393829345703125, 0.055667877197265625, 0.07195281982421875, 0.08823776245117188, 0.104522705078125, 0.12080764770507812, 0.13709259033203125, 0.15337753295898438, 0.1696624755859375, 0.18594741821289062, 0.20223236083984375, 0.21851730346679688, 0.23480224609375, 0.2510871887207031, 0.26737213134765625, 0.2836570739746094, 0.2999420166015625, 0.3162269592285156, 0.33251190185546875, 0.3487968444824219, 0.365081787109375, 0.3813667297363281, 0.39765167236328125, 0.4139366149902344, 0.4302215576171875, 0.4465065002441406, 0.46279144287109375, 0.4790763854980469, 0.495361328125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 9.0, 11.0, 13.0, 13.0, 27.0, 30.0, 29.0, 23.0, 47.0, 53.0, 54.0, 91.0, 76.0, 83.0, 77.0, 59.0, 49.0, 40.0, 45.0, 30.0, 24.0, 33.0, 17.0, 12.0, 13.0, 10.0, 5.0, 4.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007083892822265625, -0.006883978843688965, -0.006684064865112305, -0.0064841508865356445, -0.006284236907958984, -0.006084322929382324, -0.005884408950805664, -0.005684494972229004, -0.005484580993652344, -0.005284667015075684, -0.0050847530364990234, -0.004884839057922363, -0.004684925079345703, -0.004485011100769043, -0.004285097122192383, -0.004085183143615723, -0.0038852691650390625, -0.0036853551864624023, -0.003485441207885742, -0.003285527229309082, -0.003085613250732422, -0.0028856992721557617, -0.0026857852935791016, -0.0024858713150024414, -0.0022859573364257812, -0.002086043357849121, -0.001886129379272461, -0.0016862154006958008, -0.0014863014221191406, -0.0012863874435424805, -0.0010864734649658203, -0.0008865594863891602, -0.0006866455078125, -0.00048673152923583984, -0.0002868175506591797, -8.690357208251953e-05, 0.00011301040649414062, 0.0003129243850708008, 0.0005128383636474609, 0.0007127523422241211, 0.0009126663208007812, 0.0011125802993774414, 0.0013124942779541016, 0.0015124082565307617, 0.0017123222351074219, 0.001912236213684082, 0.002112150192260742, 0.0023120641708374023, 0.0025119781494140625, 0.0027118921279907227, 0.002911806106567383, 0.003111720085144043, 0.003311634063720703, 0.0035115480422973633, 0.0037114620208740234, 0.003911375999450684, 0.004111289978027344, 0.004311203956604004, 0.004511117935180664, 0.004711031913757324, 0.004910945892333984, 0.0051108598709106445, 0.005310773849487305, 0.005510687828063965, 0.005710601806640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 10.0, 8.0, 10.0, 11.0, 34.0, 32.0, 38.0, 65.0, 99.0, 129.0, 213.0, 434.0, 2883.0, 686213.0, 354988.0, 2338.0, 413.0, 201.0, 130.0, 83.0, 68.0, 49.0, 31.0, 20.0, 10.0, 9.0, 17.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1373291015625, -0.13258743286132812, -0.12784576416015625, -0.12310409545898438, -0.1183624267578125, -0.11362075805664062, -0.10887908935546875, -0.10413742065429688, -0.099395751953125, -0.09465408325195312, -0.08991241455078125, -0.08517074584960938, -0.0804290771484375, -0.07568740844726562, -0.07094573974609375, -0.06620407104492188, -0.06146240234375, -0.056720733642578125, -0.05197906494140625, -0.047237396240234375, -0.0424957275390625, -0.037754058837890625, -0.03301239013671875, -0.028270721435546875, -0.023529052734375, -0.018787384033203125, -0.01404571533203125, -0.009304046630859375, -0.0045623779296875, 0.000179290771484375, 0.00492095947265625, 0.009662628173828125, 0.014404296875, 0.019145965576171875, 0.02388763427734375, 0.028629302978515625, 0.0333709716796875, 0.038112640380859375, 0.04285430908203125, 0.047595977783203125, 0.052337646484375, 0.057079315185546875, 0.06182098388671875, 0.06656265258789062, 0.0713043212890625, 0.07604598999023438, 0.08078765869140625, 0.08552932739257812, 0.09027099609375, 0.09501266479492188, 0.09975433349609375, 0.10449600219726562, 0.1092376708984375, 0.11397933959960938, 0.11872100830078125, 0.12346267700195312, 0.128204345703125, 0.13294601440429688, 0.13768768310546875, 0.14242935180664062, 0.1471710205078125, 0.15191268920898438, 0.15665435791015625, 0.16139602661132812, 0.1661376953125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 77.0, 726.0, 191.0, 13.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11796111613512039, -0.11572128534317017, -0.11348145455121994, -0.11124162375926971, -0.10900179296731949, -0.10676196217536926, -0.10452213883399963, -0.10228230804204941, -0.10004247725009918, -0.09780264645814896, -0.09556281566619873, -0.0933229848742485, -0.09108315408229828, -0.08884333074092865, -0.08660349249839783, -0.0843636691570282, -0.08212383091449738, -0.07988400012254715, -0.07764416933059692, -0.0754043385386467, -0.07316450774669647, -0.07092468440532684, -0.06868484616279602, -0.06644502282142639, -0.06420519202947617, -0.06196536123752594, -0.059725530445575714, -0.05748569965362549, -0.05524587258696556, -0.053006041795015335, -0.05076621100306511, -0.04852638393640518, -0.04628654941916466, -0.04404671862721443, -0.041806887835264206, -0.03956706076860428, -0.03732722997665405, -0.03508739918470383, -0.0328475683927536, -0.030607739463448524, -0.0283679086714983, -0.026128077879548073, -0.023888248950242996, -0.02164841815829277, -0.019408587366342545, -0.017168758437037468, -0.014928927645087242, -0.012689098715782166, -0.01044926792383194, -0.008209438063204288, -0.00596960773691535, -0.0037297774106264114, -0.0014899475499987602, 0.000749882310628891, 0.002989713102579117, 0.005229542031884193, 0.007469372823834419, 0.00970920268446207, 0.011949032545089722, 0.014188863337039948, 0.016428694128990173, 0.01866852305829525, 0.020908353850245476, 0.023148182779550552, 0.025388013571500778]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 10.0, 7.0, 13.0, 7.0, 15.0, 21.0, 24.0, 29.0, 30.0, 32.0, 31.0, 39.0, 37.0, 35.0, 44.0, 42.0, 66.0, 48.0, 49.0, 35.0, 41.0, 52.0, 38.0, 47.0, 28.0, 29.0, 35.0, 19.0, 18.0, 14.0, 13.0, 11.0, 7.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003938257694244385, -0.0037847906351089478, -0.0036313235759735107, -0.0034778565168380737, -0.0033243894577026367, -0.0031709223985671997, -0.0030174553394317627, -0.0028639882802963257, -0.0027105212211608887, -0.0025570541620254517, -0.0024035871028900146, -0.0022501200437545776, -0.0020966529846191406, -0.0019431859254837036, -0.0017897188663482666, -0.0016362518072128296, -0.0014827847480773926, -0.0013293176889419556, -0.0011758506298065186, -0.0010223835706710815, -0.0008689165115356445, -0.0007154494524002075, -0.0005619823932647705, -0.0004085153341293335, -0.0002550482749938965, -0.00010158121585845947, 5.188584327697754e-05, 0.00020535290241241455, 0.00035881996154785156, 0.0005122870206832886, 0.0006657540798187256, 0.0008192211389541626, 0.0009726881980895996, 0.0011261552572250366, 0.0012796223163604736, 0.0014330893754959106, 0.0015865564346313477, 0.0017400234937667847, 0.0018934905529022217, 0.0020469576120376587, 0.0022004246711730957, 0.0023538917303085327, 0.0025073587894439697, 0.0026608258485794067, 0.0028142929077148438, 0.0029677599668502808, 0.0031212270259857178, 0.003274694085121155, 0.003428161144256592, 0.003581628203392029, 0.003735095262527466, 0.003888562321662903, 0.00404202938079834, 0.004195496439933777, 0.004348963499069214, 0.004502430558204651, 0.004655897617340088, 0.004809364676475525, 0.004962831735610962, 0.005116298794746399, 0.005269765853881836, 0.005423232913017273, 0.00557669997215271, 0.005730167031288147, 0.005883634090423584]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 5.0, 11.0, 14.0, 19.0, 17.0, 22.0, 15.0, 20.0, 28.0, 39.0, 30.0, 28.0, 47.0, 36.0, 36.0, 47.0, 40.0, 36.0, 45.0, 43.0, 32.0, 38.0, 40.0, 37.0, 24.0, 34.0, 29.0, 25.0, 25.0, 23.0, 20.0, 17.0, 16.0, 4.0, 13.0, 6.0, 8.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.30706787109375, -6.0946044921875, -5.88214111328125, -5.669677734375, -5.45721435546875, -5.2447509765625, -5.03228759765625, -4.81982421875, -4.60736083984375, -4.3948974609375, -4.18243408203125, -3.969970703125, -3.75750732421875, -3.5450439453125, -3.33258056640625, -3.1201171875, -2.90765380859375, -2.6951904296875, -2.48272705078125, -2.270263671875, -2.05780029296875, -1.8453369140625, -1.63287353515625, -1.42041015625, -1.20794677734375, -0.9954833984375, -0.78302001953125, -0.570556640625, -0.35809326171875, -0.1456298828125, 0.06683349609375, 0.279296875, 0.49176025390625, 0.7042236328125, 0.91668701171875, 1.129150390625, 1.34161376953125, 1.5540771484375, 1.76654052734375, 1.97900390625, 2.19146728515625, 2.4039306640625, 2.61639404296875, 2.828857421875, 3.04132080078125, 3.2537841796875, 3.46624755859375, 3.6787109375, 3.89117431640625, 4.1036376953125, 4.31610107421875, 4.528564453125, 4.74102783203125, 4.9534912109375, 5.16595458984375, 5.37841796875, 5.59088134765625, 5.8033447265625, 6.01580810546875, 6.228271484375, 6.44073486328125, 6.6531982421875, 6.86566162109375, 7.078125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 4.0, 8.0, 15.0, 20.0, 45.0, 41.0, 63.0, 88.0, 126.0, 158.0, 206.0, 301.0, 439.0, 584.0, 718.0, 1072.0, 2089.0, 4598.0, 14103.0, 50890.0, 217044.0, 509345.0, 181021.0, 43583.0, 12221.0, 4070.0, 1912.0, 1041.0, 727.0, 523.0, 429.0, 265.0, 212.0, 152.0, 134.0, 74.0, 63.0, 42.0, 37.0, 23.0, 16.0, 11.0, 10.0, 5.0, 11.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.40625, -11.04345703125, -10.6806640625, -10.31787109375, -9.955078125, -9.59228515625, -9.2294921875, -8.86669921875, -8.50390625, -8.14111328125, -7.7783203125, -7.41552734375, -7.052734375, -6.68994140625, -6.3271484375, -5.96435546875, -5.6015625, -5.23876953125, -4.8759765625, -4.51318359375, -4.150390625, -3.78759765625, -3.4248046875, -3.06201171875, -2.69921875, -2.33642578125, -1.9736328125, -1.61083984375, -1.248046875, -0.88525390625, -0.5224609375, -0.15966796875, 0.203125, 0.56591796875, 0.9287109375, 1.29150390625, 1.654296875, 2.01708984375, 2.3798828125, 2.74267578125, 3.10546875, 3.46826171875, 3.8310546875, 4.19384765625, 4.556640625, 4.91943359375, 5.2822265625, 5.64501953125, 6.0078125, 6.37060546875, 6.7333984375, 7.09619140625, 7.458984375, 7.82177734375, 8.1845703125, 8.54736328125, 8.91015625, 9.27294921875, 9.6357421875, 9.99853515625, 10.361328125, 10.72412109375, 11.0869140625, 11.44970703125, 11.8125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 10.0, 16.0, 14.0, 14.0, 14.0, 25.0, 23.0, 29.0, 36.0, 26.0, 46.0, 54.0, 67.0, 115.0, 164.0, 317.0, 1351.0, 180.0, 81.0, 73.0, 57.0, 59.0, 41.0, 38.0, 31.0, 28.0, 10.0, 14.0, 12.0, 17.0, 10.0, 7.0, 11.0, 8.0, 8.0, 5.0, 2.0, 7.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.453125, -16.925537109375, -16.39794921875, -15.870361328125, -15.3427734375, -14.815185546875, -14.28759765625, -13.760009765625, -13.232421875, -12.704833984375, -12.17724609375, -11.649658203125, -11.1220703125, -10.594482421875, -10.06689453125, -9.539306640625, -9.01171875, -8.484130859375, -7.95654296875, -7.428955078125, -6.9013671875, -6.373779296875, -5.84619140625, -5.318603515625, -4.791015625, -4.263427734375, -3.73583984375, -3.208251953125, -2.6806640625, -2.153076171875, -1.62548828125, -1.097900390625, -0.5703125, -0.042724609375, 0.48486328125, 1.012451171875, 1.5400390625, 2.067626953125, 2.59521484375, 3.122802734375, 3.650390625, 4.177978515625, 4.70556640625, 5.233154296875, 5.7607421875, 6.288330078125, 6.81591796875, 7.343505859375, 7.87109375, 8.398681640625, 8.92626953125, 9.453857421875, 9.9814453125, 10.509033203125, 11.03662109375, 11.564208984375, 12.091796875, 12.619384765625, 13.14697265625, 13.674560546875, 14.2021484375, 14.729736328125, 15.25732421875, 15.784912109375, 16.3125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 4.0, 5.0, 16.0, 18.0, 16.0, 21.0, 34.0, 30.0, 45.0, 51.0, 75.0, 135.0, 191.0, 348.0, 701.0, 1716.0, 66974.0, 3067677.0, 5143.0, 1093.0, 543.0, 282.0, 163.0, 111.0, 65.0, 49.0, 52.0, 28.0, 20.0, 15.0, 13.0, 14.0, 13.0, 5.0, 9.0, 6.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.5625, -48.8359375, -47.109375, -45.3828125, -43.65625, -41.9296875, -40.203125, -38.4765625, -36.75, -35.0234375, -33.296875, -31.5703125, -29.84375, -28.1171875, -26.390625, -24.6640625, -22.9375, -21.2109375, -19.484375, -17.7578125, -16.03125, -14.3046875, -12.578125, -10.8515625, -9.125, -7.3984375, -5.671875, -3.9453125, -2.21875, -0.4921875, 1.234375, 2.9609375, 4.6875, 6.4140625, 8.140625, 9.8671875, 11.59375, 13.3203125, 15.046875, 16.7734375, 18.5, 20.2265625, 21.953125, 23.6796875, 25.40625, 27.1328125, 28.859375, 30.5859375, 32.3125, 34.0390625, 35.765625, 37.4921875, 39.21875, 40.9453125, 42.671875, 44.3984375, 46.125, 47.8515625, 49.578125, 51.3046875, 53.03125, 54.7578125, 56.484375, 58.2109375, 59.9375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 806.0, 205.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.63294982910156, -186.7904052734375, -174.9478759765625, -163.1053466796875, -151.26280212402344, -139.42025756835938, -127.57772827148438, -115.73519134521484, -103.89265441894531, -92.05011749267578, -80.20758056640625, -68.36504364013672, -56.52250671386719, -44.679969787597656, -32.837432861328125, -20.994895935058594, -9.152359008789062, 2.6901779174804688, 14.53271484375, 26.37525177001953, 38.21778869628906, 50.060325622558594, 61.902862548828125, 73.74539947509766, 85.58793640136719, 97.43047332763672, 109.27301025390625, 121.11554718017578, 132.9580841064453, 144.80062866210938, 156.64315795898438, 168.48568725585938, 180.3282470703125, 192.1707763671875, 204.01332092285156, 215.85586547851562, 227.69839477539062, 239.54092407226562, 251.3834686279297, 263.22601318359375, 275.06854248046875, 286.91107177734375, 298.75360107421875, 310.5961608886719, 322.4386901855469, 334.2812194824219, 346.123779296875, 357.96630859375, 369.808837890625, 381.6513671875, 393.493896484375, 405.3364562988281, 417.1789855957031, 429.0215148925781, 440.86407470703125, 452.70660400390625, 464.54913330078125, 476.39166259765625, 488.23419189453125, 500.0767517089844, 511.9192810058594, 523.7618408203125, 535.6043701171875, 547.4468994140625, 559.2894287109375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 11.0, 14.0, 16.0, 11.0, 13.0, 16.0, 31.0, 30.0, 33.0, 26.0, 27.0, 33.0, 45.0, 34.0, 39.0, 46.0, 44.0, 48.0, 44.0, 34.0, 26.0, 45.0, 44.0, 35.0, 22.0, 33.0, 26.0, 19.0, 14.0, 16.0, 13.0, 18.0, 18.0, 9.0, 8.0, 10.0, 3.0, 8.0, 8.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0], "bins": [-57.44349670410156, -55.92447280883789, -54.40544891357422, -52.88642501831055, -51.367401123046875, -49.8483772277832, -48.32935333251953, -46.81032943725586, -45.29130554199219, -43.772281646728516, -42.253257751464844, -40.73423385620117, -39.2152099609375, -37.69618606567383, -36.177162170410156, -34.658138275146484, -33.13911437988281, -31.62009048461914, -30.10106658935547, -28.582042694091797, -27.063018798828125, -25.543994903564453, -24.02497100830078, -22.50594711303711, -20.986927032470703, -19.46790313720703, -17.94887924194336, -16.429855346679688, -14.910831451416016, -13.391807556152344, -11.872784614562988, -10.353760719299316, -8.834735870361328, -7.315711975097656, -5.796688079833984, -4.277664661407471, -2.758640766143799, -1.239616870880127, 0.2794065475463867, 1.7984304428100586, 3.3174543380737305, 4.836478233337402, 6.355502128601074, 7.874525547027588, 9.393548965454102, 10.912572860717773, 12.431596755981445, 13.950620651245117, 15.469644546508789, 16.98866844177246, 18.507692337036133, 20.026716232299805, 21.545740127563477, 23.06476402282715, 24.583786010742188, 26.10280990600586, 27.62183380126953, 29.140857696533203, 30.659881591796875, 32.17890548706055, 33.69792938232422, 35.21695327758789, 36.73597717285156, 38.255001068115234, 39.774024963378906]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 2.0, 5.0, 9.0, 10.0, 8.0, 14.0, 14.0, 17.0, 16.0, 22.0, 30.0, 31.0, 32.0, 35.0, 41.0, 35.0, 33.0, 46.0, 38.0, 36.0, 41.0, 56.0, 52.0, 41.0, 25.0, 35.0, 36.0, 48.0, 27.0, 25.0, 18.0, 22.0, 24.0, 19.0, 12.0, 10.0, 9.0, 2.0, 3.0, 10.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.2578125, -7.03167724609375, -6.8055419921875, -6.57940673828125, -6.353271484375, -6.12713623046875, -5.9010009765625, -5.67486572265625, -5.44873046875, -5.22259521484375, -4.9964599609375, -4.77032470703125, -4.544189453125, -4.31805419921875, -4.0919189453125, -3.86578369140625, -3.6396484375, -3.41351318359375, -3.1873779296875, -2.96124267578125, -2.735107421875, -2.50897216796875, -2.2828369140625, -2.05670166015625, -1.83056640625, -1.60443115234375, -1.3782958984375, -1.15216064453125, -0.926025390625, -0.69989013671875, -0.4737548828125, -0.24761962890625, -0.021484375, 0.20465087890625, 0.4307861328125, 0.65692138671875, 0.883056640625, 1.10919189453125, 1.3353271484375, 1.56146240234375, 1.78759765625, 2.01373291015625, 2.2398681640625, 2.46600341796875, 2.692138671875, 2.91827392578125, 3.1444091796875, 3.37054443359375, 3.5966796875, 3.82281494140625, 4.0489501953125, 4.27508544921875, 4.501220703125, 4.72735595703125, 4.9534912109375, 5.17962646484375, 5.40576171875, 5.63189697265625, 5.8580322265625, 6.08416748046875, 6.310302734375, 6.53643798828125, 6.7625732421875, 6.98870849609375, 7.21484375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 10.0, 5.0, 13.0, 24.0, 24.0, 27.0, 54.0, 55.0, 91.0, 96.0, 163.0, 243.0, 332.0, 454.0, 706.0, 1207.0, 2248.0, 4523.0, 10442.0, 31057.0, 139668.0, 777190.0, 2101557.0, 898736.0, 167409.0, 35448.0, 11401.0, 4919.0, 2441.0, 1308.0, 801.0, 465.0, 372.0, 220.0, 148.0, 119.0, 91.0, 52.0, 43.0, 34.0, 25.0, 23.0, 9.0, 6.0, 6.0, 7.0, 4.0, 3.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9447021484375, -9.608154296875, -9.2716064453125, -8.93505859375, -8.5985107421875, -8.261962890625, -7.9254150390625, -7.5888671875, -7.2523193359375, -6.915771484375, -6.5792236328125, -6.24267578125, -5.9061279296875, -5.569580078125, -5.2330322265625, -4.896484375, -4.5599365234375, -4.223388671875, -3.8868408203125, -3.55029296875, -3.2137451171875, -2.877197265625, -2.5406494140625, -2.2041015625, -1.8675537109375, -1.531005859375, -1.1944580078125, -0.85791015625, -0.5213623046875, -0.184814453125, 0.1517333984375, 0.48828125, 0.8248291015625, 1.161376953125, 1.4979248046875, 1.83447265625, 2.1710205078125, 2.507568359375, 2.8441162109375, 3.1806640625, 3.5172119140625, 3.853759765625, 4.1903076171875, 4.52685546875, 4.8634033203125, 5.199951171875, 5.5364990234375, 5.873046875, 6.2095947265625, 6.546142578125, 6.8826904296875, 7.21923828125, 7.5557861328125, 7.892333984375, 8.2288818359375, 8.5654296875, 8.9019775390625, 9.238525390625, 9.5750732421875, 9.91162109375, 10.2481689453125, 10.584716796875, 10.9212646484375, 11.2578125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 7.0, 11.0, 13.0, 15.0, 37.0, 40.0, 50.0, 78.0, 121.0, 173.0, 234.0, 336.0, 500.0, 661.0, 557.0, 372.0, 238.0, 177.0, 129.0, 79.0, 65.0, 47.0, 26.0, 27.0, 18.0, 13.0, 14.0, 5.0, 6.0, 6.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.4610595703125, -9.023681640625, -8.5863037109375, -8.14892578125, -7.7115478515625, -7.274169921875, -6.8367919921875, -6.3994140625, -5.9620361328125, -5.524658203125, -5.0872802734375, -4.64990234375, -4.2125244140625, -3.775146484375, -3.3377685546875, -2.900390625, -2.4630126953125, -2.025634765625, -1.5882568359375, -1.15087890625, -0.7135009765625, -0.276123046875, 0.1612548828125, 0.5986328125, 1.0360107421875, 1.473388671875, 1.9107666015625, 2.34814453125, 2.7855224609375, 3.222900390625, 3.6602783203125, 4.09765625, 4.5350341796875, 4.972412109375, 5.4097900390625, 5.84716796875, 6.2845458984375, 6.721923828125, 7.1593017578125, 7.5966796875, 8.0340576171875, 8.471435546875, 8.9088134765625, 9.34619140625, 9.7835693359375, 10.220947265625, 10.6583251953125, 11.095703125, 11.5330810546875, 11.970458984375, 12.4078369140625, 12.84521484375, 13.2825927734375, 13.719970703125, 14.1573486328125, 14.5947265625, 15.0321044921875, 15.469482421875, 15.9068603515625, 16.34423828125, 16.7816162109375, 17.218994140625, 17.6563720703125, 18.09375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 11.0, 3.0, 9.0, 14.0, 21.0, 28.0, 54.0, 85.0, 159.0, 272.0, 548.0, 1132.0, 3234.0, 16182.0, 205264.0, 3426076.0, 503685.0, 29891.0, 4699.0, 1533.0, 609.0, 346.0, 172.0, 98.0, 59.0, 45.0, 21.0, 13.0, 9.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.78125, -31.974609375, -31.16796875, -30.361328125, -29.5546875, -28.748046875, -27.94140625, -27.134765625, -26.328125, -25.521484375, -24.71484375, -23.908203125, -23.1015625, -22.294921875, -21.48828125, -20.681640625, -19.875, -19.068359375, -18.26171875, -17.455078125, -16.6484375, -15.841796875, -15.03515625, -14.228515625, -13.421875, -12.615234375, -11.80859375, -11.001953125, -10.1953125, -9.388671875, -8.58203125, -7.775390625, -6.96875, -6.162109375, -5.35546875, -4.548828125, -3.7421875, -2.935546875, -2.12890625, -1.322265625, -0.515625, 0.291015625, 1.09765625, 1.904296875, 2.7109375, 3.517578125, 4.32421875, 5.130859375, 5.9375, 6.744140625, 7.55078125, 8.357421875, 9.1640625, 9.970703125, 10.77734375, 11.583984375, 12.390625, 13.197265625, 14.00390625, 14.810546875, 15.6171875, 16.423828125, 17.23046875, 18.037109375, 18.84375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 989.0, 21.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-313.2666015625, -283.7605285644531, -254.2544708251953, -224.7484130859375, -195.24234008789062, -165.73626708984375, -136.23020935058594, -106.72415161132812, -77.21807861328125, -47.712013244628906, -18.205947875976562, 11.300117492675781, 40.806182861328125, 70.312255859375, 99.81831359863281, 129.32437133789062, 158.8304443359375, 188.33651733398438, 217.8425750732422, 247.3486328125, 276.8547058105469, 306.36077880859375, 335.8668212890625, 365.3728942871094, 394.87896728515625, 424.3850402832031, 453.89111328125, 483.39715576171875, 512.9031982421875, 542.4093017578125, 571.9153442382812, 601.42138671875, 630.927490234375, 660.4335327148438, 689.9396362304688, 719.4456787109375, 748.9517822265625, 778.4578247070312, 807.9638671875, 837.469970703125, 866.9760131835938, 896.4820556640625, 925.9881591796875, 955.4942016601562, 985.000244140625, 1014.50634765625, 1044.012451171875, 1073.5184326171875, 1103.0245361328125, 1132.5306396484375, 1162.03662109375, 1191.542724609375, 1221.048828125, 1250.554931640625, 1280.0609130859375, 1309.5670166015625, 1339.072998046875, 1368.5791015625, 1398.0850830078125, 1427.5911865234375, 1457.0972900390625, 1486.603271484375, 1516.109375, 1545.615478515625, 1575.12158203125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 11.0, 11.0, 21.0, 20.0, 30.0, 35.0, 56.0, 49.0, 47.0, 50.0, 73.0, 79.0, 75.0, 63.0, 67.0, 74.0, 68.0, 33.0, 28.0, 34.0, 24.0, 11.0, 15.0, 9.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-98.267578125, -95.94879913330078, -93.63002014160156, -91.31124114990234, -88.99246215820312, -86.67369079589844, -84.35491180419922, -82.0361328125, -79.71735382080078, -77.39857482910156, -75.07979583740234, -72.76101684570312, -70.44224548339844, -68.12346649169922, -65.8046875, -63.48590850830078, -61.16712951660156, -58.848350524902344, -56.529571533203125, -54.21079635620117, -51.89201736450195, -49.573238372802734, -47.25446319580078, -44.93568420410156, -42.616905212402344, -40.298126220703125, -37.979347229003906, -35.66057205200195, -33.341793060302734, -31.023014068603516, -28.70423698425293, -26.385459899902344, -24.066680908203125, -21.747901916503906, -19.42912483215332, -17.110347747802734, -14.791568756103516, -12.472790718078613, -10.154012680053711, -7.835235595703125, -5.516456604003906, -3.197678565979004, -0.8789005279541016, 1.4398775100708008, 3.758655548095703, 6.0774335861206055, 8.396211624145508, 10.714988708496094, 13.033767700195312, 15.352545738220215, 17.671323776245117, 19.990100860595703, 22.308879852294922, 24.62765884399414, 26.946435928344727, 29.265213012695312, 31.58399200439453, 33.90277099609375, 36.22154998779297, 38.54032516479492, 40.85910415649414, 43.17788314819336, 45.49665832519531, 47.81543731689453, 50.13421630859375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 3.0, 10.0, 10.0, 11.0, 12.0, 16.0, 23.0, 25.0, 25.0, 29.0, 22.0, 27.0, 25.0, 41.0, 41.0, 39.0, 41.0, 39.0, 42.0, 47.0, 47.0, 25.0, 46.0, 43.0, 35.0, 22.0, 32.0, 23.0, 21.0, 23.0, 27.0, 14.0, 14.0, 21.0, 18.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.59765625, -5.422119140625, -5.24658203125, -5.071044921875, -4.8955078125, -4.719970703125, -4.54443359375, -4.368896484375, -4.193359375, -4.017822265625, -3.84228515625, -3.666748046875, -3.4912109375, -3.315673828125, -3.14013671875, -2.964599609375, -2.7890625, -2.613525390625, -2.43798828125, -2.262451171875, -2.0869140625, -1.911376953125, -1.73583984375, -1.560302734375, -1.384765625, -1.209228515625, -1.03369140625, -0.858154296875, -0.6826171875, -0.507080078125, -0.33154296875, -0.156005859375, 0.01953125, 0.195068359375, 0.37060546875, 0.546142578125, 0.7216796875, 0.897216796875, 1.07275390625, 1.248291015625, 1.423828125, 1.599365234375, 1.77490234375, 1.950439453125, 2.1259765625, 2.301513671875, 2.47705078125, 2.652587890625, 2.828125, 3.003662109375, 3.17919921875, 3.354736328125, 3.5302734375, 3.705810546875, 3.88134765625, 4.056884765625, 4.232421875, 4.407958984375, 4.58349609375, 4.759033203125, 4.9345703125, 5.110107421875, 5.28564453125, 5.461181640625, 5.63671875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 14.0, 14.0, 16.0, 25.0, 61.0, 79.0, 135.0, 196.0, 270.0, 467.0, 688.0, 1125.0, 1614.0, 2533.0, 4008.0, 6151.0, 9783.0, 15256.0, 23858.0, 37393.0, 58323.0, 87052.0, 124328.0, 156624.0, 155137.0, 121467.0, 85019.0, 56355.0, 36262.0, 23040.0, 14870.0, 9622.0, 6069.0, 3774.0, 2533.0, 1559.0, 1017.0, 614.0, 401.0, 264.0, 185.0, 117.0, 82.0, 47.0, 35.0, 16.0, 15.0, 18.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.65380859375, -0.6333541870117188, -0.6128997802734375, -0.5924453735351562, -0.571990966796875, -0.5515365600585938, -0.5310821533203125, -0.5106277465820312, -0.49017333984375, -0.46971893310546875, -0.4492645263671875, -0.42881011962890625, -0.408355712890625, -0.38790130615234375, -0.3674468994140625, -0.34699249267578125, -0.3265380859375, -0.30608367919921875, -0.2856292724609375, -0.26517486572265625, -0.244720458984375, -0.22426605224609375, -0.2038116455078125, -0.18335723876953125, -0.16290283203125, -0.14244842529296875, -0.1219940185546875, -0.10153961181640625, -0.081085205078125, -0.06063079833984375, -0.0401763916015625, -0.01972198486328125, 0.000732421875, 0.02118682861328125, 0.0416412353515625, 0.06209564208984375, 0.082550048828125, 0.10300445556640625, 0.1234588623046875, 0.14391326904296875, 0.16436767578125, 0.18482208251953125, 0.2052764892578125, 0.22573089599609375, 0.246185302734375, 0.26663970947265625, 0.2870941162109375, 0.30754852294921875, 0.3280029296875, 0.34845733642578125, 0.3689117431640625, 0.38936614990234375, 0.409820556640625, 0.43027496337890625, 0.4507293701171875, 0.47118377685546875, 0.49163818359375, 0.5120925903320312, 0.5325469970703125, 0.5530014038085938, 0.573455810546875, 0.5939102172851562, 0.6143646240234375, 0.6348190307617188, 0.6552734375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 9.0, 8.0, 7.0, 8.0, 14.0, 12.0, 6.0, 17.0, 18.0, 19.0, 23.0, 20.0, 25.0, 24.0, 28.0, 33.0, 20.0, 23.0, 42.0, 33.0, 21.0, 43.0, 1058.0, 26.0, 36.0, 36.0, 32.0, 31.0, 42.0, 31.0, 27.0, 30.0, 26.0, 20.0, 24.0, 17.0, 11.0, 19.0, 21.0, 10.0, 15.0, 5.0, 7.0, 6.0, 5.0, 8.0, 4.0, 6.0, 4.0, 1.0, 5.0, 3.0, 2.0, 4.0], "bins": [-3.357421875, -3.25341796875, -3.1494140625, -3.04541015625, -2.94140625, -2.83740234375, -2.7333984375, -2.62939453125, -2.525390625, -2.42138671875, -2.3173828125, -2.21337890625, -2.109375, -2.00537109375, -1.9013671875, -1.79736328125, -1.693359375, -1.58935546875, -1.4853515625, -1.38134765625, -1.27734375, -1.17333984375, -1.0693359375, -0.96533203125, -0.861328125, -0.75732421875, -0.6533203125, -0.54931640625, -0.4453125, -0.34130859375, -0.2373046875, -0.13330078125, -0.029296875, 0.07470703125, 0.1787109375, 0.28271484375, 0.38671875, 0.49072265625, 0.5947265625, 0.69873046875, 0.802734375, 0.90673828125, 1.0107421875, 1.11474609375, 1.21875, 1.32275390625, 1.4267578125, 1.53076171875, 1.634765625, 1.73876953125, 1.8427734375, 1.94677734375, 2.05078125, 2.15478515625, 2.2587890625, 2.36279296875, 2.466796875, 2.57080078125, 2.6748046875, 2.77880859375, 2.8828125, 2.98681640625, 3.0908203125, 3.19482421875, 3.298828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 9.0, 12.0, 14.0, 28.0, 43.0, 59.0, 95.0, 151.0, 187.0, 304.0, 503.0, 674.0, 958.0, 1479.0, 2263.0, 3696.0, 5343.0, 7960.0, 12093.0, 18499.0, 27463.0, 41440.0, 60522.0, 86710.0, 117394.0, 1046470.0, 284904.0, 114626.0, 84281.0, 58881.0, 40259.0, 27006.0, 17855.0, 11845.0, 7836.0, 5101.0, 3409.0, 2209.0, 1508.0, 947.0, 712.0, 466.0, 301.0, 205.0, 140.0, 99.0, 55.0, 46.0, 28.0, 20.0, 15.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.422119140625, -0.40848541259765625, -0.3948516845703125, -0.38121795654296875, -0.367584228515625, -0.35395050048828125, -0.3403167724609375, -0.32668304443359375, -0.31304931640625, -0.29941558837890625, -0.2857818603515625, -0.27214813232421875, -0.258514404296875, -0.24488067626953125, -0.2312469482421875, -0.21761322021484375, -0.2039794921875, -0.19034576416015625, -0.1767120361328125, -0.16307830810546875, -0.149444580078125, -0.13581085205078125, -0.1221771240234375, -0.10854339599609375, -0.09490966796875, -0.08127593994140625, -0.0676422119140625, -0.05400848388671875, -0.040374755859375, -0.02674102783203125, -0.0131072998046875, 0.00052642822265625, 0.01416015625, 0.02779388427734375, 0.0414276123046875, 0.05506134033203125, 0.068695068359375, 0.08232879638671875, 0.0959625244140625, 0.10959625244140625, 0.12322998046875, 0.13686370849609375, 0.1504974365234375, 0.16413116455078125, 0.177764892578125, 0.19139862060546875, 0.2050323486328125, 0.21866607666015625, 0.2322998046875, 0.24593353271484375, 0.2595672607421875, 0.27320098876953125, 0.286834716796875, 0.30046844482421875, 0.3141021728515625, 0.32773590087890625, 0.34136962890625, 0.35500335693359375, 0.3686370849609375, 0.38227081298828125, 0.395904541015625, 0.40953826904296875, 0.4231719970703125, 0.43680572509765625, 0.450439453125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 18.0, 7.0, 23.0, 20.0, 36.0, 40.0, 32.0, 37.0, 60.0, 86.0, 114.0, 123.0, 80.0, 71.0, 31.0, 34.0, 33.0, 26.0, 18.0, 22.0, 12.0, 8.0, 12.0, 9.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00908660888671875, -0.00879359245300293, -0.00850057601928711, -0.008207559585571289, -0.007914543151855469, -0.0076215267181396484, -0.007328510284423828, -0.007035493850708008, -0.0067424774169921875, -0.006449460983276367, -0.006156444549560547, -0.0058634281158447266, -0.005570411682128906, -0.005277395248413086, -0.004984378814697266, -0.004691362380981445, -0.004398345947265625, -0.004105329513549805, -0.0038123130798339844, -0.003519296646118164, -0.0032262802124023438, -0.0029332637786865234, -0.002640247344970703, -0.002347230911254883, -0.0020542144775390625, -0.0017611980438232422, -0.0014681816101074219, -0.0011751651763916016, -0.0008821487426757812, -0.0005891323089599609, -0.0002961158752441406, -3.0994415283203125e-06, 0.0002899169921875, 0.0005829334259033203, 0.0008759498596191406, 0.001168966293334961, 0.0014619827270507812, 0.0017549991607666016, 0.002048015594482422, 0.002341032028198242, 0.0026340484619140625, 0.002927064895629883, 0.003220081329345703, 0.0035130977630615234, 0.0038061141967773438, 0.004099130630493164, 0.004392147064208984, 0.004685163497924805, 0.004978179931640625, 0.005271196365356445, 0.005564212799072266, 0.005857229232788086, 0.006150245666503906, 0.0064432621002197266, 0.006736278533935547, 0.007029294967651367, 0.0073223114013671875, 0.007615327835083008, 0.007908344268798828, 0.008201360702514648, 0.008494377136230469, 0.008787393569946289, 0.00908041000366211, 0.00937342643737793, 0.00966644287109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 7.0, 10.0, 10.0, 20.0, 16.0, 25.0, 38.0, 36.0, 58.0, 82.0, 116.0, 196.0, 357.0, 1054.0, 106746.0, 936662.0, 1954.0, 430.0, 232.0, 131.0, 103.0, 65.0, 45.0, 37.0, 25.0, 19.0, 21.0, 10.0, 6.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1881103515625, -0.1822528839111328, -0.17639541625976562, -0.17053794860839844, -0.16468048095703125, -0.15882301330566406, -0.15296554565429688, -0.1471080780029297, -0.1412506103515625, -0.1353931427001953, -0.12953567504882812, -0.12367820739746094, -0.11782073974609375, -0.11196327209472656, -0.10610580444335938, -0.10024833679199219, -0.094390869140625, -0.08853340148925781, -0.08267593383789062, -0.07681846618652344, -0.07096099853515625, -0.06510353088378906, -0.059246063232421875, -0.05338859558105469, -0.0475311279296875, -0.04167366027832031, -0.035816192626953125, -0.029958724975585938, -0.02410125732421875, -0.018243789672851562, -0.012386322021484375, -0.0065288543701171875, -0.00067138671875, 0.0051860809326171875, 0.011043548583984375, 0.016901016235351562, 0.02275848388671875, 0.028615951538085938, 0.034473419189453125, 0.04033088684082031, 0.0461883544921875, 0.05204582214355469, 0.057903289794921875, 0.06376075744628906, 0.06961822509765625, 0.07547569274902344, 0.08133316040039062, 0.08719062805175781, 0.093048095703125, 0.09890556335449219, 0.10476303100585938, 0.11062049865722656, 0.11647796630859375, 0.12233543395996094, 0.12819290161132812, 0.1340503692626953, 0.1399078369140625, 0.1457653045654297, 0.15162277221679688, 0.15748023986816406, 0.16333770751953125, 0.16919517517089844, 0.17505264282226562, 0.1809101104736328, 0.186767578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 93.0, 917.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.26087403297424316, -0.25647279620170593, -0.2520715892314911, -0.24767036736011505, -0.243269145488739, -0.23886792361736298, -0.23446670174598694, -0.2300654798746109, -0.22566425800323486, -0.22126303613185883, -0.2168618142604828, -0.21246059238910675, -0.2080593705177307, -0.20365814864635468, -0.19925692677497864, -0.1948557049036026, -0.19045448303222656, -0.18605326116085052, -0.1816520392894745, -0.17725081741809845, -0.1728495955467224, -0.16844837367534637, -0.16404715180397034, -0.1596459299325943, -0.15524469316005707, -0.15084347128868103, -0.146442249417305, -0.14204102754592896, -0.13763980567455292, -0.13323858380317688, -0.12883736193180084, -0.1244361400604248, -0.12003491818904877, -0.11563369631767273, -0.11123247444629669, -0.10683125257492065, -0.10243003070354462, -0.09802880883216858, -0.09362758696079254, -0.0892263650894165, -0.08482514321804047, -0.08042392134666443, -0.07602269947528839, -0.07162147760391235, -0.06722025573253632, -0.06281903386116028, -0.05841780826449394, -0.054016586393117905, -0.04961536452174187, -0.04521414265036583, -0.04081292077898979, -0.036411695182323456, -0.03201047331094742, -0.02760925330221653, -0.023208029568195343, -0.018806807696819305, -0.014405585825443268, -0.01000436395406723, -0.005603141151368618, -0.0012019183486700058, 0.003199303522706032, 0.007600525394082069, 0.012001749128103256, 0.016402970999479294, 0.02080419287085533]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 13.0, 17.0, 16.0, 23.0, 18.0, 35.0, 43.0, 47.0, 48.0, 50.0, 43.0, 50.0, 64.0, 52.0, 66.0, 51.0, 47.0, 59.0, 44.0, 40.0, 41.0, 28.0, 23.0, 26.0, 18.0, 8.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010998427867889404, -0.010624618269503117, -0.010250808671116829, -0.009876999072730541, -0.009503189474344254, -0.009129379875957966, -0.008755570277571678, -0.00838176067918539, -0.008007951080799103, -0.007634141482412815, -0.007260331884026527, -0.00688652228564024, -0.006512712687253952, -0.006138903088867664, -0.005765093490481377, -0.005391283892095089, -0.005017474293708801, -0.004643664695322514, -0.004269855096936226, -0.003896045498549938, -0.0035222359001636505, -0.003148426301777363, -0.002774616703391075, -0.0024008071050047874, -0.0020269975066184998, -0.001653187908232212, -0.0012793783098459244, -0.0009055687114596367, -0.000531759113073349, -0.0001579495146870613, 0.00021586008369922638, 0.0005896696820855141, 0.0009634792804718018, 0.0013372888788580894, 0.0017110984772443771, 0.002084908075630665, 0.0024587176740169525, 0.00283252727240324, 0.003206336870789528, 0.0035801464691758156, 0.003953956067562103, 0.004327765665948391, 0.004701575264334679, 0.005075384862720966, 0.005449194461107254, 0.005823004059493542, 0.006196813657879829, 0.006570623256266117, 0.006944432854652405, 0.0073182424530386925, 0.00769205205142498, 0.008065861649811268, 0.008439671248197556, 0.008813480846583843, 0.009187290444970131, 0.009561100043356419, 0.009934909641742706, 0.010308719240128994, 0.010682528838515282, 0.01105633843690157, 0.011430148035287857, 0.011803957633674145, 0.012177767232060432, 0.01255157683044672, 0.012925386428833008]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 6.0, 3.0, 10.0, 10.0, 11.0, 13.0, 15.0, 23.0, 25.0, 25.0, 29.0, 22.0, 27.0, 25.0, 41.0, 41.0, 39.0, 41.0, 39.0, 40.0, 49.0, 47.0, 26.0, 45.0, 43.0, 35.0, 22.0, 32.0, 23.0, 21.0, 23.0, 27.0, 14.0, 15.0, 20.0, 18.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.59765625, -5.422119140625, -5.24658203125, -5.071044921875, -4.8955078125, -4.719970703125, -4.54443359375, -4.368896484375, -4.193359375, -4.017822265625, -3.84228515625, -3.666748046875, -3.4912109375, -3.315673828125, -3.14013671875, -2.964599609375, -2.7890625, -2.613525390625, -2.43798828125, -2.262451171875, -2.0869140625, -1.911376953125, -1.73583984375, -1.560302734375, -1.384765625, -1.209228515625, -1.03369140625, -0.858154296875, -0.6826171875, -0.507080078125, -0.33154296875, -0.156005859375, 0.01953125, 0.195068359375, 0.37060546875, 0.546142578125, 0.7216796875, 0.897216796875, 1.07275390625, 1.248291015625, 1.423828125, 1.599365234375, 1.77490234375, 1.950439453125, 2.1259765625, 2.301513671875, 2.47705078125, 2.652587890625, 2.828125, 3.003662109375, 3.17919921875, 3.354736328125, 3.5302734375, 3.705810546875, 3.88134765625, 4.056884765625, 4.232421875, 4.407958984375, 4.58349609375, 4.759033203125, 4.9345703125, 5.110107421875, 5.28564453125, 5.461181640625, 5.63671875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 7.0, 4.0, 9.0, 7.0, 19.0, 27.0, 27.0, 42.0, 56.0, 68.0, 99.0, 143.0, 197.0, 308.0, 429.0, 594.0, 860.0, 1347.0, 2199.0, 4281.0, 13781.0, 102348.0, 712536.0, 177119.0, 19519.0, 5352.0, 2488.0, 1497.0, 1049.0, 632.0, 422.0, 341.0, 183.0, 153.0, 111.0, 78.0, 65.0, 40.0, 26.0, 22.0, 17.0, 16.0, 10.0, 11.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.921875, -14.4498291015625, -13.977783203125, -13.5057373046875, -13.03369140625, -12.5616455078125, -12.089599609375, -11.6175537109375, -11.1455078125, -10.6734619140625, -10.201416015625, -9.7293701171875, -9.25732421875, -8.7852783203125, -8.313232421875, -7.8411865234375, -7.369140625, -6.8970947265625, -6.425048828125, -5.9530029296875, -5.48095703125, -5.0089111328125, -4.536865234375, -4.0648193359375, -3.5927734375, -3.1207275390625, -2.648681640625, -2.1766357421875, -1.70458984375, -1.2325439453125, -0.760498046875, -0.2884521484375, 0.18359375, 0.6556396484375, 1.127685546875, 1.5997314453125, 2.07177734375, 2.5438232421875, 3.015869140625, 3.4879150390625, 3.9599609375, 4.4320068359375, 4.904052734375, 5.3760986328125, 5.84814453125, 6.3201904296875, 6.792236328125, 7.2642822265625, 7.736328125, 8.2083740234375, 8.680419921875, 9.1524658203125, 9.62451171875, 10.0965576171875, 10.568603515625, 11.0406494140625, 11.5126953125, 11.9847412109375, 12.456787109375, 12.9288330078125, 13.40087890625, 13.8729248046875, 14.344970703125, 14.8170166015625, 15.2890625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 7.0, 4.0, 10.0, 12.0, 7.0, 14.0, 11.0, 20.0, 24.0, 29.0, 34.0, 39.0, 53.0, 71.0, 63.0, 126.0, 293.0, 1567.0, 205.0, 106.0, 61.0, 58.0, 46.0, 31.0, 39.0, 31.0, 17.0, 14.0, 19.0, 11.0, 7.0, 5.0, 9.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.091796875, -15.48046875, -14.869140625, -14.2578125, -13.646484375, -13.03515625, -12.423828125, -11.8125, -11.201171875, -10.58984375, -9.978515625, -9.3671875, -8.755859375, -8.14453125, -7.533203125, -6.921875, -6.310546875, -5.69921875, -5.087890625, -4.4765625, -3.865234375, -3.25390625, -2.642578125, -2.03125, -1.419921875, -0.80859375, -0.197265625, 0.4140625, 1.025390625, 1.63671875, 2.248046875, 2.859375, 3.470703125, 4.08203125, 4.693359375, 5.3046875, 5.916015625, 6.52734375, 7.138671875, 7.75, 8.361328125, 8.97265625, 9.583984375, 10.1953125, 10.806640625, 11.41796875, 12.029296875, 12.640625, 13.251953125, 13.86328125, 14.474609375, 15.0859375, 15.697265625, 16.30859375, 16.919921875, 17.53125, 18.142578125, 18.75390625, 19.365234375, 19.9765625, 20.587890625, 21.19921875, 21.810546875, 22.421875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 4.0, 3.0, 6.0, 9.0, 14.0, 10.0, 17.0, 18.0, 28.0, 44.0, 55.0, 67.0, 107.0, 160.0, 261.0, 502.0, 1154.0, 7132.0, 3117592.0, 15730.0, 1339.0, 527.0, 299.0, 162.0, 121.0, 99.0, 62.0, 39.0, 37.0, 16.0, 18.0, 11.0, 10.0, 15.0, 9.0, 6.0, 3.0, 0.0, 1.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-53.46875, -51.9658203125, -50.462890625, -48.9599609375, -47.45703125, -45.9541015625, -44.451171875, -42.9482421875, -41.4453125, -39.9423828125, -38.439453125, -36.9365234375, -35.43359375, -33.9306640625, -32.427734375, -30.9248046875, -29.421875, -27.9189453125, -26.416015625, -24.9130859375, -23.41015625, -21.9072265625, -20.404296875, -18.9013671875, -17.3984375, -15.8955078125, -14.392578125, -12.8896484375, -11.38671875, -9.8837890625, -8.380859375, -6.8779296875, -5.375, -3.8720703125, -2.369140625, -0.8662109375, 0.63671875, 2.1396484375, 3.642578125, 5.1455078125, 6.6484375, 8.1513671875, 9.654296875, 11.1572265625, 12.66015625, 14.1630859375, 15.666015625, 17.1689453125, 18.671875, 20.1748046875, 21.677734375, 23.1806640625, 24.68359375, 26.1865234375, 27.689453125, 29.1923828125, 30.6953125, 32.1982421875, 33.701171875, 35.2041015625, 36.70703125, 38.2099609375, 39.712890625, 41.2158203125, 42.71875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [3.0, 25.0, 86.0, 278.0, 379.0, 196.0, 38.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.490334510803223, -10.339606285095215, -7.188878536224365, -4.038150787353516, -0.8874225616455078, 2.2633056640625, 5.414032936096191, 8.5647611618042, 11.715489387512207, 14.866217613220215, 18.016944885253906, 21.167673110961914, 24.318401336669922, 27.46912956237793, 30.619857788085938, 33.77058410644531, 36.92131423950195, 40.07204055786133, 43.22277069091797, 46.373497009277344, 49.524227142333984, 52.67495346069336, 55.82568359375, 58.976409912109375, 62.12713623046875, 65.27786254882812, 68.4285888671875, 71.5793228149414, 74.73004913330078, 77.88077545166016, 81.03150177001953, 84.18223571777344, 87.33295440673828, 90.48368072509766, 93.63440704345703, 96.78514099121094, 99.93586730957031, 103.08659362792969, 106.23731994628906, 109.38804626464844, 112.53878021240234, 115.68950653076172, 118.8402328491211, 121.990966796875, 125.14169311523438, 128.29241943359375, 131.44314575195312, 134.5938720703125, 137.74459838867188, 140.89532470703125, 144.04605102539062, 147.19677734375, 150.34750366210938, 153.4982452392578, 156.6489715576172, 159.79969787597656, 162.95042419433594, 166.1011505126953, 169.2518768310547, 172.40260314941406, 175.55332946777344, 178.70407104492188, 181.85479736328125, 185.00552368164062, 188.15625]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 16.0, 13.0, 12.0, 20.0, 21.0, 21.0, 25.0, 23.0, 29.0, 35.0, 35.0, 33.0, 45.0, 46.0, 51.0, 44.0, 53.0, 43.0, 49.0, 44.0, 35.0, 41.0, 40.0, 36.0, 25.0, 24.0, 28.0, 23.0, 18.0, 11.0, 10.0, 5.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.455413818359375, -42.0845947265625, -40.713775634765625, -39.342960357666016, -37.97214126586914, -36.601322174072266, -35.230506896972656, -33.85968780517578, -32.488868713378906, -31.11804962158203, -29.74723243713379, -28.376415252685547, -27.005596160888672, -25.634777069091797, -24.263959884643555, -22.893142700195312, -21.522323608398438, -20.151504516601562, -18.78068733215332, -17.409870147705078, -16.039051055908203, -14.668232917785645, -13.297414779663086, -11.926596641540527, -10.555778503417969, -9.18496036529541, -7.814142227172852, -6.443324089050293, -5.072505950927734, -3.701687812805176, -2.330869674682617, -0.9600515365600586, 0.4107666015625, 1.7815847396850586, 3.152402877807617, 4.523221015930176, 5.894039154052734, 7.264857292175293, 8.635675430297852, 10.00649356842041, 11.377311706542969, 12.748129844665527, 14.118947982788086, 15.489766120910645, 16.860584259033203, 18.231403350830078, 19.60222053527832, 20.973037719726562, 22.343856811523438, 23.714675903320312, 25.085493087768555, 26.456310272216797, 27.827129364013672, 29.197948455810547, 30.56876564025879, 31.93958282470703, 33.310401916503906, 34.68122100830078, 36.052040100097656, 37.422855377197266, 38.79367446899414, 40.164493560791016, 41.535308837890625, 42.9061279296875, 44.276947021484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 2.0, 6.0, 8.0, 6.0, 11.0, 13.0, 6.0, 15.0, 20.0, 19.0, 23.0, 16.0, 25.0, 26.0, 27.0, 38.0, 38.0, 33.0, 42.0, 37.0, 31.0, 38.0, 46.0, 48.0, 33.0, 36.0, 34.0, 46.0, 36.0, 26.0, 34.0, 23.0, 24.0, 10.0, 24.0, 14.0, 16.0, 13.0, 7.0, 11.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-5.87890625, -5.70050048828125, -5.5220947265625, -5.34368896484375, -5.165283203125, -4.98687744140625, -4.8084716796875, -4.63006591796875, -4.45166015625, -4.27325439453125, -4.0948486328125, -3.91644287109375, -3.738037109375, -3.55963134765625, -3.3812255859375, -3.20281982421875, -3.0244140625, -2.84600830078125, -2.6676025390625, -2.48919677734375, -2.310791015625, -2.13238525390625, -1.9539794921875, -1.77557373046875, -1.59716796875, -1.41876220703125, -1.2403564453125, -1.06195068359375, -0.883544921875, -0.70513916015625, -0.5267333984375, -0.34832763671875, -0.169921875, 0.00848388671875, 0.1868896484375, 0.36529541015625, 0.543701171875, 0.72210693359375, 0.9005126953125, 1.07891845703125, 1.25732421875, 1.43572998046875, 1.6141357421875, 1.79254150390625, 1.970947265625, 2.14935302734375, 2.3277587890625, 2.50616455078125, 2.6845703125, 2.86297607421875, 3.0413818359375, 3.21978759765625, 3.398193359375, 3.57659912109375, 3.7550048828125, 3.93341064453125, 4.11181640625, 4.29022216796875, 4.4686279296875, 4.64703369140625, 4.825439453125, 5.00384521484375, 5.1822509765625, 5.36065673828125, 5.5390625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 18.0, 20.0, 20.0, 31.0, 48.0, 55.0, 85.0, 100.0, 140.0, 200.0, 291.0, 420.0, 612.0, 943.0, 1398.0, 2233.0, 3690.0, 6666.0, 12742.0, 33138.0, 162896.0, 941414.0, 2104242.0, 738562.0, 128088.0, 28872.0, 11585.0, 5908.0, 3448.0, 2086.0, 1400.0, 902.0, 620.0, 400.0, 283.0, 209.0, 120.0, 96.0, 85.0, 54.0, 44.0, 32.0, 18.0, 13.0, 16.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.1328125, -8.8326416015625, -8.532470703125, -8.2322998046875, -7.93212890625, -7.6319580078125, -7.331787109375, -7.0316162109375, -6.7314453125, -6.4312744140625, -6.131103515625, -5.8309326171875, -5.53076171875, -5.2305908203125, -4.930419921875, -4.6302490234375, -4.330078125, -4.0299072265625, -3.729736328125, -3.4295654296875, -3.12939453125, -2.8292236328125, -2.529052734375, -2.2288818359375, -1.9287109375, -1.6285400390625, -1.328369140625, -1.0281982421875, -0.72802734375, -0.4278564453125, -0.127685546875, 0.1724853515625, 0.47265625, 0.7728271484375, 1.072998046875, 1.3731689453125, 1.67333984375, 1.9735107421875, 2.273681640625, 2.5738525390625, 2.8740234375, 3.1741943359375, 3.474365234375, 3.7745361328125, 4.07470703125, 4.3748779296875, 4.675048828125, 4.9752197265625, 5.275390625, 5.5755615234375, 5.875732421875, 6.1759033203125, 6.47607421875, 6.7762451171875, 7.076416015625, 7.3765869140625, 7.6767578125, 7.9769287109375, 8.277099609375, 8.5772705078125, 8.87744140625, 9.1776123046875, 9.477783203125, 9.7779541015625, 10.078125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 8.0, 15.0, 20.0, 28.0, 68.0, 100.0, 166.0, 251.0, 487.0, 710.0, 805.0, 541.0, 352.0, 209.0, 126.0, 80.0, 38.0, 27.0, 16.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.291748046875, -14.78662109375, -14.281494140625, -13.7763671875, -13.271240234375, -12.76611328125, -12.260986328125, -11.755859375, -11.250732421875, -10.74560546875, -10.240478515625, -9.7353515625, -9.230224609375, -8.72509765625, -8.219970703125, -7.71484375, -7.209716796875, -6.70458984375, -6.199462890625, -5.6943359375, -5.189208984375, -4.68408203125, -4.178955078125, -3.673828125, -3.168701171875, -2.66357421875, -2.158447265625, -1.6533203125, -1.148193359375, -0.64306640625, -0.137939453125, 0.3671875, 0.872314453125, 1.37744140625, 1.882568359375, 2.3876953125, 2.892822265625, 3.39794921875, 3.903076171875, 4.408203125, 4.913330078125, 5.41845703125, 5.923583984375, 6.4287109375, 6.933837890625, 7.43896484375, 7.944091796875, 8.44921875, 8.954345703125, 9.45947265625, 9.964599609375, 10.4697265625, 10.974853515625, 11.47998046875, 11.985107421875, 12.490234375, 12.995361328125, 13.50048828125, 14.005615234375, 14.5107421875, 15.015869140625, 15.52099609375, 16.026123046875, 16.53125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 17.0, 32.0, 48.0, 96.0, 237.0, 506.0, 1483.0, 9955.0, 1806409.0, 2361765.0, 11083.0, 1527.0, 568.0, 251.0, 134.0, 53.0, 36.0, 28.0, 13.0, 10.0, 7.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.5, -38.3037109375, -37.107421875, -35.9111328125, -34.71484375, -33.5185546875, -32.322265625, -31.1259765625, -29.9296875, -28.7333984375, -27.537109375, -26.3408203125, -25.14453125, -23.9482421875, -22.751953125, -21.5556640625, -20.359375, -19.1630859375, -17.966796875, -16.7705078125, -15.57421875, -14.3779296875, -13.181640625, -11.9853515625, -10.7890625, -9.5927734375, -8.396484375, -7.2001953125, -6.00390625, -4.8076171875, -3.611328125, -2.4150390625, -1.21875, -0.0224609375, 1.173828125, 2.3701171875, 3.56640625, 4.7626953125, 5.958984375, 7.1552734375, 8.3515625, 9.5478515625, 10.744140625, 11.9404296875, 13.13671875, 14.3330078125, 15.529296875, 16.7255859375, 17.921875, 19.1181640625, 20.314453125, 21.5107421875, 22.70703125, 23.9033203125, 25.099609375, 26.2958984375, 27.4921875, 28.6884765625, 29.884765625, 31.0810546875, 32.27734375, 33.4736328125, 34.669921875, 35.8662109375, 37.0625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 905.0, 94.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.72854614257812, -229.88121032714844, -213.03387451171875, -196.18653869628906, -179.33920288085938, -162.4918670654297, -145.64453125, -128.7971954345703, -111.94985961914062, -95.10252380371094, -78.25518798828125, -61.40785217285156, -44.560516357421875, -27.713180541992188, -10.8658447265625, 5.9814910888671875, 22.828826904296875, 39.67616271972656, 56.52349853515625, 73.37083435058594, 90.21817016601562, 107.06550598144531, 123.912841796875, 140.7601776123047, 157.60751342773438, 174.45484924316406, 191.30218505859375, 208.14952087402344, 224.99685668945312, 241.8441925048828, 258.6915283203125, 275.53887939453125, 292.38623046875, 309.23358154296875, 326.0809020996094, 342.92822265625, 359.77557373046875, 376.6229248046875, 393.4702453613281, 410.31756591796875, 427.1649169921875, 444.01226806640625, 460.8595886230469, 477.7069091796875, 494.55426025390625, 511.401611328125, 528.2489013671875, 545.0962524414062, 561.943603515625, 578.7909545898438, 595.6383056640625, 612.485595703125, 629.3329467773438, 646.1802978515625, 663.027587890625, 679.8749389648438, 696.7222900390625, 713.5696411132812, 730.4169921875, 747.2642822265625, 764.1116333007812, 780.958984375, 797.8062744140625, 814.6536254882812, 831.5009765625]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 9.0, 12.0, 18.0, 13.0, 19.0, 26.0, 25.0, 30.0, 28.0, 26.0, 49.0, 49.0, 48.0, 39.0, 51.0, 44.0, 42.0, 45.0, 47.0, 45.0, 41.0, 37.0, 47.0, 40.0, 24.0, 20.0, 23.0, 21.0, 20.0, 18.0, 4.0, 2.0, 8.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.15995788574219, -43.93891525268555, -42.71786880493164, -41.496826171875, -40.275779724121094, -39.05473709106445, -37.83369445800781, -36.612648010253906, -35.391605377197266, -34.170562744140625, -32.94951629638672, -31.728473663330078, -30.507429122924805, -29.28638458251953, -28.065340042114258, -26.844295501708984, -25.62325096130371, -24.402206420898438, -23.181161880493164, -21.96011734008789, -20.73907470703125, -19.518030166625977, -18.296985626220703, -17.075942993164062, -15.854897499084473, -14.6338529586792, -13.412809371948242, -12.191764831542969, -10.970720291137695, -9.749676704406738, -8.528632164001465, -7.307588577270508, -6.086544036865234, -4.865499973297119, -3.644455671310425, -2.4234113693237305, -1.2023673057556152, 0.0186767578125, 1.2397212982177734, 2.4607648849487305, 3.681809425354004, 4.902853488922119, 6.123897552490234, 7.344942092895508, 8.565986633300781, 9.787030220031738, 11.008074760437012, 12.229118347167969, 13.450162887573242, 14.671207427978516, 15.892251014709473, 17.113296508789062, 18.334339141845703, 19.555383682250977, 20.77642822265625, 21.99747085571289, 23.218517303466797, 24.43956184387207, 25.660606384277344, 26.881649017333984, 28.102693557739258, 29.32373809814453, 30.544782638549805, 31.765827178955078, 32.98686981201172]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 8.0, 8.0, 7.0, 8.0, 7.0, 13.0, 12.0, 18.0, 27.0, 23.0, 22.0, 26.0, 31.0, 38.0, 34.0, 39.0, 35.0, 36.0, 45.0, 39.0, 48.0, 27.0, 18.0, 35.0, 46.0, 44.0, 28.0, 29.0, 34.0, 24.0, 22.0, 21.0, 28.0, 21.0, 10.0, 7.0, 14.0, 12.0, 4.0, 6.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.53515625, -4.38592529296875, -4.2366943359375, -4.08746337890625, -3.938232421875, -3.78900146484375, -3.6397705078125, -3.49053955078125, -3.34130859375, -3.19207763671875, -3.0428466796875, -2.89361572265625, -2.744384765625, -2.59515380859375, -2.4459228515625, -2.29669189453125, -2.1474609375, -1.99822998046875, -1.8489990234375, -1.69976806640625, -1.550537109375, -1.40130615234375, -1.2520751953125, -1.10284423828125, -0.95361328125, -0.80438232421875, -0.6551513671875, -0.50592041015625, -0.356689453125, -0.20745849609375, -0.0582275390625, 0.09100341796875, 0.240234375, 0.38946533203125, 0.5386962890625, 0.68792724609375, 0.837158203125, 0.98638916015625, 1.1356201171875, 1.28485107421875, 1.43408203125, 1.58331298828125, 1.7325439453125, 1.88177490234375, 2.031005859375, 2.18023681640625, 2.3294677734375, 2.47869873046875, 2.6279296875, 2.77716064453125, 2.9263916015625, 3.07562255859375, 3.224853515625, 3.37408447265625, 3.5233154296875, 3.67254638671875, 3.82177734375, 3.97100830078125, 4.1202392578125, 4.26947021484375, 4.418701171875, 4.56793212890625, 4.7171630859375, 4.86639404296875, 5.015625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 13.0, 13.0, 30.0, 39.0, 56.0, 81.0, 131.0, 201.0, 300.0, 474.0, 707.0, 1058.0, 1609.0, 2364.0, 3452.0, 5104.0, 7619.0, 11178.0, 16731.0, 24603.0, 36455.0, 53022.0, 74215.0, 100375.0, 126747.0, 137941.0, 122327.0, 95995.0, 70188.0, 49878.0, 33922.0, 23208.0, 15803.0, 10792.0, 7133.0, 4876.0, 3279.0, 2228.0, 1491.0, 964.0, 666.0, 414.0, 286.0, 207.0, 124.0, 88.0, 56.0, 33.0, 27.0, 19.0, 5.0, 9.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.471435546875, -0.4568939208984375, -0.442352294921875, -0.4278106689453125, -0.41326904296875, -0.3987274169921875, -0.384185791015625, -0.3696441650390625, -0.3551025390625, -0.3405609130859375, -0.326019287109375, -0.3114776611328125, -0.29693603515625, -0.2823944091796875, -0.267852783203125, -0.2533111572265625, -0.23876953125, -0.2242279052734375, -0.209686279296875, -0.1951446533203125, -0.18060302734375, -0.1660614013671875, -0.151519775390625, -0.1369781494140625, -0.1224365234375, -0.1078948974609375, -0.093353271484375, -0.0788116455078125, -0.06427001953125, -0.0497283935546875, -0.035186767578125, -0.0206451416015625, -0.006103515625, 0.0084381103515625, 0.022979736328125, 0.0375213623046875, 0.05206298828125, 0.0666046142578125, 0.081146240234375, 0.0956878662109375, 0.1102294921875, 0.1247711181640625, 0.139312744140625, 0.1538543701171875, 0.16839599609375, 0.1829376220703125, 0.197479248046875, 0.2120208740234375, 0.2265625, 0.2411041259765625, 0.255645751953125, 0.2701873779296875, 0.28472900390625, 0.2992706298828125, 0.313812255859375, 0.3283538818359375, 0.3428955078125, 0.3574371337890625, 0.371978759765625, 0.3865203857421875, 0.40106201171875, 0.4156036376953125, 0.430145263671875, 0.4446868896484375, 0.459228515625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 8.0, 10.0, 11.0, 12.0, 16.0, 14.0, 18.0, 19.0, 20.0, 21.0, 24.0, 45.0, 33.0, 29.0, 31.0, 35.0, 50.0, 35.0, 41.0, 1055.0, 45.0, 45.0, 32.0, 36.0, 30.0, 39.0, 30.0, 25.0, 28.0, 28.0, 22.0, 17.0, 11.0, 23.0, 12.0, 15.0, 15.0, 11.0, 7.0, 8.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -3.010650634765625, -2.90606689453125, -2.801483154296875, -2.6968994140625, -2.592315673828125, -2.48773193359375, -2.383148193359375, -2.278564453125, -2.173980712890625, -2.06939697265625, -1.964813232421875, -1.8602294921875, -1.755645751953125, -1.65106201171875, -1.546478271484375, -1.44189453125, -1.337310791015625, -1.23272705078125, -1.128143310546875, -1.0235595703125, -0.918975830078125, -0.81439208984375, -0.709808349609375, -0.605224609375, -0.500640869140625, -0.39605712890625, -0.291473388671875, -0.1868896484375, -0.082305908203125, 0.02227783203125, 0.126861572265625, 0.2314453125, 0.336029052734375, 0.44061279296875, 0.545196533203125, 0.6497802734375, 0.754364013671875, 0.85894775390625, 0.963531494140625, 1.068115234375, 1.172698974609375, 1.27728271484375, 1.381866455078125, 1.4864501953125, 1.591033935546875, 1.69561767578125, 1.800201416015625, 1.90478515625, 2.009368896484375, 2.11395263671875, 2.218536376953125, 2.3231201171875, 2.427703857421875, 2.53228759765625, 2.636871337890625, 2.741455078125, 2.846038818359375, 2.95062255859375, 3.055206298828125, 3.1597900390625, 3.264373779296875, 3.36895751953125, 3.473541259765625, 3.578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 8.0, 12.0, 22.0, 27.0, 35.0, 51.0, 98.0, 126.0, 207.0, 329.0, 491.0, 826.0, 1287.0, 2094.0, 3261.0, 5172.0, 8465.0, 13570.0, 22056.0, 35160.0, 54669.0, 83132.0, 119032.0, 159638.0, 1201257.0, 128409.0, 91620.0, 60903.0, 39390.0, 24911.0, 15458.0, 9542.0, 5922.0, 3612.0, 2331.0, 1416.0, 926.0, 624.0, 431.0, 221.0, 128.0, 93.0, 43.0, 53.0, 35.0, 12.0, 16.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.412841796875, -0.3999900817871094, -0.38713836669921875, -0.3742866516113281, -0.3614349365234375, -0.3485832214355469, -0.33573150634765625, -0.3228797912597656, -0.310028076171875, -0.2971763610839844, -0.28432464599609375, -0.2714729309082031, -0.2586212158203125, -0.24576950073242188, -0.23291778564453125, -0.22006607055664062, -0.20721435546875, -0.19436264038085938, -0.18151092529296875, -0.16865921020507812, -0.1558074951171875, -0.14295578002929688, -0.13010406494140625, -0.11725234985351562, -0.104400634765625, -0.09154891967773438, -0.07869720458984375, -0.06584548950195312, -0.0529937744140625, -0.040142059326171875, -0.02729034423828125, -0.014438629150390625, -0.0015869140625, 0.011264801025390625, 0.02411651611328125, 0.036968231201171875, 0.0498199462890625, 0.06267166137695312, 0.07552337646484375, 0.08837509155273438, 0.101226806640625, 0.11407852172851562, 0.12693023681640625, 0.13978195190429688, 0.1526336669921875, 0.16548538208007812, 0.17833709716796875, 0.19118881225585938, 0.20404052734375, 0.21689224243164062, 0.22974395751953125, 0.24259567260742188, 0.2554473876953125, 0.2682991027832031, 0.28115081787109375, 0.2940025329589844, 0.306854248046875, 0.3197059631347656, 0.33255767822265625, 0.3454093933105469, 0.3582611083984375, 0.3711128234863281, 0.38396453857421875, 0.3968162536621094, 0.40966796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 7.0, 3.0, 4.0, 9.0, 7.0, 14.0, 18.0, 13.0, 21.0, 14.0, 33.0, 27.0, 40.0, 57.0, 72.0, 87.0, 88.0, 98.0, 71.0, 63.0, 47.0, 42.0, 24.0, 16.0, 24.0, 14.0, 12.0, 16.0, 9.0, 4.0, 7.0, 8.0, 11.0, 2.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.004489898681640625, -0.004364192485809326, -0.004238486289978027, -0.0041127800941467285, -0.00398707389831543, -0.003861367702484131, -0.003735661506652832, -0.003609955310821533, -0.0034842491149902344, -0.0033585429191589355, -0.0032328367233276367, -0.003107130527496338, -0.002981424331665039, -0.0028557181358337402, -0.0027300119400024414, -0.0026043057441711426, -0.0024785995483398438, -0.002352893352508545, -0.002227187156677246, -0.0021014809608459473, -0.0019757747650146484, -0.0018500685691833496, -0.0017243623733520508, -0.001598656177520752, -0.0014729499816894531, -0.0013472437858581543, -0.0012215375900268555, -0.0010958313941955566, -0.0009701251983642578, -0.000844419002532959, -0.0007187128067016602, -0.0005930066108703613, -0.0004673004150390625, -0.00034159421920776367, -0.00021588802337646484, -9.018182754516602e-05, 3.552436828613281e-05, 0.00016123056411743164, 0.00028693675994873047, 0.0004126429557800293, 0.0005383491516113281, 0.000664055347442627, 0.0007897615432739258, 0.0009154677391052246, 0.0010411739349365234, 0.0011668801307678223, 0.001292586326599121, 0.00141829252243042, 0.0015439987182617188, 0.0016697049140930176, 0.0017954111099243164, 0.0019211173057556152, 0.002046823501586914, 0.002172529697418213, 0.0022982358932495117, 0.0024239420890808105, 0.0025496482849121094, 0.002675354480743408, 0.002801060676574707, 0.002926766872406006, 0.0030524730682373047, 0.0031781792640686035, 0.0033038854598999023, 0.003429591655731201, 0.0035552978515625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 6.0, 17.0, 11.0, 15.0, 17.0, 26.0, 30.0, 37.0, 51.0, 64.0, 98.0, 162.0, 241.0, 406.0, 1040.0, 35629.0, 999465.0, 9465.0, 721.0, 327.0, 212.0, 138.0, 78.0, 67.0, 48.0, 41.0, 30.0, 16.0, 14.0, 15.0, 10.0, 5.0, 15.0, 7.0, 2.0, 8.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.08074951171875, -0.07832908630371094, -0.07590866088867188, -0.07348823547363281, -0.07106781005859375, -0.06864738464355469, -0.06622695922851562, -0.06380653381347656, -0.0613861083984375, -0.05896568298339844, -0.056545257568359375, -0.05412483215332031, -0.05170440673828125, -0.04928398132324219, -0.046863555908203125, -0.04444313049316406, -0.042022705078125, -0.03960227966308594, -0.037181854248046875, -0.03476142883300781, -0.03234100341796875, -0.029920578002929688, -0.027500152587890625, -0.025079727172851562, -0.0226593017578125, -0.020238876342773438, -0.017818450927734375, -0.015398025512695312, -0.01297760009765625, -0.010557174682617188, -0.008136749267578125, -0.0057163238525390625, -0.0032958984375, -0.0008754730224609375, 0.001544952392578125, 0.0039653778076171875, 0.00638580322265625, 0.008806228637695312, 0.011226654052734375, 0.013647079467773438, 0.0160675048828125, 0.018487930297851562, 0.020908355712890625, 0.023328781127929688, 0.02574920654296875, 0.028169631958007812, 0.030590057373046875, 0.03301048278808594, 0.035430908203125, 0.03785133361816406, 0.040271759033203125, 0.04269218444824219, 0.04511260986328125, 0.04753303527832031, 0.049953460693359375, 0.05237388610839844, 0.0547943115234375, 0.05721473693847656, 0.059635162353515625, 0.06205558776855469, 0.06447601318359375, 0.06689643859863281, 0.06931686401367188, 0.07173728942871094, 0.07415771484375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 62.0, 459.0, 427.0, 49.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023918382823467255, -0.02328827977180481, -0.022658176720142365, -0.02202807553112507, -0.021397972479462624, -0.02076786942780018, -0.020137766376137733, -0.019507665187120438, -0.018877562135457993, -0.018247459083795547, -0.017617356032133102, -0.016987254843115807, -0.01635715179145336, -0.015727048739790916, -0.015096945688128471, -0.014466843567788601, -0.013836740516126156, -0.01320663746446371, -0.01257653534412384, -0.011946432292461395, -0.011316330172121525, -0.01068622712045908, -0.01005612500011921, -0.009426021948456764, -0.00879591889679432, -0.008165815845131874, -0.007535713724792004, -0.0069056106731295586, -0.006275508552789688, -0.005645405501127243, -0.005015302915126085, -0.0043852003291249275, -0.003755098208785057, -0.0031249956227838993, -0.0024948930367827415, -0.0018647902179509401, -0.0012346876319497824, -0.0006045850459486246, 2.5517772883176804e-05, 0.0006556203588843346, 0.0012857229448854923, 0.00191582553088665, 0.002545928116887808, 0.0031760309357196093, 0.003806133521720767, 0.004436235874891281, 0.005066338926553726, 0.005696441512554884, 0.006326544098556042, 0.0069566466845571995, 0.007586749270558357, 0.008216852322220802, 0.008846954442560673, 0.009477057494223118, 0.010107159614562988, 0.010737262666225433, 0.011367365717887878, 0.011997468769550323, 0.012627570889890194, 0.013257673941552639, 0.01388777606189251, 0.014517879113554955, 0.0151479821652174, 0.015778083354234695, 0.01640818640589714]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 3.0, 6.0, 2.0, 8.0, 11.0, 7.0, 15.0, 17.0, 12.0, 24.0, 19.0, 26.0, 26.0, 28.0, 38.0, 43.0, 50.0, 38.0, 39.0, 39.0, 45.0, 48.0, 42.0, 44.0, 45.0, 45.0, 38.0, 35.0, 36.0, 23.0, 18.0, 20.0, 27.0, 17.0, 17.0, 14.0, 12.0, 10.0, 4.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023120641708374023, -0.0022395411506295204, -0.0021670181304216385, -0.0020944951102137566, -0.0020219720900058746, -0.0019494490697979927, -0.0018769260495901108, -0.0018044030293822289, -0.001731880009174347, -0.001659356988966465, -0.001586833968758583, -0.0015143109485507011, -0.0014417879283428192, -0.0013692649081349373, -0.0012967418879270554, -0.0012242188677191734, -0.0011516958475112915, -0.0010791728273034096, -0.0010066498070955276, -0.0009341267868876457, -0.0008616037666797638, -0.0007890807464718819, -0.0007165577262639999, -0.000644034706056118, -0.0005715116858482361, -0.0004989886656403542, -0.00042646564543247223, -0.0003539426252245903, -0.0002814196050167084, -0.00020889658480882645, -0.00013637356460094452, -6.385054439306259e-05, 8.672475814819336e-06, 8.119549602270126e-05, 0.0001537185162305832, 0.00022624153643846512, 0.00029876455664634705, 0.000371287576854229, 0.0004438105970621109, 0.0005163336172699928, 0.0005888566374778748, 0.0006613796576857567, 0.0007339026778936386, 0.0008064256981015205, 0.0008789487183094025, 0.0009514717385172844, 0.0010239947587251663, 0.0010965177789330482, 0.0011690407991409302, 0.001241563819348812, 0.001314086839556694, 0.001386609859764576, 0.0014591328799724579, 0.0015316559001803398, 0.0016041789203882217, 0.0016767019405961037, 0.0017492249608039856, 0.0018217479810118675, 0.0018942710012197495, 0.0019667940214276314, 0.0020393170416355133, 0.0021118400618433952, 0.002184363082051277, 0.002256886102259159, 0.002329409122467041]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 11.0, 8.0, 8.0, 7.0, 8.0, 7.0, 13.0, 12.0, 18.0, 27.0, 23.0, 22.0, 26.0, 31.0, 39.0, 33.0, 39.0, 35.0, 36.0, 45.0, 39.0, 48.0, 27.0, 18.0, 35.0, 46.0, 44.0, 28.0, 29.0, 34.0, 24.0, 22.0, 21.0, 28.0, 21.0, 10.0, 7.0, 14.0, 12.0, 4.0, 6.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.53515625, -4.38592529296875, -4.2366943359375, -4.08746337890625, -3.938232421875, -3.78900146484375, -3.6397705078125, -3.49053955078125, -3.34130859375, -3.19207763671875, -3.0428466796875, -2.89361572265625, -2.744384765625, -2.59515380859375, -2.4459228515625, -2.29669189453125, -2.1474609375, -1.99822998046875, -1.8489990234375, -1.69976806640625, -1.550537109375, -1.40130615234375, -1.2520751953125, -1.10284423828125, -0.95361328125, -0.80438232421875, -0.6551513671875, -0.50592041015625, -0.356689453125, -0.20745849609375, -0.0582275390625, 0.09100341796875, 0.240234375, 0.38946533203125, 0.5386962890625, 0.68792724609375, 0.837158203125, 0.98638916015625, 1.1356201171875, 1.28485107421875, 1.43408203125, 1.58331298828125, 1.7325439453125, 1.88177490234375, 2.031005859375, 2.18023681640625, 2.3294677734375, 2.47869873046875, 2.6279296875, 2.77716064453125, 2.9263916015625, 3.07562255859375, 3.224853515625, 3.37408447265625, 3.5233154296875, 3.67254638671875, 3.82177734375, 3.97100830078125, 4.1202392578125, 4.26947021484375, 4.418701171875, 4.56793212890625, 4.7171630859375, 4.86639404296875, 5.015625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 7.0, 12.0, 9.0, 13.0, 17.0, 16.0, 32.0, 36.0, 48.0, 59.0, 64.0, 112.0, 148.0, 204.0, 315.0, 448.0, 705.0, 1163.0, 2396.0, 5429.0, 17161.0, 77889.0, 462657.0, 390259.0, 64309.0, 14725.0, 4853.0, 2184.0, 1124.0, 629.0, 436.0, 307.0, 222.0, 138.0, 103.0, 76.0, 55.0, 41.0, 31.0, 24.0, 22.0, 15.0, 12.0, 11.0, 10.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-8.734375, -8.4609375, -8.1875, -7.9140625, -7.640625, -7.3671875, -7.09375, -6.8203125, -6.546875, -6.2734375, -6.0, -5.7265625, -5.453125, -5.1796875, -4.90625, -4.6328125, -4.359375, -4.0859375, -3.8125, -3.5390625, -3.265625, -2.9921875, -2.71875, -2.4453125, -2.171875, -1.8984375, -1.625, -1.3515625, -1.078125, -0.8046875, -0.53125, -0.2578125, 0.015625, 0.2890625, 0.5625, 0.8359375, 1.109375, 1.3828125, 1.65625, 1.9296875, 2.203125, 2.4765625, 2.75, 3.0234375, 3.296875, 3.5703125, 3.84375, 4.1171875, 4.390625, 4.6640625, 4.9375, 5.2109375, 5.484375, 5.7578125, 6.03125, 6.3046875, 6.578125, 6.8515625, 7.125, 7.3984375, 7.671875, 7.9453125, 8.21875, 8.4921875, 8.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 7.0, 8.0, 13.0, 9.0, 9.0, 19.0, 26.0, 24.0, 35.0, 28.0, 44.0, 54.0, 73.0, 90.0, 242.0, 1487.0, 286.0, 154.0, 80.0, 71.0, 40.0, 39.0, 50.0, 23.0, 25.0, 16.0, 21.0, 11.0, 9.0, 11.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-19.21875, -18.6793212890625, -18.139892578125, -17.6004638671875, -17.06103515625, -16.5216064453125, -15.982177734375, -15.4427490234375, -14.9033203125, -14.3638916015625, -13.824462890625, -13.2850341796875, -12.74560546875, -12.2061767578125, -11.666748046875, -11.1273193359375, -10.587890625, -10.0484619140625, -9.509033203125, -8.9696044921875, -8.43017578125, -7.8907470703125, -7.351318359375, -6.8118896484375, -6.2724609375, -5.7330322265625, -5.193603515625, -4.6541748046875, -4.11474609375, -3.5753173828125, -3.035888671875, -2.4964599609375, -1.95703125, -1.4176025390625, -0.878173828125, -0.3387451171875, 0.20068359375, 0.7401123046875, 1.279541015625, 1.8189697265625, 2.3583984375, 2.8978271484375, 3.437255859375, 3.9766845703125, 4.51611328125, 5.0555419921875, 5.594970703125, 6.1343994140625, 6.673828125, 7.2132568359375, 7.752685546875, 8.2921142578125, 8.83154296875, 9.3709716796875, 9.910400390625, 10.4498291015625, 10.9892578125, 11.5286865234375, 12.068115234375, 12.6075439453125, 13.14697265625, 13.6864013671875, 14.225830078125, 14.7652587890625, 15.3046875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 7.0, 0.0, 2.0, 3.0, 7.0, 8.0, 12.0, 4.0, 11.0, 16.0, 22.0, 37.0, 39.0, 60.0, 67.0, 141.0, 197.0, 397.0, 739.0, 2580.0, 2985885.0, 152504.0, 1513.0, 562.0, 312.0, 195.0, 114.0, 80.0, 37.0, 32.0, 36.0, 15.0, 13.0, 10.0, 12.0, 10.0, 6.0, 5.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-45.46875, -44.1259765625, -42.783203125, -41.4404296875, -40.09765625, -38.7548828125, -37.412109375, -36.0693359375, -34.7265625, -33.3837890625, -32.041015625, -30.6982421875, -29.35546875, -28.0126953125, -26.669921875, -25.3271484375, -23.984375, -22.6416015625, -21.298828125, -19.9560546875, -18.61328125, -17.2705078125, -15.927734375, -14.5849609375, -13.2421875, -11.8994140625, -10.556640625, -9.2138671875, -7.87109375, -6.5283203125, -5.185546875, -3.8427734375, -2.5, -1.1572265625, 0.185546875, 1.5283203125, 2.87109375, 4.2138671875, 5.556640625, 6.8994140625, 8.2421875, 9.5849609375, 10.927734375, 12.2705078125, 13.61328125, 14.9560546875, 16.298828125, 17.6416015625, 18.984375, 20.3271484375, 21.669921875, 23.0126953125, 24.35546875, 25.6982421875, 27.041015625, 28.3837890625, 29.7265625, 31.0693359375, 32.412109375, 33.7548828125, 35.09765625, 36.4404296875, 37.783203125, 39.1259765625, 40.46875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 40.0, 948.0, 28.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.12523651123047, -80.39488220214844, -72.6645278930664, -64.93417358398438, -57.20382308959961, -49.47346878051758, -41.74311828613281, -34.01276397705078, -26.28240966796875, -18.55205535888672, -10.82170295715332, -3.091350555419922, 4.639003753662109, 12.36935806274414, 20.099708557128906, 27.830062866210938, 35.56041717529297, 43.290771484375, 51.02112579345703, 58.7514762878418, 66.48182678222656, 74.21218872070312, 81.94253540039062, 89.67288970947266, 97.40324401855469, 105.13359832763672, 112.86395263671875, 120.59429931640625, 128.3246612548828, 136.0550079345703, 143.78536987304688, 151.51571655273438, 159.24606323242188, 166.97640991210938, 174.70677185058594, 182.43711853027344, 190.16748046875, 197.8978271484375, 205.628173828125, 213.35853576660156, 221.08889770507812, 228.81924438476562, 236.5496063232422, 244.2799530029297, 252.01031494140625, 259.74066162109375, 267.47100830078125, 275.20135498046875, 282.93170166015625, 290.66204833984375, 298.39239501953125, 306.1227722167969, 313.8531188964844, 321.5834655761719, 329.3138122558594, 337.044189453125, 344.7745361328125, 352.5048828125, 360.2352294921875, 367.9656066894531, 375.6959533691406, 383.4263000488281, 391.1566467285156, 398.88702392578125, 406.61737060546875]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 6.0, 10.0, 12.0, 14.0, 11.0, 19.0, 16.0, 20.0, 23.0, 31.0, 27.0, 37.0, 39.0, 42.0, 47.0, 32.0, 45.0, 39.0, 35.0, 42.0, 50.0, 44.0, 47.0, 29.0, 35.0, 30.0, 24.0, 30.0, 25.0, 20.0, 23.0, 23.0, 10.0, 12.0, 4.0, 3.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-31.725662231445312, -30.64242172241211, -29.559181213378906, -28.475940704345703, -27.3927001953125, -26.309459686279297, -25.22621726989746, -24.142976760864258, -23.059736251831055, -21.97649574279785, -20.89325523376465, -19.810014724731445, -18.72677230834961, -17.643531799316406, -16.560291290283203, -15.47705078125, -14.393810272216797, -13.310569763183594, -12.22732925415039, -11.144087791442871, -10.060847282409668, -8.977606773376465, -7.8943657875061035, -6.811124801635742, -5.727884292602539, -4.644643783569336, -3.5614027976989746, -2.4781620502471924, -1.3949213027954102, -0.31168079376220703, 0.7715601921081543, 1.8548011779785156, 2.9380416870117188, 4.021282196044922, 5.104523181915283, 6.1877641677856445, 7.271004676818848, 8.35424518585205, 9.43748664855957, 10.520727157592773, 11.603967666625977, 12.68720817565918, 13.770448684692383, 14.853690147399902, 15.936930656433105, 17.020172119140625, 18.103412628173828, 19.18665313720703, 20.269893646240234, 21.353134155273438, 22.43637466430664, 23.519615173339844, 24.602855682373047, 25.68609619140625, 26.769338607788086, 27.85257911682129, 28.935819625854492, 30.019060134887695, 31.1023006439209, 32.185543060302734, 33.26878356933594, 34.35202407836914, 35.435264587402344, 36.51850509643555, 37.60174560546875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 3.0, 9.0, 10.0, 7.0, 6.0, 11.0, 12.0, 14.0, 17.0, 21.0, 24.0, 36.0, 23.0, 32.0, 33.0, 32.0, 34.0, 33.0, 38.0, 39.0, 40.0, 47.0, 41.0, 40.0, 40.0, 37.0, 31.0, 33.0, 38.0, 29.0, 20.0, 24.0, 25.0, 12.0, 18.0, 12.0, 12.0, 10.0, 8.0, 9.0, 4.0, 5.0, 6.0, 8.0, 6.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.73828125, -5.5611572265625, -5.384033203125, -5.2069091796875, -5.02978515625, -4.8526611328125, -4.675537109375, -4.4984130859375, -4.3212890625, -4.1441650390625, -3.967041015625, -3.7899169921875, -3.61279296875, -3.4356689453125, -3.258544921875, -3.0814208984375, -2.904296875, -2.7271728515625, -2.550048828125, -2.3729248046875, -2.19580078125, -2.0186767578125, -1.841552734375, -1.6644287109375, -1.4873046875, -1.3101806640625, -1.133056640625, -0.9559326171875, -0.77880859375, -0.6016845703125, -0.424560546875, -0.2474365234375, -0.0703125, 0.1068115234375, 0.283935546875, 0.4610595703125, 0.63818359375, 0.8153076171875, 0.992431640625, 1.1695556640625, 1.3466796875, 1.5238037109375, 1.700927734375, 1.8780517578125, 2.05517578125, 2.2322998046875, 2.409423828125, 2.5865478515625, 2.763671875, 2.9407958984375, 3.117919921875, 3.2950439453125, 3.47216796875, 3.6492919921875, 3.826416015625, 4.0035400390625, 4.1806640625, 4.3577880859375, 4.534912109375, 4.7120361328125, 4.88916015625, 5.0662841796875, 5.243408203125, 5.4205322265625, 5.59765625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 8.0, 23.0, 24.0, 35.0, 36.0, 47.0, 50.0, 86.0, 106.0, 124.0, 180.0, 218.0, 312.0, 441.0, 640.0, 1276.0, 3819.0, 20986.0, 548869.0, 3455665.0, 144063.0, 11419.0, 2640.0, 1023.0, 571.0, 398.0, 275.0, 199.0, 145.0, 130.0, 110.0, 73.0, 53.0, 51.0, 34.0, 37.0, 26.0, 18.0, 14.0, 6.0, 10.0, 7.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.1875, -27.258544921875, -26.32958984375, -25.400634765625, -24.4716796875, -23.542724609375, -22.61376953125, -21.684814453125, -20.755859375, -19.826904296875, -18.89794921875, -17.968994140625, -17.0400390625, -16.111083984375, -15.18212890625, -14.253173828125, -13.32421875, -12.395263671875, -11.46630859375, -10.537353515625, -9.6083984375, -8.679443359375, -7.75048828125, -6.821533203125, -5.892578125, -4.963623046875, -4.03466796875, -3.105712890625, -2.1767578125, -1.247802734375, -0.31884765625, 0.610107421875, 1.5390625, 2.468017578125, 3.39697265625, 4.325927734375, 5.2548828125, 6.183837890625, 7.11279296875, 8.041748046875, 8.970703125, 9.899658203125, 10.82861328125, 11.757568359375, 12.6865234375, 13.615478515625, 14.54443359375, 15.473388671875, 16.40234375, 17.331298828125, 18.26025390625, 19.189208984375, 20.1181640625, 21.047119140625, 21.97607421875, 22.905029296875, 23.833984375, 24.762939453125, 25.69189453125, 26.620849609375, 27.5498046875, 28.478759765625, 29.40771484375, 30.336669921875, 31.265625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 5.0, 3.0, 7.0, 7.0, 12.0, 21.0, 37.0, 61.0, 86.0, 132.0, 185.0, 300.0, 433.0, 607.0, 635.0, 533.0, 341.0, 211.0, 149.0, 91.0, 66.0, 41.0, 29.0, 17.0, 16.0, 14.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.471923828125, -10.02197265625, -9.572021484375, -9.1220703125, -8.672119140625, -8.22216796875, -7.772216796875, -7.322265625, -6.872314453125, -6.42236328125, -5.972412109375, -5.5224609375, -5.072509765625, -4.62255859375, -4.172607421875, -3.72265625, -3.272705078125, -2.82275390625, -2.372802734375, -1.9228515625, -1.472900390625, -1.02294921875, -0.572998046875, -0.123046875, 0.326904296875, 0.77685546875, 1.226806640625, 1.6767578125, 2.126708984375, 2.57666015625, 3.026611328125, 3.4765625, 3.926513671875, 4.37646484375, 4.826416015625, 5.2763671875, 5.726318359375, 6.17626953125, 6.626220703125, 7.076171875, 7.526123046875, 7.97607421875, 8.426025390625, 8.8759765625, 9.325927734375, 9.77587890625, 10.225830078125, 10.67578125, 11.125732421875, 11.57568359375, 12.025634765625, 12.4755859375, 12.925537109375, 13.37548828125, 13.825439453125, 14.275390625, 14.725341796875, 15.17529296875, 15.625244140625, 16.0751953125, 16.525146484375, 16.97509765625, 17.425048828125, 17.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 12.0, 12.0, 22.0, 15.0, 21.0, 43.0, 69.0, 101.0, 178.0, 277.0, 520.0, 895.0, 1660.0, 3984.0, 9966.0, 32137.0, 139382.0, 924705.0, 2540197.0, 429739.0, 77155.0, 20257.0, 6918.0, 2884.0, 1387.0, 683.0, 374.0, 262.0, 166.0, 89.0, 75.0, 22.0, 26.0, 16.0, 10.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.1990966796875, -8.835693359375, -8.4722900390625, -8.10888671875, -7.7454833984375, -7.382080078125, -7.0186767578125, -6.6552734375, -6.2918701171875, -5.928466796875, -5.5650634765625, -5.20166015625, -4.8382568359375, -4.474853515625, -4.1114501953125, -3.748046875, -3.3846435546875, -3.021240234375, -2.6578369140625, -2.29443359375, -1.9310302734375, -1.567626953125, -1.2042236328125, -0.8408203125, -0.4774169921875, -0.114013671875, 0.2493896484375, 0.61279296875, 0.9761962890625, 1.339599609375, 1.7030029296875, 2.06640625, 2.4298095703125, 2.793212890625, 3.1566162109375, 3.52001953125, 3.8834228515625, 4.246826171875, 4.6102294921875, 4.9736328125, 5.3370361328125, 5.700439453125, 6.0638427734375, 6.42724609375, 6.7906494140625, 7.154052734375, 7.5174560546875, 7.880859375, 8.2442626953125, 8.607666015625, 8.9710693359375, 9.33447265625, 9.6978759765625, 10.061279296875, 10.4246826171875, 10.7880859375, 11.1514892578125, 11.514892578125, 11.8782958984375, 12.24169921875, 12.6051025390625, 12.968505859375, 13.3319091796875, 13.6953125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 2.0, 9.0, 6.0, 11.0, 23.0, 26.0, 32.0, 66.0, 61.0, 52.0, 110.0, 109.0, 100.0, 103.0, 75.0, 59.0, 43.0, 37.0, 32.0, 20.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.6331787109375, -66.67305755615234, -63.71293640136719, -60.75281524658203, -57.792694091796875, -54.83257293701172, -51.8724479675293, -48.91232681274414, -45.952205657958984, -42.99208450317383, -40.03196334838867, -37.07183837890625, -34.111717224121094, -31.15159797668457, -28.19147491455078, -25.231353759765625, -22.27123260498047, -19.311111450195312, -16.350990295410156, -13.390867233276367, -10.430746078491211, -7.470624923706055, -4.510501861572266, -1.5503807067871094, 1.4097404479980469, 4.369862079620361, 7.329983711242676, 10.290105819702148, 13.250226974487305, 16.21034812927246, 19.17047119140625, 22.130592346191406, 25.090721130371094, 28.05084228515625, 31.010963439941406, 33.97108459472656, 36.93120574951172, 39.891326904296875, 42.8514518737793, 45.81157302856445, 48.77169418334961, 51.731815338134766, 54.69193649291992, 57.652061462402344, 60.6121826171875, 63.572303771972656, 66.53242492675781, 69.49254608154297, 72.45266723632812, 75.41278839111328, 78.37290954589844, 81.3330307006836, 84.29315185546875, 87.2532730102539, 90.21339416503906, 93.17352294921875, 96.13363647460938, 99.09375762939453, 102.05387878417969, 105.01399993896484, 107.97412109375, 110.93424224853516, 113.89436340332031, 116.8544921875, 119.81461334228516]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 5.0, 10.0, 8.0, 7.0, 19.0, 25.0, 20.0, 32.0, 25.0, 16.0, 32.0, 30.0, 36.0, 31.0, 41.0, 43.0, 37.0, 49.0, 38.0, 35.0, 51.0, 47.0, 34.0, 39.0, 40.0, 35.0, 27.0, 38.0, 28.0, 20.0, 23.0, 14.0, 11.0, 7.0, 10.0, 17.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-51.48828125, -49.910430908203125, -48.332584381103516, -46.75473403930664, -45.17688751220703, -43.599037170410156, -42.02119064331055, -40.44334030151367, -38.86549377441406, -37.28764343261719, -35.70979690551758, -34.1319465637207, -32.554100036621094, -30.97625160217285, -29.39840316772461, -27.820552825927734, -26.242704391479492, -24.66485595703125, -23.087007522583008, -21.509159088134766, -19.931310653686523, -18.35346221923828, -16.775611877441406, -15.19776439666748, -13.619915962219238, -12.042067527770996, -10.464219093322754, -8.886369705200195, -7.308521747589111, -5.730673313140869, -4.152824401855469, -2.5749759674072266, -0.9971275329589844, 0.5807210206985474, 2.158569574356079, 3.7364182472229004, 5.314266681671143, 6.892115116119385, 8.469964027404785, 10.047812461853027, 11.62566089630127, 13.203509330749512, 14.781357765197754, 16.359207153320312, 17.937055587768555, 19.514904022216797, 21.09275245666504, 22.67060089111328, 24.248449325561523, 25.826297760009766, 27.404146194458008, 28.98199462890625, 30.559843063354492, 32.137691497802734, 33.71554183959961, 35.29338836669922, 36.871238708496094, 38.44908905029297, 40.02693557739258, 41.60478591918945, 43.18263244628906, 44.76048278808594, 46.33832931518555, 47.91617965698242, 49.49402618408203]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 5.0, 12.0, 15.0, 23.0, 23.0, 30.0, 26.0, 30.0, 30.0, 40.0, 34.0, 42.0, 43.0, 56.0, 44.0, 41.0, 47.0, 51.0, 45.0, 31.0, 41.0, 46.0, 37.0, 36.0, 33.0, 22.0, 25.0, 15.0, 11.0, 12.0, 13.0, 8.0, 7.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.5625, -86.7421875, -83.921875, -81.1015625, -78.28125, -75.4609375, -72.640625, -69.8203125, -67.0, -64.1796875, -61.359375, -58.5390625, -55.71875, -52.8984375, -50.078125, -47.2578125, -44.4375, -41.6171875, -38.796875, -35.9765625, -33.15625, -30.3359375, -27.515625, -24.6953125, -21.875, -19.0546875, -16.234375, -13.4140625, -10.59375, -7.7734375, -4.953125, -2.1328125, 0.6875, 3.5078125, 6.328125, 9.1484375, 11.96875, 14.7890625, 17.609375, 20.4296875, 23.25, 26.0703125, 28.890625, 31.7109375, 34.53125, 37.3515625, 40.171875, 42.9921875, 45.8125, 48.6328125, 51.453125, 54.2734375, 57.09375, 59.9140625, 62.734375, 65.5546875, 68.375, 71.1953125, 74.015625, 76.8359375, 79.65625, 82.4765625, 85.296875, 88.1171875, 90.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 13.0, 17.0, 22.0, 21.0, 59.0, 99.0, 114.0, 195.0, 270.0, 456.0, 691.0, 1020.0, 1627.0, 2683.0, 4590.0, 7195.0, 11399.0, 18524.0, 29580.0, 46044.0, 70772.0, 102713.0, 142277.0, 165225.0, 142950.0, 104468.0, 70351.0, 46249.0, 29677.0, 18582.0, 11679.0, 7080.0, 4396.0, 2735.0, 1709.0, 1072.0, 665.0, 454.0, 262.0, 210.0, 125.0, 91.0, 48.0, 39.0, 29.0, 26.0, 12.0, 12.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.39453125, -7.16705322265625, -6.9395751953125, -6.71209716796875, -6.484619140625, -6.25714111328125, -6.0296630859375, -5.80218505859375, -5.57470703125, -5.34722900390625, -5.1197509765625, -4.89227294921875, -4.664794921875, -4.43731689453125, -4.2098388671875, -3.98236083984375, -3.7548828125, -3.52740478515625, -3.2999267578125, -3.07244873046875, -2.844970703125, -2.61749267578125, -2.3900146484375, -2.16253662109375, -1.93505859375, -1.70758056640625, -1.4801025390625, -1.25262451171875, -1.025146484375, -0.79766845703125, -0.5701904296875, -0.34271240234375, -0.115234375, 0.11224365234375, 0.3397216796875, 0.56719970703125, 0.794677734375, 1.02215576171875, 1.2496337890625, 1.47711181640625, 1.70458984375, 1.93206787109375, 2.1595458984375, 2.38702392578125, 2.614501953125, 2.84197998046875, 3.0694580078125, 3.29693603515625, 3.5244140625, 3.75189208984375, 3.9793701171875, 4.20684814453125, 4.434326171875, 4.66180419921875, 4.8892822265625, 5.11676025390625, 5.34423828125, 5.57171630859375, 5.7991943359375, 6.02667236328125, 6.254150390625, 6.48162841796875, 6.7091064453125, 6.93658447265625, 7.1640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 12.0, 4.0, 6.0, 11.0, 8.0, 16.0, 16.0, 19.0, 15.0, 28.0, 20.0, 36.0, 25.0, 26.0, 36.0, 30.0, 41.0, 33.0, 34.0, 36.0, 30.0, 1057.0, 38.0, 34.0, 36.0, 35.0, 35.0, 34.0, 31.0, 28.0, 31.0, 21.0, 21.0, 25.0, 15.0, 16.0, 20.0, 11.0, 15.0, 7.0, 11.0, 2.0, 4.0, 4.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-48.90625, -47.49169921875, -46.0771484375, -44.66259765625, -43.248046875, -41.83349609375, -40.4189453125, -39.00439453125, -37.58984375, -36.17529296875, -34.7607421875, -33.34619140625, -31.931640625, -30.51708984375, -29.1025390625, -27.68798828125, -26.2734375, -24.85888671875, -23.4443359375, -22.02978515625, -20.615234375, -19.20068359375, -17.7861328125, -16.37158203125, -14.95703125, -13.54248046875, -12.1279296875, -10.71337890625, -9.298828125, -7.88427734375, -6.4697265625, -5.05517578125, -3.640625, -2.22607421875, -0.8115234375, 0.60302734375, 2.017578125, 3.43212890625, 4.8466796875, 6.26123046875, 7.67578125, 9.09033203125, 10.5048828125, 11.91943359375, 13.333984375, 14.74853515625, 16.1630859375, 17.57763671875, 18.9921875, 20.40673828125, 21.8212890625, 23.23583984375, 24.650390625, 26.06494140625, 27.4794921875, 28.89404296875, 30.30859375, 31.72314453125, 33.1376953125, 34.55224609375, 35.966796875, 37.38134765625, 38.7958984375, 40.21044921875, 41.625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 18.0, 11.0, 34.0, 51.0, 82.0, 95.0, 176.0, 234.0, 363.0, 480.0, 771.0, 1203.0, 1691.0, 2710.0, 4122.0, 6366.0, 9583.0, 14575.0, 22382.0, 33160.0, 49379.0, 72091.0, 102292.0, 133654.0, 1197778.0, 131547.0, 99834.0, 69819.0, 47837.0, 32260.0, 21492.0, 14113.0, 9085.0, 6055.0, 4006.0, 2506.0, 1761.0, 1152.0, 794.0, 475.0, 348.0, 256.0, 144.0, 114.0, 79.0, 49.0, 32.0, 27.0, 15.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.42578125, -5.25860595703125, -5.0914306640625, -4.92425537109375, -4.757080078125, -4.58990478515625, -4.4227294921875, -4.25555419921875, -4.08837890625, -3.92120361328125, -3.7540283203125, -3.58685302734375, -3.419677734375, -3.25250244140625, -3.0853271484375, -2.91815185546875, -2.7509765625, -2.58380126953125, -2.4166259765625, -2.24945068359375, -2.082275390625, -1.91510009765625, -1.7479248046875, -1.58074951171875, -1.41357421875, -1.24639892578125, -1.0792236328125, -0.91204833984375, -0.744873046875, -0.57769775390625, -0.4105224609375, -0.24334716796875, -0.076171875, 0.09100341796875, 0.2581787109375, 0.42535400390625, 0.592529296875, 0.75970458984375, 0.9268798828125, 1.09405517578125, 1.26123046875, 1.42840576171875, 1.5955810546875, 1.76275634765625, 1.929931640625, 2.09710693359375, 2.2642822265625, 2.43145751953125, 2.5986328125, 2.76580810546875, 2.9329833984375, 3.10015869140625, 3.267333984375, 3.43450927734375, 3.6016845703125, 3.76885986328125, 3.93603515625, 4.10321044921875, 4.2703857421875, 4.43756103515625, 4.604736328125, 4.77191162109375, 4.9390869140625, 5.10626220703125, 5.2734375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 7.0, 12.0, 9.0, 11.0, 18.0, 29.0, 37.0, 74.0, 73.0, 118.0, 131.0, 145.0, 100.0, 77.0, 37.0, 25.0, 21.0, 17.0, 9.0, 9.0, 13.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07665729522705078, -0.07415199279785156, -0.07164669036865234, -0.06914138793945312, -0.0666360855102539, -0.06413078308105469, -0.06162548065185547, -0.05912017822265625, -0.05661487579345703, -0.05410957336425781, -0.051604270935058594, -0.049098968505859375, -0.046593666076660156, -0.04408836364746094, -0.04158306121826172, -0.0390777587890625, -0.03657245635986328, -0.03406715393066406, -0.031561851501464844, -0.029056549072265625, -0.026551246643066406, -0.024045944213867188, -0.02154064178466797, -0.01903533935546875, -0.01653003692626953, -0.014024734497070312, -0.011519432067871094, -0.009014129638671875, -0.006508827209472656, -0.0040035247802734375, -0.0014982223510742188, 0.001007080078125, 0.0035123825073242188, 0.0060176849365234375, 0.008522987365722656, 0.011028289794921875, 0.013533592224121094, 0.016038894653320312, 0.01854419708251953, 0.02104949951171875, 0.02355480194091797, 0.026060104370117188, 0.028565406799316406, 0.031070709228515625, 0.033576011657714844, 0.03608131408691406, 0.03858661651611328, 0.0410919189453125, 0.04359722137451172, 0.04610252380371094, 0.048607826232910156, 0.051113128662109375, 0.053618431091308594, 0.05612373352050781, 0.05862903594970703, 0.06113433837890625, 0.06363964080810547, 0.06614494323730469, 0.0686502456665039, 0.07115554809570312, 0.07366085052490234, 0.07616615295410156, 0.07867145538330078, 0.0811767578125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 4.0, 3.0, 4.0, 5.0, 15.0, 17.0, 20.0, 24.0, 30.0, 45.0, 79.0, 119.0, 242.0, 387.0, 779.0, 1663.0, 4374.0, 15527.0, 116238.0, 777088.0, 109169.0, 15105.0, 4224.0, 1649.0, 753.0, 399.0, 227.0, 113.0, 68.0, 45.0, 49.0, 24.0, 15.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.43603515625, -0.42218780517578125, -0.4083404541015625, -0.39449310302734375, -0.380645751953125, -0.36679840087890625, -0.3529510498046875, -0.33910369873046875, -0.32525634765625, -0.31140899658203125, -0.2975616455078125, -0.28371429443359375, -0.269866943359375, -0.25601959228515625, -0.2421722412109375, -0.22832489013671875, -0.2144775390625, -0.20063018798828125, -0.1867828369140625, -0.17293548583984375, -0.159088134765625, -0.14524078369140625, -0.1313934326171875, -0.11754608154296875, -0.10369873046875, -0.08985137939453125, -0.0760040283203125, -0.06215667724609375, -0.048309326171875, -0.03446197509765625, -0.0206146240234375, -0.00676727294921875, 0.007080078125, 0.02092742919921875, 0.0347747802734375, 0.04862213134765625, 0.062469482421875, 0.07631683349609375, 0.0901641845703125, 0.10401153564453125, 0.11785888671875, 0.13170623779296875, 0.1455535888671875, 0.15940093994140625, 0.173248291015625, 0.18709564208984375, 0.2009429931640625, 0.21479034423828125, 0.2286376953125, 0.24248504638671875, 0.2563323974609375, 0.27017974853515625, 0.284027099609375, 0.29787445068359375, 0.3117218017578125, 0.32556915283203125, 0.33941650390625, 0.35326385498046875, 0.3671112060546875, 0.38095855712890625, 0.394805908203125, 0.40865325927734375, 0.4225006103515625, 0.43634796142578125, 0.4501953125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 5.0, 5.0, 8.0, 9.0, 10.0, 19.0, 16.0, 42.0, 31.0, 55.0, 65.0, 88.0, 119.0, 109.0, 126.0, 74.0, 77.0, 40.0, 27.0, 16.0, 17.0, 12.0, 5.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06960821896791458, -0.06774312257766724, -0.06587802618741989, -0.06401292979717255, -0.0621478371322155, -0.060282740741968155, -0.05841764807701111, -0.05655255168676376, -0.05468745529651642, -0.052822358906269073, -0.05095726251602173, -0.04909216985106468, -0.04722707346081734, -0.04536197707056999, -0.043496884405612946, -0.0416317880153656, -0.039766691625118256, -0.03790159523487091, -0.036036498844623566, -0.03417140617966652, -0.032306309789419174, -0.03044121339917183, -0.028576118871569633, -0.026711024343967438, -0.024845927953720093, -0.022980831563472748, -0.021115737035870552, -0.019250642508268356, -0.01738554611802101, -0.015520450659096241, -0.01365535520017147, -0.0117902597412467, -0.009925168007612228, -0.008060072548687458, -0.006194977089762688, -0.004329881630837917, -0.002464786171913147, -0.0005996907129883766, 0.0012654047459363937, 0.003130500204861164, 0.0049955956637859344, 0.006860691122710705, 0.008725786581635475, 0.010590882040560246, 0.012455977499485016, 0.014321072958409786, 0.016186168417334557, 0.018051262944936752, 0.019916359335184097, 0.021781455725431442, 0.023646550253033638, 0.025511644780635834, 0.02737674117088318, 0.029241837561130524, 0.03110693208873272, 0.032972026616334915, 0.03483712300658226, 0.036702219396829605, 0.03856731206178665, 0.040432408452034, 0.04229750484228134, 0.044162601232528687, 0.04602769762277603, 0.04789279028773308, 0.04975788667798042]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 8.0, 5.0, 7.0, 9.0, 9.0, 11.0, 9.0, 13.0, 15.0, 18.0, 30.0, 22.0, 23.0, 29.0, 18.0, 30.0, 28.0, 30.0, 31.0, 42.0, 42.0, 42.0, 38.0, 36.0, 35.0, 35.0, 30.0, 28.0, 34.0, 32.0, 30.0, 39.0, 27.0, 22.0, 13.0, 20.0, 14.0, 17.0, 22.0, 10.0, 11.0, 8.0, 6.0, 9.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.03910249471664429, -0.03793303668498993, -0.03676357865333557, -0.03559412062168121, -0.034424662590026855, -0.0332552045583725, -0.03208574652671814, -0.030916288495063782, -0.029746830463409424, -0.028577372431755066, -0.027407914400100708, -0.02623845636844635, -0.025068998336791992, -0.023899540305137634, -0.022730082273483276, -0.02156062424182892, -0.02039116621017456, -0.019221708178520203, -0.018052250146865845, -0.016882792115211487, -0.01571333408355713, -0.014543876051902771, -0.013374418020248413, -0.012204959988594055, -0.011035501956939697, -0.00986604392528534, -0.008696585893630981, -0.0075271278619766235, -0.006357669830322266, -0.005188211798667908, -0.00401875376701355, -0.002849295735359192, -0.001679837703704834, -0.0005103796720504761, 0.0006590783596038818, 0.0018285363912582397, 0.0029979944229125977, 0.004167452454566956, 0.0053369104862213135, 0.006506368517875671, 0.007675826549530029, 0.008845284581184387, 0.010014742612838745, 0.011184200644493103, 0.012353658676147461, 0.013523116707801819, 0.014692574739456177, 0.015862032771110535, 0.017031490802764893, 0.01820094883441925, 0.01937040686607361, 0.020539864897727966, 0.021709322929382324, 0.022878780961036682, 0.02404823899269104, 0.025217697024345398, 0.026387155055999756, 0.027556613087654114, 0.02872607111930847, 0.02989552915096283, 0.031064987182617188, 0.032234445214271545, 0.0334039032459259, 0.03457336127758026, 0.03574281930923462]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 4.0, 12.0, 16.0, 24.0, 23.0, 28.0, 27.0, 28.0, 32.0, 40.0, 35.0, 41.0, 44.0, 56.0, 44.0, 41.0, 45.0, 54.0, 43.0, 33.0, 41.0, 45.0, 37.0, 35.0, 35.0, 20.0, 25.0, 15.0, 11.0, 13.0, 14.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.6875, -86.8623046875, -84.037109375, -81.2119140625, -78.38671875, -75.5615234375, -72.736328125, -69.9111328125, -67.0859375, -64.2607421875, -61.435546875, -58.6103515625, -55.78515625, -52.9599609375, -50.134765625, -47.3095703125, -44.484375, -41.6591796875, -38.833984375, -36.0087890625, -33.18359375, -30.3583984375, -27.533203125, -24.7080078125, -21.8828125, -19.0576171875, -16.232421875, -13.4072265625, -10.58203125, -7.7568359375, -4.931640625, -2.1064453125, 0.71875, 3.5439453125, 6.369140625, 9.1943359375, 12.01953125, 14.8447265625, 17.669921875, 20.4951171875, 23.3203125, 26.1455078125, 28.970703125, 31.7958984375, 34.62109375, 37.4462890625, 40.271484375, 43.0966796875, 45.921875, 48.7470703125, 51.572265625, 54.3974609375, 57.22265625, 60.0478515625, 62.873046875, 65.6982421875, 68.5234375, 71.3486328125, 74.173828125, 76.9990234375, 79.82421875, 82.6494140625, 85.474609375, 88.2998046875, 91.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 13.0, 13.0, 19.0, 37.0, 59.0, 75.0, 133.0, 186.0, 277.0, 421.0, 783.0, 1320.0, 2866.0, 6986.0, 22444.0, 99708.0, 427177.0, 372413.0, 82441.0, 19171.0, 6293.0, 2635.0, 1243.0, 676.0, 391.0, 234.0, 159.0, 95.0, 84.0, 69.0, 35.0, 25.0, 24.0, 13.0, 9.0, 3.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.8304443359375, -15.364013671875, -14.8975830078125, -14.43115234375, -13.9647216796875, -13.498291015625, -13.0318603515625, -12.5654296875, -12.0989990234375, -11.632568359375, -11.1661376953125, -10.69970703125, -10.2332763671875, -9.766845703125, -9.3004150390625, -8.833984375, -8.3675537109375, -7.901123046875, -7.4346923828125, -6.96826171875, -6.5018310546875, -6.035400390625, -5.5689697265625, -5.1025390625, -4.6361083984375, -4.169677734375, -3.7032470703125, -3.23681640625, -2.7703857421875, -2.303955078125, -1.8375244140625, -1.37109375, -0.9046630859375, -0.438232421875, 0.0281982421875, 0.49462890625, 0.9610595703125, 1.427490234375, 1.8939208984375, 2.3603515625, 2.8267822265625, 3.293212890625, 3.7596435546875, 4.22607421875, 4.6925048828125, 5.158935546875, 5.6253662109375, 6.091796875, 6.5582275390625, 7.024658203125, 7.4910888671875, 7.95751953125, 8.4239501953125, 8.890380859375, 9.3568115234375, 9.8232421875, 10.2896728515625, 10.756103515625, 11.2225341796875, 11.68896484375, 12.1553955078125, 12.621826171875, 13.0882568359375, 13.5546875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 5.0, 10.0, 12.0, 15.0, 19.0, 29.0, 28.0, 31.0, 40.0, 57.0, 75.0, 71.0, 70.0, 2092.0, 108.0, 76.0, 47.0, 51.0, 50.0, 30.0, 33.0, 21.0, 22.0, 14.0, 17.0, 9.0, 3.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-186.875, -181.498046875, -176.12109375, -170.744140625, -165.3671875, -159.990234375, -154.61328125, -149.236328125, -143.859375, -138.482421875, -133.10546875, -127.728515625, -122.3515625, -116.974609375, -111.59765625, -106.220703125, -100.84375, -95.466796875, -90.08984375, -84.712890625, -79.3359375, -73.958984375, -68.58203125, -63.205078125, -57.828125, -52.451171875, -47.07421875, -41.697265625, -36.3203125, -30.943359375, -25.56640625, -20.189453125, -14.8125, -9.435546875, -4.05859375, 1.318359375, 6.6953125, 12.072265625, 17.44921875, 22.826171875, 28.203125, 33.580078125, 38.95703125, 44.333984375, 49.7109375, 55.087890625, 60.46484375, 65.841796875, 71.21875, 76.595703125, 81.97265625, 87.349609375, 92.7265625, 98.103515625, 103.48046875, 108.857421875, 114.234375, 119.611328125, 124.98828125, 130.365234375, 135.7421875, 141.119140625, 146.49609375, 151.873046875, 157.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 9.0, 13.0, 8.0, 23.0, 35.0, 58.0, 73.0, 116.0, 167.0, 279.0, 562.0, 1360.0, 4368.0, 58454.0, 2979496.0, 92266.0, 5451.0, 1462.0, 648.0, 308.0, 175.0, 120.0, 81.0, 70.0, 30.0, 23.0, 15.0, 8.0, 8.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.46875, -33.302734375, -32.13671875, -30.970703125, -29.8046875, -28.638671875, -27.47265625, -26.306640625, -25.140625, -23.974609375, -22.80859375, -21.642578125, -20.4765625, -19.310546875, -18.14453125, -16.978515625, -15.8125, -14.646484375, -13.48046875, -12.314453125, -11.1484375, -9.982421875, -8.81640625, -7.650390625, -6.484375, -5.318359375, -4.15234375, -2.986328125, -1.8203125, -0.654296875, 0.51171875, 1.677734375, 2.84375, 4.009765625, 5.17578125, 6.341796875, 7.5078125, 8.673828125, 9.83984375, 11.005859375, 12.171875, 13.337890625, 14.50390625, 15.669921875, 16.8359375, 18.001953125, 19.16796875, 20.333984375, 21.5, 22.666015625, 23.83203125, 24.998046875, 26.1640625, 27.330078125, 28.49609375, 29.662109375, 30.828125, 31.994140625, 33.16015625, 34.326171875, 35.4921875, 36.658203125, 37.82421875, 38.990234375, 40.15625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [5.0, 4.0, 9.0, 21.0, 224.0, 481.0, 196.0, 39.0, 17.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.66000366210938, -89.31739044189453, -68.97477722167969, -48.632164001464844, -28.28955078125, -7.946937561035156, 12.395675659179688, 32.73828125, 53.080902099609375, 73.42351531982422, 93.76612854003906, 114.1087417602539, 134.45135498046875, 154.79397583007812, 175.13658142089844, 195.47918701171875, 215.82180786132812, 236.1644287109375, 256.50701904296875, 276.8496398925781, 297.1922607421875, 317.5348815917969, 337.87750244140625, 358.2200927734375, 378.5627136230469, 398.90533447265625, 419.2479248046875, 439.5905456542969, 459.93316650390625, 480.2757873535156, 500.618408203125, 520.9609985351562, 541.3035888671875, 561.6461791992188, 581.9888305664062, 602.3314208984375, 622.674072265625, 643.0166625976562, 663.3592529296875, 683.701904296875, 704.0444946289062, 724.3870849609375, 744.729736328125, 765.0723266601562, 785.4149169921875, 805.757568359375, 826.1001586914062, 846.4427490234375, 866.785400390625, 887.1279907226562, 907.4706420898438, 927.813232421875, 948.1558837890625, 968.4984741210938, 988.841064453125, 1009.1837158203125, 1029.5263671875, 1049.8690185546875, 1070.2115478515625, 1090.55419921875, 1110.8968505859375, 1131.2393798828125, 1151.58203125, 1171.9246826171875, 1192.2672119140625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 8.0, 14.0, 13.0, 11.0, 17.0, 16.0, 27.0, 20.0, 24.0, 35.0, 44.0, 35.0, 41.0, 49.0, 42.0, 50.0, 48.0, 43.0, 41.0, 52.0, 46.0, 40.0, 49.0, 37.0, 28.0, 27.0, 22.0, 27.0, 22.0, 14.0, 13.0, 4.0, 8.0, 13.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-164.3860626220703, -159.03541564941406, -153.6847686767578, -148.33412170410156, -142.9834747314453, -137.63282775878906, -132.28219604492188, -126.9315414428711, -121.58089447021484, -116.2302474975586, -110.87960052490234, -105.52896118164062, -100.17831420898438, -94.82766723632812, -89.47702026367188, -84.12637329101562, -78.77572631835938, -73.42507934570312, -68.07443237304688, -62.72378921508789, -57.37314224243164, -52.02249526977539, -46.671852111816406, -41.321205139160156, -35.970558166503906, -30.619911193847656, -25.26926612854004, -19.918621063232422, -14.567974090576172, -9.217327117919922, -3.8666839599609375, 1.4839630126953125, 6.834625244140625, 12.185271263122559, 17.535917282104492, 22.88656234741211, 28.23720932006836, 33.58785629272461, 38.938499450683594, 44.289146423339844, 49.639793395996094, 54.990440368652344, 60.341087341308594, 65.69172668457031, 71.04237365722656, 76.39302062988281, 81.74366760253906, 87.09431457519531, 92.44496154785156, 97.79560852050781, 103.14625549316406, 108.49690246582031, 113.84754943847656, 119.19819641113281, 124.54883575439453, 129.89947509765625, 135.2501220703125, 140.60076904296875, 145.951416015625, 151.30206298828125, 156.6527099609375, 162.00335693359375, 167.35400390625, 172.70465087890625, 178.0552978515625]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 6.0, 16.0, 14.0, 19.0, 32.0, 27.0, 50.0, 69.0, 110.0, 138.0, 174.0, 213.0, 306.0, 353.0, 514.0, 723.0, 1120.0, 1040177.0, 1352.0, 822.0, 601.0, 416.0, 302.0, 257.0, 181.0, 154.0, 111.0, 97.0, 54.0, 42.0, 31.0, 28.0, 9.0, 14.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.704925537109375, -57.98390197753906, -56.26287841796875, -54.54185485839844, -52.820831298828125, -51.09980773925781, -49.3787841796875, -47.65776062011719, -45.936737060546875, -44.21571350097656, -42.49468994140625, -40.77366638183594, -39.052642822265625, -37.33161926269531, -35.610595703125, -33.88957214355469, -32.16854476928711, -30.447521209716797, -28.726497650146484, -27.005474090576172, -25.28445053100586, -23.563426971435547, -21.8424015045166, -20.12137794494629, -18.400354385375977, -16.679330825805664, -14.958307266235352, -13.237282752990723, -11.51625919342041, -9.795235633850098, -8.074211120605469, -6.353187561035156, -4.632160186767578, -2.9111363887786865, -1.190112590789795, 0.5309114456176758, 2.2519350051879883, 3.972958564758301, 5.69398307800293, 7.415006637573242, 9.136030197143555, 10.857053756713867, 12.57807731628418, 14.299101829528809, 16.020126342773438, 17.74114990234375, 19.462173461914062, 21.183197021484375, 22.904220581054688, 24.625244140625, 26.346267700195312, 28.067291259765625, 29.788314819335938, 31.50933837890625, 33.23036193847656, 34.951385498046875, 36.67240905761719, 38.3934326171875, 40.11445617675781, 41.835479736328125, 43.55650329589844, 45.27752685546875, 46.99855041503906, 48.719573974609375, 50.44060134887695]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 8.0, 12.0, 24.0, 21.0, 52.0, 126.0, 51442200.0, 20614.0, 69.0, 23.0, 28.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3162.0, -3048.893310546875, -2935.786376953125, -2822.6796875, -2709.572998046875, -2596.46630859375, -2483.359375, -2370.252685546875, -2257.14599609375, -2144.039306640625, -2030.9324951171875, -1917.82568359375, -1804.718994140625, -1691.6121826171875, -1578.50537109375, -1465.398681640625, -1352.2918701171875, -1239.18505859375, -1126.078369140625, -1012.9715576171875, -899.8648681640625, -786.758056640625, -673.6513061523438, -560.5445556640625, -447.43780517578125, -334.3310546875, -221.2242889404297, -108.11752319335938, 4.989227294921875, 118.09600830078125, 231.2027587890625, 344.30950927734375, 457.416259765625, 570.5230102539062, 683.6297607421875, 796.736572265625, 909.84326171875, 1022.9500732421875, 1136.056884765625, 1249.16357421875, 1362.270263671875, 1475.3770751953125, 1588.4837646484375, 1701.590576171875, 1814.697265625, 1927.8040771484375, 2040.910888671875, 2154.017578125, 2267.12451171875, 2380.231201171875, 2493.338134765625, 2606.44482421875, 2719.551513671875, 2832.658203125, 2945.76513671875, 3058.871826171875, 3171.978515625, 3285.085205078125, 3398.192138671875, 3511.298828125, 3624.405517578125, 3737.51220703125, 3850.619140625, 3963.725830078125, 4076.83251953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 2.0, 9.0, 9.0, 7.0, 7.0, 6.0, 12.0, 22.0, 31.0, 44.0, 79.0, 104.0, 190.0, 302.0, 480.0, 830.0, 1430.0, 2580.0, 4493.0, 7842.0, 13395.0, 23436.0, 40546.0, 69810.0, 117911.0, 196482.0, 311578.0, 457738.0, 3589372.0, 548432.0, 349314.0, 224869.0, 136896.0, 80795.0, 47366.0, 27270.0, 15961.0, 9100.0, 5254.0, 3081.0, 1697.0, 1059.0, 618.0, 387.0, 213.0, 134.0, 105.0, 54.0, 39.0, 21.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.896484375, -1.8365478515625, -1.776611328125, -1.7166748046875, -1.65673828125, -1.5968017578125, -1.536865234375, -1.4769287109375, -1.4169921875, -1.3570556640625, -1.297119140625, -1.2371826171875, -1.17724609375, -1.1173095703125, -1.057373046875, -0.9974365234375, -0.9375, -0.8775634765625, -0.817626953125, -0.7576904296875, -0.69775390625, -0.6378173828125, -0.577880859375, -0.5179443359375, -0.4580078125, -0.3980712890625, -0.338134765625, -0.2781982421875, -0.21826171875, -0.1583251953125, -0.098388671875, -0.0384521484375, 0.021484375, 0.0814208984375, 0.141357421875, 0.2012939453125, 0.26123046875, 0.3211669921875, 0.381103515625, 0.4410400390625, 0.5009765625, 0.5609130859375, 0.620849609375, 0.6807861328125, 0.74072265625, 0.8006591796875, 0.860595703125, 0.9205322265625, 0.98046875, 1.0404052734375, 1.100341796875, 1.1602783203125, 1.22021484375, 1.2801513671875, 1.340087890625, 1.4000244140625, 1.4599609375, 1.5198974609375, 1.579833984375, 1.6397705078125, 1.69970703125, 1.7596435546875, 1.819580078125, 1.8795166015625, 1.939453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 6.0, 12.0, 12.0, 12.0, 5.0, 19.0, 25.0, 19.0, 17.0, 21.0, 21.0, 25.0, 33.0, 34.0, 33.0, 36.0, 39.0, 48.0, 147.0, 904.0, 89.0, 38.0, 40.0, 49.0, 32.0, 31.0, 31.0, 27.0, 24.0, 30.0, 25.0, 23.0, 21.0, 14.0, 17.0, 18.0, 7.0, 9.0, 4.0, 4.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-21.703125, -21.092041015625, -20.48095703125, -19.869873046875, -19.2587890625, -18.647705078125, -18.03662109375, -17.425537109375, -16.814453125, -16.203369140625, -15.59228515625, -14.981201171875, -14.3701171875, -13.759033203125, -13.14794921875, -12.536865234375, -11.92578125, -11.314697265625, -10.70361328125, -10.092529296875, -9.4814453125, -8.870361328125, -8.25927734375, -7.648193359375, -7.037109375, -6.426025390625, -5.81494140625, -5.203857421875, -4.5927734375, -3.981689453125, -3.37060546875, -2.759521484375, -2.1484375, -1.537353515625, -0.92626953125, -0.315185546875, 0.2958984375, 0.906982421875, 1.51806640625, 2.129150390625, 2.740234375, 3.351318359375, 3.96240234375, 4.573486328125, 5.1845703125, 5.795654296875, 6.40673828125, 7.017822265625, 7.62890625, 8.239990234375, 8.85107421875, 9.462158203125, 10.0732421875, 10.684326171875, 11.29541015625, 11.906494140625, 12.517578125, 13.128662109375, 13.73974609375, 14.350830078125, 14.9619140625, 15.572998046875, 16.18408203125, 16.795166015625, 17.40625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 8.0, 16.0, 22.0, 37.0, 58.0, 76.0, 139.0, 195.0, 336.0, 510.0, 734.0, 1118.0, 1656.0, 2627.0, 3849.0, 5813.0, 8522.0, 13056.0, 19488.0, 29082.0, 43415.0, 63441.0, 92166.0, 132381.0, 185137.0, 248741.0, 313086.0, 876167.0, 2978044.0, 335242.0, 266762.0, 202920.0, 147560.0, 103696.0, 71039.0, 48425.0, 32238.0, 21536.0, 14412.0, 9392.0, 6123.0, 4155.0, 2676.0, 1769.0, 1175.0, 806.0, 546.0, 347.0, 248.0, 163.0, 108.0, 72.0, 35.0, 32.0, 13.0, 15.0, 8.0, 3.0, 4.0, 3.0, 3.0], "bins": [-1.1748046875, -1.1371002197265625, -1.099395751953125, -1.0616912841796875, -1.02398681640625, -0.9862823486328125, -0.948577880859375, -0.9108734130859375, -0.8731689453125, -0.8354644775390625, -0.797760009765625, -0.7600555419921875, -0.72235107421875, -0.6846466064453125, -0.646942138671875, -0.6092376708984375, -0.571533203125, -0.5338287353515625, -0.496124267578125, -0.4584197998046875, -0.42071533203125, -0.3830108642578125, -0.345306396484375, -0.3076019287109375, -0.2698974609375, -0.2321929931640625, -0.194488525390625, -0.1567840576171875, -0.11907958984375, -0.0813751220703125, -0.043670654296875, -0.0059661865234375, 0.03173828125, 0.0694427490234375, 0.107147216796875, 0.1448516845703125, 0.18255615234375, 0.2202606201171875, 0.257965087890625, 0.2956695556640625, 0.3333740234375, 0.3710784912109375, 0.408782958984375, 0.4464874267578125, 0.48419189453125, 0.5218963623046875, 0.559600830078125, 0.5973052978515625, 0.635009765625, 0.6727142333984375, 0.710418701171875, 0.7481231689453125, 0.78582763671875, 0.8235321044921875, 0.861236572265625, 0.8989410400390625, 0.9366455078125, 0.9743499755859375, 1.012054443359375, 1.0497589111328125, 1.08746337890625, 1.1251678466796875, 1.162872314453125, 1.2005767822265625, 1.23828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 4.0, 6.0, 6.0, 6.0, 5.0, 14.0, 15.0, 11.0, 13.0, 19.0, 22.0, 29.0, 24.0, 26.0, 32.0, 23.0, 34.0, 28.0, 39.0, 25.0, 44.0, 610.0, 472.0, 41.0, 40.0, 34.0, 42.0, 27.0, 26.0, 44.0, 26.0, 32.0, 29.0, 26.0, 16.0, 26.0, 15.0, 19.0, 14.0, 12.0, 13.0, 11.0, 2.0, 5.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-18.15625, -17.6064453125, -17.056640625, -16.5068359375, -15.95703125, -15.4072265625, -14.857421875, -14.3076171875, -13.7578125, -13.2080078125, -12.658203125, -12.1083984375, -11.55859375, -11.0087890625, -10.458984375, -9.9091796875, -9.359375, -8.8095703125, -8.259765625, -7.7099609375, -7.16015625, -6.6103515625, -6.060546875, -5.5107421875, -4.9609375, -4.4111328125, -3.861328125, -3.3115234375, -2.76171875, -2.2119140625, -1.662109375, -1.1123046875, -0.5625, -0.0126953125, 0.537109375, 1.0869140625, 1.63671875, 2.1865234375, 2.736328125, 3.2861328125, 3.8359375, 4.3857421875, 4.935546875, 5.4853515625, 6.03515625, 6.5849609375, 7.134765625, 7.6845703125, 8.234375, 8.7841796875, 9.333984375, 9.8837890625, 10.43359375, 10.9833984375, 11.533203125, 12.0830078125, 12.6328125, 13.1826171875, 13.732421875, 14.2822265625, 14.83203125, 15.3818359375, 15.931640625, 16.4814453125, 17.03125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 8.0, 14.0, 17.0, 20.0, 33.0, 35.0, 56.0, 83.0, 109.0, 176.0, 265.0, 569.0, 1074.0, 2039.0, 4443.0, 9723.0, 22330.0, 53366.0, 135735.0, 5777011.0, 168911.0, 66065.0, 26652.0, 11904.0, 5380.0, 2568.0, 1233.0, 614.0, 363.0, 185.0, 121.0, 89.0, 68.0, 43.0, 26.0, 26.0, 18.0, 10.0, 9.0, 5.0, 9.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.515625, -8.26959228515625, -8.0235595703125, -7.77752685546875, -7.531494140625, -7.28546142578125, -7.0394287109375, -6.79339599609375, -6.54736328125, -6.30133056640625, -6.0552978515625, -5.80926513671875, -5.563232421875, -5.31719970703125, -5.0711669921875, -4.82513427734375, -4.5791015625, -4.33306884765625, -4.0870361328125, -3.84100341796875, -3.594970703125, -3.34893798828125, -3.1029052734375, -2.85687255859375, -2.61083984375, -2.36480712890625, -2.1187744140625, -1.87274169921875, -1.626708984375, -1.38067626953125, -1.1346435546875, -0.88861083984375, -0.642578125, -0.39654541015625, -0.1505126953125, 0.09552001953125, 0.341552734375, 0.58758544921875, 0.8336181640625, 1.07965087890625, 1.32568359375, 1.57171630859375, 1.8177490234375, 2.06378173828125, 2.309814453125, 2.55584716796875, 2.8018798828125, 3.04791259765625, 3.2939453125, 3.53997802734375, 3.7860107421875, 4.03204345703125, 4.278076171875, 4.52410888671875, 4.7701416015625, 5.01617431640625, 5.26220703125, 5.50823974609375, 5.7542724609375, 6.00030517578125, 6.246337890625, 6.49237060546875, 6.7384033203125, 6.98443603515625, 7.23046875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 7.0, 7.0, 7.0, 8.0, 16.0, 17.0, 21.0, 27.0, 24.0, 28.0, 27.0, 38.0, 32.0, 38.0, 54.0, 45.0, 41.0, 169.0, 953.0, 41.0, 53.0, 30.0, 38.0, 41.0, 35.0, 33.0, 31.0, 29.0, 36.0, 15.0, 21.0, 11.0, 18.0, 15.0, 10.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.765625, -26.0078125, -25.25, -24.4921875, -23.734375, -22.9765625, -22.21875, -21.4609375, -20.703125, -19.9453125, -19.1875, -18.4296875, -17.671875, -16.9140625, -16.15625, -15.3984375, -14.640625, -13.8828125, -13.125, -12.3671875, -11.609375, -10.8515625, -10.09375, -9.3359375, -8.578125, -7.8203125, -7.0625, -6.3046875, -5.546875, -4.7890625, -4.03125, -3.2734375, -2.515625, -1.7578125, -1.0, -0.2421875, 0.515625, 1.2734375, 2.03125, 2.7890625, 3.546875, 4.3046875, 5.0625, 5.8203125, 6.578125, 7.3359375, 8.09375, 8.8515625, 9.609375, 10.3671875, 11.125, 11.8828125, 12.640625, 13.3984375, 14.15625, 14.9140625, 15.671875, 16.4296875, 17.1875, 17.9453125, 18.703125, 19.4609375, 20.21875, 20.9765625, 21.734375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 10.0, 18.0, 50.0, 195.0, 483.0, 172.0, 52.0, 13.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.42251586914062, -95.8067855834961, -92.19105529785156, -88.57533264160156, -84.95960235595703, -81.3438720703125, -77.72814178466797, -74.11241149902344, -70.49668884277344, -66.8809585571289, -63.26523208618164, -59.64950180053711, -56.033775329589844, -52.41804504394531, -48.80231475830078, -45.186588287353516, -41.570858001708984, -37.95512771606445, -34.33940124511719, -30.723670959472656, -27.10794448852539, -23.49221420288086, -19.87648582458496, -16.260757446289062, -12.645029067993164, -9.029300689697266, -5.413571834564209, -1.7978429794311523, 1.817885398864746, 5.433614730834961, 9.04934310913086, 12.665071487426758, 16.280799865722656, 19.896528244018555, 23.512256622314453, 27.127986907958984, 30.74371337890625, 34.35944366455078, 37.97517395019531, 41.59090042114258, 45.206626892089844, 48.822357177734375, 52.43808364868164, 56.05381393432617, 59.66954040527344, 63.28527069091797, 66.9010009765625, 70.5167236328125, 74.13246154785156, 77.7481918334961, 81.36392211914062, 84.97964477539062, 88.59537506103516, 92.21110534667969, 95.82683563232422, 99.44256591796875, 103.05828857421875, 106.67401885986328, 110.28974914550781, 113.90547180175781, 117.52120208740234, 121.13693237304688, 124.7526626586914, 128.36839294433594, 131.98411560058594]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 2.0, 7.0, 12.0, 15.0, 25.0, 32.0, 33.0, 65.0, 72.0, 78.0, 79.0, 87.0, 81.0, 90.0, 73.0, 68.0, 46.0, 41.0, 26.0, 16.0, 14.0, 12.0, 13.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.66326904296875, -97.94090270996094, -95.2185287475586, -92.49615478515625, -89.77378845214844, -87.05142211914062, -84.32904815673828, -81.60667419433594, -78.88430786132812, -76.16194152832031, -73.43956756591797, -70.71719360351562, -67.99482727050781, -65.2724609375, -62.550086975097656, -59.82771682739258, -57.1053466796875, -54.38297653198242, -51.660606384277344, -48.938236236572266, -46.21586608886719, -43.49349594116211, -40.77112579345703, -38.04875564575195, -35.326385498046875, -32.6040153503418, -29.88164520263672, -27.15927505493164, -24.436904907226562, -21.714534759521484, -18.992164611816406, -16.269794464111328, -13.547431945800781, -10.825061798095703, -8.102691650390625, -5.380321502685547, -2.6579513549804688, 0.06441879272460938, 2.7867889404296875, 5.509159088134766, 8.231529235839844, 10.953899383544922, 13.67626953125, 16.398639678955078, 19.121009826660156, 21.843379974365234, 24.565750122070312, 27.28812026977539, 30.01049041748047, 32.73286056518555, 35.455230712890625, 38.1776008605957, 40.89997100830078, 43.62234115600586, 46.34471130371094, 49.067081451416016, 51.789451599121094, 54.51182174682617, 57.23419189453125, 59.95656204223633, 62.678932189941406, 65.40130615234375, 68.12367248535156, 70.84603881835938, 73.56841278076172]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 8.0, 14.0, 16.0, 21.0, 27.0, 40.0, 39.0, 63.0, 89.0, 142.0, 154.0, 221.0, 340.0, 492.0, 831.0, 1268.0, 2292.0, 4226.0, 9233.0, 24773.0, 128817.0, 3925656.0, 64289.0, 16933.0, 6798.0, 3211.0, 1655.0, 934.0, 591.0, 364.0, 231.0, 147.0, 96.0, 87.0, 36.0, 43.0, 15.0, 23.0, 10.0, 15.0, 3.0, 4.0, 2.0, 10.0, 5.0, 3.0, 2.0, 1.0], "bins": [-0.50537109375, -0.4918365478515625, -0.478302001953125, -0.4647674560546875, -0.45123291015625, -0.4376983642578125, -0.424163818359375, -0.4106292724609375, -0.3970947265625, -0.3835601806640625, -0.370025634765625, -0.3564910888671875, -0.34295654296875, -0.3294219970703125, -0.315887451171875, -0.3023529052734375, -0.288818359375, -0.2752838134765625, -0.261749267578125, -0.2482147216796875, -0.23468017578125, -0.2211456298828125, -0.207611083984375, -0.1940765380859375, -0.1805419921875, -0.1670074462890625, -0.153472900390625, -0.1399383544921875, -0.12640380859375, -0.1128692626953125, -0.099334716796875, -0.0858001708984375, -0.072265625, -0.0587310791015625, -0.045196533203125, -0.0316619873046875, -0.01812744140625, -0.0045928955078125, 0.008941650390625, 0.0224761962890625, 0.0360107421875, 0.0495452880859375, 0.063079833984375, 0.0766143798828125, 0.09014892578125, 0.1036834716796875, 0.117218017578125, 0.1307525634765625, 0.144287109375, 0.1578216552734375, 0.171356201171875, 0.1848907470703125, 0.19842529296875, 0.2119598388671875, 0.225494384765625, 0.2390289306640625, 0.2525634765625, 0.2660980224609375, 0.279632568359375, 0.2931671142578125, 0.30670166015625, 0.3202362060546875, 0.333770751953125, 0.3473052978515625, 0.36083984375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 4.0, 5.0, 6.0, 7.0, 10.0, 18.0, 14.0, 16.0, 62.0, 729.0, 22.0, 19.0, 8.0, 11.0, 13.0, 10.0, 5.0, 1.0, 4.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.3526649475097656, -0.34229278564453125, -0.3319206237792969, -0.3215484619140625, -0.3111763000488281, -0.30080413818359375, -0.2904319763183594, -0.280059814453125, -0.2696876525878906, -0.25931549072265625, -0.24894332885742188, -0.2385711669921875, -0.22819900512695312, -0.21782684326171875, -0.20745468139648438, -0.19708251953125, -0.18671035766601562, -0.17633819580078125, -0.16596603393554688, -0.1555938720703125, -0.14522171020507812, -0.13484954833984375, -0.12447738647460938, -0.114105224609375, -0.10373306274414062, -0.09336090087890625, -0.08298873901367188, -0.0726165771484375, -0.062244415283203125, -0.05187225341796875, -0.041500091552734375, -0.0311279296875, -0.020755767822265625, -0.01038360595703125, -1.1444091796875e-05, 0.0103607177734375, 0.020732879638671875, 0.03110504150390625, 0.041477203369140625, 0.051849365234375, 0.062221527099609375, 0.07259368896484375, 0.08296585083007812, 0.0933380126953125, 0.10371017456054688, 0.11408233642578125, 0.12445449829101562, 0.13482666015625, 0.14519882202148438, 0.15557098388671875, 0.16594314575195312, 0.1763153076171875, 0.18668746948242188, 0.19705963134765625, 0.20743179321289062, 0.217803955078125, 0.22817611694335938, 0.23854827880859375, 0.24892044067382812, 0.2592926025390625, 0.2696647644042969, 0.28003692626953125, 0.2904090881347656, 0.30078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 6.0, 8.0, 13.0, 9.0, 10.0, 18.0, 12.0, 38.0, 62.0, 85.0, 122.0, 185.0, 335.0, 529.0, 1110.0, 2651.0, 7738.0, 31811.0, 301549.0, 3687900.0, 133500.0, 18621.0, 4885.0, 1686.0, 649.0, 308.0, 168.0, 102.0, 66.0, 39.0, 19.0, 13.0, 11.0, 11.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6875, -0.6685943603515625, -0.649688720703125, -0.6307830810546875, -0.61187744140625, -0.5929718017578125, -0.574066162109375, -0.5551605224609375, -0.5362548828125, -0.5173492431640625, -0.498443603515625, -0.4795379638671875, -0.46063232421875, -0.4417266845703125, -0.422821044921875, -0.4039154052734375, -0.385009765625, -0.3661041259765625, -0.347198486328125, -0.3282928466796875, -0.30938720703125, -0.2904815673828125, -0.271575927734375, -0.2526702880859375, -0.2337646484375, -0.2148590087890625, -0.195953369140625, -0.1770477294921875, -0.15814208984375, -0.1392364501953125, -0.120330810546875, -0.1014251708984375, -0.08251953125, -0.0636138916015625, -0.044708251953125, -0.0258026123046875, -0.00689697265625, 0.0120086669921875, 0.030914306640625, 0.0498199462890625, 0.0687255859375, 0.0876312255859375, 0.106536865234375, 0.1254425048828125, 0.14434814453125, 0.1632537841796875, 0.182159423828125, 0.2010650634765625, 0.219970703125, 0.2388763427734375, 0.257781982421875, 0.2766876220703125, 0.29559326171875, 0.3144989013671875, 0.333404541015625, 0.3523101806640625, 0.3712158203125, 0.3901214599609375, 0.409027099609375, 0.4279327392578125, 0.44683837890625, 0.4657440185546875, 0.484649658203125, 0.5035552978515625, 0.5224609375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 16.0, 18.0, 21.0, 38.0, 42.0, 58.0, 99.0, 160.0, 347.0, 930.0, 1397.0, 396.0, 185.0, 101.0, 69.0, 47.0, 31.0, 31.0, 10.0, 12.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.349853515625, -0.3413505554199219, -0.33284759521484375, -0.3243446350097656, -0.3158416748046875, -0.3073387145996094, -0.29883575439453125, -0.2903327941894531, -0.281829833984375, -0.2733268737792969, -0.26482391357421875, -0.2563209533691406, -0.2478179931640625, -0.23931503295898438, -0.23081207275390625, -0.22230911254882812, -0.21380615234375, -0.20530319213867188, -0.19680023193359375, -0.18829727172851562, -0.1797943115234375, -0.17129135131835938, -0.16278839111328125, -0.15428543090820312, -0.145782470703125, -0.13727951049804688, -0.12877655029296875, -0.12027359008789062, -0.1117706298828125, -0.10326766967773438, -0.09476470947265625, -0.08626174926757812, -0.0777587890625, -0.06925582885742188, -0.06075286865234375, -0.052249908447265625, -0.0437469482421875, -0.035243988037109375, -0.02674102783203125, -0.018238067626953125, -0.009735107421875, -0.001232147216796875, 0.00727081298828125, 0.015773773193359375, 0.0242767333984375, 0.032779693603515625, 0.04128265380859375, 0.049785614013671875, 0.05828857421875, 0.06679153442382812, 0.07529449462890625, 0.08379745483398438, 0.0923004150390625, 0.10080337524414062, 0.10930633544921875, 0.11780929565429688, 0.126312255859375, 0.13481521606445312, 0.14331817626953125, 0.15182113647460938, 0.1603240966796875, 0.16882705688476562, 0.17733001708984375, 0.18583297729492188, 0.1943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 9.0, 42.0, 214.0, 586.0, 126.0, 18.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.585526466369629, -6.462272644042969, -6.339018821716309, -6.21576452255249, -6.09251070022583, -5.96925687789917, -5.846002578735352, -5.722748756408691, -5.599494934082031, -5.476241111755371, -5.352987289428711, -5.229732990264893, -5.106479167938232, -4.983225345611572, -4.859971046447754, -4.736717224121094, -4.613463401794434, -4.490209579467773, -4.366955757141113, -4.243701457977295, -4.120447635650635, -3.9971938133239746, -3.8739397525787354, -3.750685691833496, -3.627431869506836, -3.504178047180176, -3.3809239864349365, -3.2576699256896973, -3.134416103363037, -3.011162281036377, -2.8879082202911377, -2.7646541595458984, -2.641400098800659, -2.51814603805542, -2.3948922157287598, -2.2716383934020996, -2.1483843326568604, -2.025130271911621, -1.901876449584961, -1.7786225080490112, -1.6553685665130615, -1.5321146249771118, -1.408860683441162, -1.2856067419052124, -1.1623528003692627, -1.039098858833313, -0.9158449172973633, -0.7925909757614136, -0.6693370342254639, -0.5460830926895142, -0.42282915115356445, -0.29957520961761475, -0.17632126808166504, -0.05306732654571533, 0.07018661499023438, 0.19344055652618408, 0.3166944980621338, 0.4399484395980835, 0.5632023811340332, 0.6864563226699829, 0.8097102642059326, 0.9329642057418823, 1.056218147277832, 1.1794720888137817, 1.3027260303497314]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 3.0, 11.0, 3.0, 9.0, 13.0, 15.0, 24.0, 23.0, 28.0, 20.0, 40.0, 37.0, 47.0, 52.0, 52.0, 54.0, 69.0, 66.0, 51.0, 50.0, 36.0, 36.0, 38.0, 41.0, 27.0, 35.0, 18.0, 21.0, 17.0, 7.0, 5.0, 7.0, 11.0, 7.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.082724690437317, -1.0506690740585327, -1.018613338470459, -0.98655766248703, -0.9545019865036011, -0.9224463701248169, -0.8903906941413879, -0.858335018157959, -0.82627934217453, -0.7942236661911011, -0.7621679902076721, -0.7301123142242432, -0.698056697845459, -0.6660009622573853, -0.6339453458786011, -0.6018896698951721, -0.5698339939117432, -0.5377783179283142, -0.5057226419448853, -0.4736669957637787, -0.44161131978034973, -0.4095556437969208, -0.3774999976158142, -0.34544432163238525, -0.3133886456489563, -0.28133296966552734, -0.24927730858325958, -0.21722164750099182, -0.18516597151756287, -0.1531102955341339, -0.12105463445186615, -0.08899897336959839, -0.05694335699081421, -0.02488768845796585, 0.007167980074882507, 0.039223648607730865, 0.07127931714057922, 0.10333499312400818, 0.13539065420627594, 0.1674463152885437, 0.19950199127197266, 0.2315576672554016, 0.26361334323883057, 0.29566898941993713, 0.3277246654033661, 0.35978034138679504, 0.3918359875679016, 0.42389166355133057, 0.4559473395347595, 0.4880030155181885, 0.5200586915016174, 0.5521143674850464, 0.5841699838638306, 0.6162257194519043, 0.6482813358306885, 0.6803370118141174, 0.7123926877975464, 0.7444483637809753, 0.7765040397644043, 0.8085597157478333, 0.8406153917312622, 0.8726710081100464, 0.9047266840934753, 0.9367823600769043, 0.9688380360603333]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 13.0, 7.0, 20.0, 16.0, 27.0, 44.0, 58.0, 73.0, 113.0, 147.0, 213.0, 316.0, 497.0, 703.0, 1192.0, 1890.0, 3164.0, 5839.0, 11296.0, 25084.0, 150109.0, 790389.0, 29105.0, 12798.0, 6232.0, 3498.0, 2024.0, 1217.0, 790.0, 538.0, 373.0, 230.0, 153.0, 99.0, 67.0, 47.0, 32.0, 30.0, 21.0, 28.0, 17.0, 14.0, 6.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2763671875, -1.2339324951171875, -1.191497802734375, -1.1490631103515625, -1.10662841796875, -1.0641937255859375, -1.021759033203125, -0.9793243408203125, -0.9368896484375, -0.8944549560546875, -0.852020263671875, -0.8095855712890625, -0.76715087890625, -0.7247161865234375, -0.682281494140625, -0.6398468017578125, -0.597412109375, -0.5549774169921875, -0.512542724609375, -0.4701080322265625, -0.42767333984375, -0.3852386474609375, -0.342803955078125, -0.3003692626953125, -0.2579345703125, -0.2154998779296875, -0.173065185546875, -0.1306304931640625, -0.08819580078125, -0.0457611083984375, -0.003326416015625, 0.0391082763671875, 0.08154296875, 0.1239776611328125, 0.166412353515625, 0.2088470458984375, 0.25128173828125, 0.2937164306640625, 0.336151123046875, 0.3785858154296875, 0.4210205078125, 0.4634552001953125, 0.505889892578125, 0.5483245849609375, 0.59075927734375, 0.6331939697265625, 0.675628662109375, 0.7180633544921875, 0.760498046875, 0.8029327392578125, 0.845367431640625, 0.8878021240234375, 0.93023681640625, 0.9726715087890625, 1.015106201171875, 1.0575408935546875, 1.0999755859375, 1.1424102783203125, 1.184844970703125, 1.2272796630859375, 1.26971435546875, 1.3121490478515625, 1.354583740234375, 1.3970184326171875, 1.439453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 3.0, 5.0, 8.0, 4.0, 5.0, 10.0, 7.0, 18.0, 16.0, 23.0, 545.0, 245.0, 18.0, 13.0, 12.0, 10.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35595703125, -0.3457183837890625, -0.335479736328125, -0.3252410888671875, -0.31500244140625, -0.3047637939453125, -0.294525146484375, -0.2842864990234375, -0.2740478515625, -0.2638092041015625, -0.253570556640625, -0.2433319091796875, -0.23309326171875, -0.2228546142578125, -0.212615966796875, -0.2023773193359375, -0.192138671875, -0.1819000244140625, -0.171661376953125, -0.1614227294921875, -0.15118408203125, -0.1409454345703125, -0.130706787109375, -0.1204681396484375, -0.1102294921875, -0.0999908447265625, -0.089752197265625, -0.0795135498046875, -0.06927490234375, -0.0590362548828125, -0.048797607421875, -0.0385589599609375, -0.0283203125, -0.0180816650390625, -0.007843017578125, 0.0023956298828125, 0.01263427734375, 0.0228729248046875, 0.033111572265625, 0.0433502197265625, 0.0535888671875, 0.0638275146484375, 0.074066162109375, 0.0843048095703125, 0.09454345703125, 0.1047821044921875, 0.115020751953125, 0.1252593994140625, 0.135498046875, 0.1457366943359375, 0.155975341796875, 0.1662139892578125, 0.17645263671875, 0.1866912841796875, 0.196929931640625, 0.2071685791015625, 0.2174072265625, 0.2276458740234375, 0.237884521484375, 0.2481231689453125, 0.25836181640625, 0.2686004638671875, 0.278839111328125, 0.2890777587890625, 0.29931640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 12.0, 12.0, 17.0, 33.0, 46.0, 43.0, 67.0, 101.0, 124.0, 179.0, 263.0, 430.0, 811.0, 1564.0, 3839.0, 10982.0, 35804.0, 148845.0, 571115.0, 206024.0, 45926.0, 13428.0, 4680.0, 1867.0, 882.0, 469.0, 292.0, 185.0, 149.0, 98.0, 79.0, 55.0, 40.0, 30.0, 20.0, 11.0, 14.0, 2.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8808135986328125, -0.852935791015625, -0.8250579833984375, -0.79718017578125, -0.7693023681640625, -0.741424560546875, -0.7135467529296875, -0.6856689453125, -0.6577911376953125, -0.629913330078125, -0.6020355224609375, -0.57415771484375, -0.5462799072265625, -0.518402099609375, -0.4905242919921875, -0.462646484375, -0.4347686767578125, -0.406890869140625, -0.3790130615234375, -0.35113525390625, -0.3232574462890625, -0.295379638671875, -0.2675018310546875, -0.2396240234375, -0.2117462158203125, -0.183868408203125, -0.1559906005859375, -0.12811279296875, -0.1002349853515625, -0.072357177734375, -0.0444793701171875, -0.0166015625, 0.0112762451171875, 0.039154052734375, 0.0670318603515625, 0.09490966796875, 0.1227874755859375, 0.150665283203125, 0.1785430908203125, 0.2064208984375, 0.2342987060546875, 0.262176513671875, 0.2900543212890625, 0.31793212890625, 0.3458099365234375, 0.373687744140625, 0.4015655517578125, 0.429443359375, 0.4573211669921875, 0.485198974609375, 0.5130767822265625, 0.54095458984375, 0.5688323974609375, 0.596710205078125, 0.6245880126953125, 0.6524658203125, 0.6803436279296875, 0.708221435546875, 0.7360992431640625, 0.76397705078125, 0.7918548583984375, 0.819732666015625, 0.8476104736328125, 0.87548828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 10.0, 14.0, 12.0, 13.0, 12.0, 21.0, 19.0, 18.0, 23.0, 31.0, 32.0, 32.0, 38.0, 37.0, 45.0, 45.0, 36.0, 43.0, 35.0, 40.0, 43.0, 36.0, 41.0, 29.0, 43.0, 35.0, 28.0, 29.0, 20.0, 21.0, 13.0, 19.0, 11.0, 6.0, 15.0, 11.0, 3.0, 6.0, 4.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0], "bins": [-1.1611328125, -1.129669189453125, -1.09820556640625, -1.066741943359375, -1.0352783203125, -1.003814697265625, -0.97235107421875, -0.940887451171875, -0.909423828125, -0.877960205078125, -0.84649658203125, -0.815032958984375, -0.7835693359375, -0.752105712890625, -0.72064208984375, -0.689178466796875, -0.65771484375, -0.626251220703125, -0.59478759765625, -0.563323974609375, -0.5318603515625, -0.500396728515625, -0.46893310546875, -0.437469482421875, -0.406005859375, -0.374542236328125, -0.34307861328125, -0.311614990234375, -0.2801513671875, -0.248687744140625, -0.21722412109375, -0.185760498046875, -0.154296875, -0.122833251953125, -0.09136962890625, -0.059906005859375, -0.0284423828125, 0.003021240234375, 0.03448486328125, 0.065948486328125, 0.097412109375, 0.128875732421875, 0.16033935546875, 0.191802978515625, 0.2232666015625, 0.254730224609375, 0.28619384765625, 0.317657470703125, 0.34912109375, 0.380584716796875, 0.41204833984375, 0.443511962890625, 0.4749755859375, 0.506439208984375, 0.53790283203125, 0.569366455078125, 0.600830078125, 0.632293701171875, 0.66375732421875, 0.695220947265625, 0.7266845703125, 0.758148193359375, 0.78961181640625, 0.821075439453125, 0.8525390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 8.0, 17.0, 26.0, 63.0, 96.0, 176.0, 427.0, 1266.0, 7531.0, 695594.0, 335202.0, 6268.0, 1110.0, 372.0, 164.0, 92.0, 50.0, 22.0, 18.0, 11.0, 12.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.697265625, -1.6457672119140625, -1.594268798828125, -1.5427703857421875, -1.49127197265625, -1.4397735595703125, -1.388275146484375, -1.3367767333984375, -1.2852783203125, -1.2337799072265625, -1.182281494140625, -1.1307830810546875, -1.07928466796875, -1.0277862548828125, -0.976287841796875, -0.9247894287109375, -0.873291015625, -0.8217926025390625, -0.770294189453125, -0.7187957763671875, -0.66729736328125, -0.6157989501953125, -0.564300537109375, -0.5128021240234375, -0.4613037109375, -0.4098052978515625, -0.358306884765625, -0.3068084716796875, -0.25531005859375, -0.2038116455078125, -0.152313232421875, -0.1008148193359375, -0.04931640625, 0.0021820068359375, 0.053680419921875, 0.1051788330078125, 0.15667724609375, 0.2081756591796875, 0.259674072265625, 0.3111724853515625, 0.3626708984375, 0.4141693115234375, 0.465667724609375, 0.5171661376953125, 0.56866455078125, 0.6201629638671875, 0.671661376953125, 0.7231597900390625, 0.774658203125, 0.8261566162109375, 0.877655029296875, 0.9291534423828125, 0.98065185546875, 1.0321502685546875, 1.083648681640625, 1.1351470947265625, 1.1866455078125, 1.2381439208984375, 1.289642333984375, 1.3411407470703125, 1.39263916015625, 1.4441375732421875, 1.495635986328125, 1.5471343994140625, 1.5986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 6.0, 15.0, 27.0, 45.0, 46.0, 91.0, 112.0, 166.0, 135.0, 127.0, 80.0, 40.0, 26.0, 19.0, 13.0, 9.0, 7.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.835294723510742e-05, -5.646608769893646e-05, -5.45792281627655e-05, -5.2692368626594543e-05, -5.0805509090423584e-05, -4.8918649554252625e-05, -4.7031790018081665e-05, -4.5144930481910706e-05, -4.3258070945739746e-05, -4.137121140956879e-05, -3.948435187339783e-05, -3.759749233722687e-05, -3.571063280105591e-05, -3.382377326488495e-05, -3.193691372871399e-05, -3.005005419254303e-05, -2.816319465637207e-05, -2.627633512020111e-05, -2.438947558403015e-05, -2.2502616047859192e-05, -2.0615756511688232e-05, -1.8728896975517273e-05, -1.6842037439346313e-05, -1.4955177903175354e-05, -1.3068318367004395e-05, -1.1181458830833435e-05, -9.294599294662476e-06, -7.407739758491516e-06, -5.520880222320557e-06, -3.634020686149597e-06, -1.7471611499786377e-06, 1.3969838619232178e-07, 2.0265579223632812e-06, 3.913417458534241e-06, 5.8002769947052e-06, 7.68713653087616e-06, 9.573996067047119e-06, 1.1460855603218079e-05, 1.3347715139389038e-05, 1.5234574675559998e-05, 1.7121434211730957e-05, 1.9008293747901917e-05, 2.0895153284072876e-05, 2.2782012820243835e-05, 2.4668872356414795e-05, 2.6555731892585754e-05, 2.8442591428756714e-05, 3.0329450964927673e-05, 3.221631050109863e-05, 3.410317003726959e-05, 3.599002957344055e-05, 3.787688910961151e-05, 3.976374864578247e-05, 4.165060818195343e-05, 4.353746771812439e-05, 4.542432725429535e-05, 4.731118679046631e-05, 4.919804632663727e-05, 5.108490586280823e-05, 5.297176539897919e-05, 5.4858624935150146e-05, 5.6745484471321106e-05, 5.8632344007492065e-05, 6.0519203543663025e-05, 6.240606307983398e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 7.0, 7.0, 3.0, 7.0, 9.0, 17.0, 20.0, 55.0, 71.0, 137.0, 235.0, 466.0, 922.0, 2187.0, 8165.0, 54676.0, 724909.0, 229456.0, 20150.0, 4191.0, 1444.0, 648.0, 356.0, 168.0, 100.0, 46.0, 35.0, 20.0, 13.0, 12.0, 8.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65673828125, -0.634674072265625, -0.61260986328125, -0.590545654296875, -0.5684814453125, -0.546417236328125, -0.52435302734375, -0.502288818359375, -0.480224609375, -0.458160400390625, -0.43609619140625, -0.414031982421875, -0.3919677734375, -0.369903564453125, -0.34783935546875, -0.325775146484375, -0.3037109375, -0.281646728515625, -0.25958251953125, -0.237518310546875, -0.2154541015625, -0.193389892578125, -0.17132568359375, -0.149261474609375, -0.127197265625, -0.105133056640625, -0.08306884765625, -0.061004638671875, -0.0389404296875, -0.016876220703125, 0.00518798828125, 0.027252197265625, 0.04931640625, 0.071380615234375, 0.09344482421875, 0.115509033203125, 0.1375732421875, 0.159637451171875, 0.18170166015625, 0.203765869140625, 0.225830078125, 0.247894287109375, 0.26995849609375, 0.292022705078125, 0.3140869140625, 0.336151123046875, 0.35821533203125, 0.380279541015625, 0.40234375, 0.424407958984375, 0.44647216796875, 0.468536376953125, 0.4906005859375, 0.512664794921875, 0.53472900390625, 0.556793212890625, 0.578857421875, 0.600921630859375, 0.62298583984375, 0.645050048828125, 0.6671142578125, 0.689178466796875, 0.71124267578125, 0.733306884765625, 0.75537109375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 7.0, 14.0, 19.0, 31.0, 39.0, 54.0, 71.0, 90.0, 95.0, 131.0, 118.0, 93.0, 78.0, 44.0, 38.0, 24.0, 16.0, 12.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.01239013671875, -0.9837646484375, -0.95513916015625, -0.926513671875, -0.89788818359375, -0.8692626953125, -0.84063720703125, -0.81201171875, -0.78338623046875, -0.7547607421875, -0.72613525390625, -0.697509765625, -0.66888427734375, -0.6402587890625, -0.61163330078125, -0.5830078125, -0.55438232421875, -0.5257568359375, -0.49713134765625, -0.468505859375, -0.43988037109375, -0.4112548828125, -0.38262939453125, -0.35400390625, -0.32537841796875, -0.2967529296875, -0.26812744140625, -0.239501953125, -0.21087646484375, -0.1822509765625, -0.15362548828125, -0.125, -0.09637451171875, -0.0677490234375, -0.03912353515625, -0.010498046875, 0.01812744140625, 0.0467529296875, 0.07537841796875, 0.10400390625, 0.13262939453125, 0.1612548828125, 0.18988037109375, 0.218505859375, 0.24713134765625, 0.2757568359375, 0.30438232421875, 0.3330078125, 0.36163330078125, 0.3902587890625, 0.41888427734375, 0.447509765625, 0.47613525390625, 0.5047607421875, 0.53338623046875, 0.56201171875, 0.59063720703125, 0.6192626953125, 0.64788818359375, 0.676513671875, 0.70513916015625, 0.7337646484375, 0.76239013671875, 0.791015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 9.0, 27.0, 68.0, 492.0, 346.0, 43.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.80778884887695, -41.896427154541016, -40.98506546020508, -40.073707580566406, -39.16234588623047, -38.25098419189453, -37.339622497558594, -36.428260803222656, -35.516902923583984, -34.60554122924805, -33.69417953491211, -32.78282165527344, -31.8714599609375, -30.960098266601562, -30.048736572265625, -29.13737678527832, -28.226015090942383, -27.314653396606445, -26.40329360961914, -25.491931915283203, -24.5805721282959, -23.66921043395996, -22.757850646972656, -21.84648895263672, -20.93512725830078, -20.023765563964844, -19.11240577697754, -18.2010440826416, -17.289684295654297, -16.37832260131836, -15.466961860656738, -14.555601119995117, -13.644241333007812, -12.732880592346191, -11.82151985168457, -10.910158157348633, -9.998798370361328, -9.08743667602539, -8.17607593536377, -7.264715194702148, -6.353354454040527, -5.441993713378906, -4.530632972717285, -3.619271755218506, -2.7079110145568848, -1.7965502738952637, -0.8851890563964844, 0.02617168426513672, 0.9375324249267578, 1.8488932847976685, 2.760254144668579, 3.6716151237487793, 4.5829758644104, 5.4943366050720215, 6.405697822570801, 7.317058563232422, 8.228419303894043, 9.139780044555664, 10.051140785217285, 10.962501525878906, 11.873863220214844, 12.785223007202148, 13.696584701538086, 14.607945442199707, 15.519306182861328]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 9.0, 7.0, 7.0, 7.0, 15.0, 23.0, 25.0, 50.0, 59.0, 86.0, 96.0, 130.0, 116.0, 110.0, 84.0, 43.0, 26.0, 15.0, 11.0, 13.0, 5.0, 8.0, 9.0, 8.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15753173828125, -16.574954986572266, -15.992377281188965, -15.409799575805664, -14.82722282409668, -14.244645118713379, -13.662067413330078, -13.079490661621094, -12.496912956237793, -11.914335250854492, -11.331758499145508, -10.749180793762207, -10.166603088378906, -9.584026336669922, -9.001448631286621, -8.41887092590332, -7.836294174194336, -7.253716945648193, -6.671139717102051, -6.08856201171875, -5.505984783172607, -4.923407554626465, -4.340829849243164, -3.7582526206970215, -3.175675392150879, -2.5930981636047363, -2.0105206966400146, -1.4279433488845825, -0.8453660011291504, -0.2627887725830078, 0.31978869438171387, 0.9023661613464355, 1.4849433898925781, 2.0675206184387207, 2.6500980854034424, 3.232675552368164, 3.8152527809143066, 4.397830009460449, 4.98040771484375, 5.562984943389893, 6.145562171936035, 6.728139400482178, 7.31071662902832, 7.893294334411621, 8.475872039794922, 9.058448791503906, 9.641026496887207, 10.223604202270508, 10.806180953979492, 11.388758659362793, 11.971335411071777, 12.553913116455078, 13.136489868164062, 13.719067573547363, 14.301645278930664, 14.884222030639648, 15.46679973602295, 16.04937744140625, 16.631954193115234, 17.21453094482422, 17.797109603881836, 18.37968635559082, 18.962263107299805, 19.544841766357422, 20.127418518066406]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 16.0, 6.0, 11.0, 19.0, 21.0, 30.0, 63.0, 131.0, 269.0, 701.0, 1771.0, 6351.0, 37020.0, 4003572.0, 127981.0, 11945.0, 2852.0, 886.0, 328.0, 145.0, 82.0, 39.0, 23.0, 13.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.871978759765625, -3.76934814453125, -3.666717529296875, -3.5640869140625, -3.461456298828125, -3.35882568359375, -3.256195068359375, -3.153564453125, -3.050933837890625, -2.94830322265625, -2.845672607421875, -2.7430419921875, -2.640411376953125, -2.53778076171875, -2.435150146484375, -2.33251953125, -2.229888916015625, -2.12725830078125, -2.024627685546875, -1.9219970703125, -1.819366455078125, -1.71673583984375, -1.614105224609375, -1.511474609375, -1.408843994140625, -1.30621337890625, -1.203582763671875, -1.1009521484375, -0.998321533203125, -0.89569091796875, -0.793060302734375, -0.6904296875, -0.587799072265625, -0.48516845703125, -0.382537841796875, -0.2799072265625, -0.177276611328125, -0.07464599609375, 0.027984619140625, 0.130615234375, 0.233245849609375, 0.33587646484375, 0.438507080078125, 0.5411376953125, 0.643768310546875, 0.74639892578125, 0.849029541015625, 0.95166015625, 1.054290771484375, 1.15692138671875, 1.259552001953125, 1.3621826171875, 1.464813232421875, 1.56744384765625, 1.670074462890625, 1.772705078125, 1.875335693359375, 1.97796630859375, 2.080596923828125, 2.1832275390625, 2.285858154296875, 2.38848876953125, 2.491119384765625, 2.59375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 4.0, 10.0, 12.0, 17.0, 15.0, 18.0, 39.0, 110.0, 355.0, 253.0, 63.0, 28.0, 17.0, 7.0, 10.0, 6.0, 12.0, 4.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34814453125, -0.33915138244628906, -0.3301582336425781, -0.3211650848388672, -0.31217193603515625, -0.3031787872314453, -0.2941856384277344, -0.28519248962402344, -0.2761993408203125, -0.26720619201660156, -0.2582130432128906, -0.2492198944091797, -0.24022674560546875, -0.2312335968017578, -0.22224044799804688, -0.21324729919433594, -0.204254150390625, -0.19526100158691406, -0.18626785278320312, -0.1772747039794922, -0.16828155517578125, -0.1592884063720703, -0.15029525756835938, -0.14130210876464844, -0.1323089599609375, -0.12331581115722656, -0.11432266235351562, -0.10532951354980469, -0.09633636474609375, -0.08734321594238281, -0.07835006713867188, -0.06935691833496094, -0.06036376953125, -0.05137062072753906, -0.042377471923828125, -0.03338432312011719, -0.02439117431640625, -0.015398025512695312, -0.006404876708984375, 0.0025882720947265625, 0.0115814208984375, 0.020574569702148438, 0.029567718505859375, 0.03856086730957031, 0.04755401611328125, 0.05654716491699219, 0.06554031372070312, 0.07453346252441406, 0.083526611328125, 0.09251976013183594, 0.10151290893554688, 0.11050605773925781, 0.11949920654296875, 0.1284923553466797, 0.13748550415039062, 0.14647865295410156, 0.1554718017578125, 0.16446495056152344, 0.17345809936523438, 0.1824512481689453, 0.19144439697265625, 0.2004375457763672, 0.20943069458007812, 0.21842384338378906, 0.2274169921875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 8.0, 9.0, 11.0, 11.0, 10.0, 30.0, 38.0, 43.0, 71.0, 107.0, 189.0, 328.0, 598.0, 1079.0, 2559.0, 7349.0, 28533.0, 262021.0, 3688084.0, 168428.0, 23296.0, 6595.0, 2327.0, 1067.0, 527.0, 332.0, 226.0, 101.0, 94.0, 61.0, 35.0, 25.0, 25.0, 11.0, 14.0, 8.0, 6.0, 8.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.185546875, -1.1452484130859375, -1.104949951171875, -1.0646514892578125, -1.02435302734375, -0.9840545654296875, -0.943756103515625, -0.9034576416015625, -0.8631591796875, -0.8228607177734375, -0.782562255859375, -0.7422637939453125, -0.70196533203125, -0.6616668701171875, -0.621368408203125, -0.5810699462890625, -0.540771484375, -0.5004730224609375, -0.460174560546875, -0.4198760986328125, -0.37957763671875, -0.3392791748046875, -0.298980712890625, -0.2586822509765625, -0.2183837890625, -0.1780853271484375, -0.137786865234375, -0.0974884033203125, -0.05718994140625, -0.0168914794921875, 0.023406982421875, 0.0637054443359375, 0.10400390625, 0.1443023681640625, 0.184600830078125, 0.2248992919921875, 0.26519775390625, 0.3054962158203125, 0.345794677734375, 0.3860931396484375, 0.4263916015625, 0.4666900634765625, 0.506988525390625, 0.5472869873046875, 0.58758544921875, 0.6278839111328125, 0.668182373046875, 0.7084808349609375, 0.748779296875, 0.7890777587890625, 0.829376220703125, 0.8696746826171875, 0.90997314453125, 0.9502716064453125, 0.990570068359375, 1.0308685302734375, 1.0711669921875, 1.1114654541015625, 1.151763916015625, 1.1920623779296875, 1.23236083984375, 1.2726593017578125, 1.312957763671875, 1.3532562255859375, 1.3935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 8.0, 7.0, 15.0, 15.0, 51.0, 67.0, 120.0, 213.0, 585.0, 1817.0, 534.0, 269.0, 133.0, 82.0, 45.0, 30.0, 21.0, 9.0, 12.0, 5.0, 10.0, 6.0, 4.0, 2.0, 7.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343505859375, -0.3329200744628906, -0.32233428955078125, -0.3117485046386719, -0.3011627197265625, -0.2905769348144531, -0.27999114990234375, -0.2694053649902344, -0.258819580078125, -0.24823379516601562, -0.23764801025390625, -0.22706222534179688, -0.2164764404296875, -0.20589065551757812, -0.19530487060546875, -0.18471908569335938, -0.17413330078125, -0.16354751586914062, -0.15296173095703125, -0.14237594604492188, -0.1317901611328125, -0.12120437622070312, -0.11061859130859375, -0.10003280639648438, -0.089447021484375, -0.07886123657226562, -0.06827545166015625, -0.057689666748046875, -0.0471038818359375, -0.036518096923828125, -0.02593231201171875, -0.015346527099609375, -0.0047607421875, 0.005825042724609375, 0.01641082763671875, 0.026996612548828125, 0.0375823974609375, 0.048168182373046875, 0.05875396728515625, 0.06933975219726562, 0.079925537109375, 0.09051132202148438, 0.10109710693359375, 0.11168289184570312, 0.1222686767578125, 0.13285446166992188, 0.14344024658203125, 0.15402603149414062, 0.16461181640625, 0.17519760131835938, 0.18578338623046875, 0.19636917114257812, 0.2069549560546875, 0.21754074096679688, 0.22812652587890625, 0.23871231079101562, 0.249298095703125, 0.2598838806152344, 0.27046966552734375, 0.2810554504394531, 0.2916412353515625, 0.3022270202636719, 0.31281280517578125, 0.3233985900878906, 0.333984375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 26.0, 599.0, 313.0, 40.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.644268035888672, -8.446642875671387, -8.249017715454102, -8.0513916015625, -7.853766441345215, -7.65614128112793, -7.458515644073486, -7.260890483856201, -7.063264846801758, -6.865639686584473, -6.668014049530029, -6.470388889312744, -6.272763252258301, -6.075138092041016, -5.877512454986572, -5.679887294769287, -5.482261657714844, -5.284636497497559, -5.087010860443115, -4.88938570022583, -4.691760063171387, -4.494134902954102, -4.296509265899658, -4.098884105682373, -3.901258945465088, -3.7036335468292236, -3.5060081481933594, -3.308382749557495, -3.110757350921631, -2.9131319522857666, -2.7155065536499023, -2.517881393432617, -2.320255756378174, -2.1226303577423096, -1.9250049591064453, -1.727379560470581, -1.5297541618347168, -1.3321287631988525, -1.1345034837722778, -0.9368780851364136, -0.7392526865005493, -0.5416272878646851, -0.3440019190311432, -0.14637655019760132, 0.05124884843826294, 0.2488742470741272, 0.4464995861053467, 0.6441249847412109, 0.8417503833770752, 1.0393757820129395, 1.2370011806488037, 1.434626579284668, 1.6322519779205322, 1.8298773765563965, 2.0275025367736816, 2.225128173828125, 2.42275333404541, 2.6203787326812744, 2.8180041313171387, 3.015629529953003, 3.213254928588867, 3.4108803272247314, 3.6085057258605957, 3.806130886077881, 4.003756523132324]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 14.0, 12.0, 14.0, 32.0, 34.0, 39.0, 52.0, 68.0, 77.0, 84.0, 67.0, 80.0, 77.0, 76.0, 64.0, 51.0, 39.0, 31.0, 26.0, 14.0, 12.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9605276584625244, -1.907336711883545, -1.854145884513855, -1.8009549379348755, -1.747763991355896, -1.694573163986206, -1.6413822174072266, -1.588191270828247, -1.5350003242492676, -1.481809377670288, -1.4286185503005981, -1.3754276037216187, -1.3222366571426392, -1.2690458297729492, -1.2158548831939697, -1.1626639366149902, -1.1094731092453003, -1.0562821626663208, -1.0030913352966309, -0.9499003887176514, -0.8967094421386719, -0.8435185551643372, -0.7903276681900024, -0.737136721611023, -0.6839458346366882, -0.6307549476623535, -0.577564001083374, -0.5243731141090393, -0.4711821973323822, -0.4179912805557251, -0.3648003935813904, -0.3116094768047333, -0.25841856002807617, -0.20522764325141907, -0.15203674137592316, -0.09884583950042725, -0.04565492272377014, 0.007535994052886963, 0.06072688102722168, 0.11391779780387878, 0.1671087145805359, 0.220299631357193, 0.2734905481338501, 0.3266814351081848, 0.3798723518848419, 0.433063268661499, 0.48625415563583374, 0.5394450426101685, 0.592635989189148, 0.6458268761634827, 0.6990178227424622, 0.7522087097167969, 0.8053996562957764, 0.8585905432701111, 0.9117814302444458, 0.9649723768234253, 1.0181632041931152, 1.0713541507720947, 1.1245449781417847, 1.1777359247207642, 1.2309268712997437, 1.2841176986694336, 1.337308645248413, 1.3904995918273926, 1.443690538406372]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 7.0, 12.0, 7.0, 13.0, 22.0, 38.0, 61.0, 77.0, 115.0, 201.0, 408.0, 758.0, 1678.0, 4266.0, 11815.0, 42207.0, 840124.0, 116107.0, 19390.0, 6399.0, 2524.0, 1111.0, 499.0, 256.0, 170.0, 93.0, 58.0, 33.0, 30.0, 19.0, 17.0, 9.0, 7.0, 4.0, 12.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.936767578125, -1.87158203125, -1.806396484375, -1.7412109375, -1.676025390625, -1.61083984375, -1.545654296875, -1.48046875, -1.415283203125, -1.35009765625, -1.284912109375, -1.2197265625, -1.154541015625, -1.08935546875, -1.024169921875, -0.958984375, -0.893798828125, -0.82861328125, -0.763427734375, -0.6982421875, -0.633056640625, -0.56787109375, -0.502685546875, -0.4375, -0.372314453125, -0.30712890625, -0.241943359375, -0.1767578125, -0.111572265625, -0.04638671875, 0.018798828125, 0.083984375, 0.149169921875, 0.21435546875, 0.279541015625, 0.3447265625, 0.409912109375, 0.47509765625, 0.540283203125, 0.60546875, 0.670654296875, 0.73583984375, 0.801025390625, 0.8662109375, 0.931396484375, 0.99658203125, 1.061767578125, 1.126953125, 1.192138671875, 1.25732421875, 1.322509765625, 1.3876953125, 1.452880859375, 1.51806640625, 1.583251953125, 1.6484375, 1.713623046875, 1.77880859375, 1.843994140625, 1.9091796875, 1.974365234375, 2.03955078125, 2.104736328125, 2.169921875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 10.0, 9.0, 12.0, 15.0, 20.0, 15.0, 45.0, 179.0, 395.0, 188.0, 46.0, 15.0, 13.0, 11.0, 11.0, 5.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.396728515625, -0.3866596221923828, -0.3765907287597656, -0.36652183532714844, -0.35645294189453125, -0.34638404846191406, -0.3363151550292969, -0.3262462615966797, -0.3161773681640625, -0.3061084747314453, -0.2960395812988281, -0.28597068786621094, -0.27590179443359375, -0.26583290100097656, -0.2557640075683594, -0.2456951141357422, -0.235626220703125, -0.2255573272705078, -0.21548843383789062, -0.20541954040527344, -0.19535064697265625, -0.18528175354003906, -0.17521286010742188, -0.1651439666748047, -0.1550750732421875, -0.1450061798095703, -0.13493728637695312, -0.12486839294433594, -0.11479949951171875, -0.10473060607910156, -0.09466171264648438, -0.08459281921386719, -0.07452392578125, -0.06445503234863281, -0.054386138916015625, -0.04431724548339844, -0.03424835205078125, -0.024179458618164062, -0.014110565185546875, -0.0040416717529296875, 0.0060272216796875, 0.016096115112304688, 0.026165008544921875, 0.03623390197753906, 0.04630279541015625, 0.05637168884277344, 0.06644058227539062, 0.07650947570800781, 0.086578369140625, 0.09664726257324219, 0.10671615600585938, 0.11678504943847656, 0.12685394287109375, 0.13692283630371094, 0.14699172973632812, 0.1570606231689453, 0.1671295166015625, 0.1771984100341797, 0.18726730346679688, 0.19733619689941406, 0.20740509033203125, 0.21747398376464844, 0.22754287719726562, 0.2376117706298828, 0.2476806640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 11.0, 18.0, 15.0, 20.0, 25.0, 39.0, 58.0, 51.0, 95.0, 121.0, 199.0, 344.0, 603.0, 1246.0, 3419.0, 11227.0, 47969.0, 271238.0, 560907.0, 117099.0, 23383.0, 6147.0, 2069.0, 936.0, 435.0, 276.0, 169.0, 127.0, 68.0, 55.0, 41.0, 30.0, 30.0, 18.0, 9.0, 12.0, 6.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8327484130859375, -0.802215576171875, -0.7716827392578125, -0.74114990234375, -0.7106170654296875, -0.680084228515625, -0.6495513916015625, -0.6190185546875, -0.5884857177734375, -0.557952880859375, -0.5274200439453125, -0.49688720703125, -0.4663543701171875, -0.435821533203125, -0.4052886962890625, -0.374755859375, -0.3442230224609375, -0.313690185546875, -0.2831573486328125, -0.25262451171875, -0.2220916748046875, -0.191558837890625, -0.1610260009765625, -0.1304931640625, -0.0999603271484375, -0.069427490234375, -0.0388946533203125, -0.00836181640625, 0.0221710205078125, 0.052703857421875, 0.0832366943359375, 0.11376953125, 0.1443023681640625, 0.174835205078125, 0.2053680419921875, 0.23590087890625, 0.2664337158203125, 0.296966552734375, 0.3274993896484375, 0.3580322265625, 0.3885650634765625, 0.419097900390625, 0.4496307373046875, 0.48016357421875, 0.5106964111328125, 0.541229248046875, 0.5717620849609375, 0.602294921875, 0.6328277587890625, 0.663360595703125, 0.6938934326171875, 0.72442626953125, 0.7549591064453125, 0.785491943359375, 0.8160247802734375, 0.8465576171875, 0.8770904541015625, 0.907623291015625, 0.9381561279296875, 0.96868896484375, 0.9992218017578125, 1.029754638671875, 1.0602874755859375, 1.0908203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 14.0, 12.0, 7.0, 15.0, 18.0, 14.0, 30.0, 24.0, 36.0, 26.0, 46.0, 37.0, 42.0, 41.0, 34.0, 46.0, 53.0, 46.0, 35.0, 45.0, 37.0, 38.0, 36.0, 37.0, 31.0, 36.0, 20.0, 25.0, 20.0, 13.0, 10.0, 16.0, 11.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5665969848632812, -0.5462799072265625, -0.5259628295898438, -0.505645751953125, -0.48532867431640625, -0.4650115966796875, -0.44469451904296875, -0.42437744140625, -0.40406036376953125, -0.3837432861328125, -0.36342620849609375, -0.343109130859375, -0.32279205322265625, -0.3024749755859375, -0.28215789794921875, -0.2618408203125, -0.24152374267578125, -0.2212066650390625, -0.20088958740234375, -0.180572509765625, -0.16025543212890625, -0.1399383544921875, -0.11962127685546875, -0.09930419921875, -0.07898712158203125, -0.0586700439453125, -0.03835296630859375, -0.018035888671875, 0.00228118896484375, 0.0225982666015625, 0.04291534423828125, 0.063232421875, 0.08354949951171875, 0.1038665771484375, 0.12418365478515625, 0.144500732421875, 0.16481781005859375, 0.1851348876953125, 0.20545196533203125, 0.22576904296875, 0.24608612060546875, 0.2664031982421875, 0.28672027587890625, 0.307037353515625, 0.32735443115234375, 0.3476715087890625, 0.36798858642578125, 0.3883056640625, 0.40862274169921875, 0.4289398193359375, 0.44925689697265625, 0.469573974609375, 0.48989105224609375, 0.5102081298828125, 0.5305252075195312, 0.55084228515625, 0.5711593627929688, 0.5914764404296875, 0.6117935180664062, 0.632110595703125, 0.6524276733398438, 0.6727447509765625, 0.6930618286132812, 0.71337890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 3.0, 10.0, 10.0, 17.0, 23.0, 44.0, 86.0, 155.0, 387.0, 1032.0, 4847.0, 715996.0, 320208.0, 4086.0, 942.0, 342.0, 152.0, 84.0, 43.0, 25.0, 18.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.590911865234375, -2.49822998046875, -2.405548095703125, -2.3128662109375, -2.220184326171875, -2.12750244140625, -2.034820556640625, -1.942138671875, -1.849456787109375, -1.75677490234375, -1.664093017578125, -1.5714111328125, -1.478729248046875, -1.38604736328125, -1.293365478515625, -1.20068359375, -1.108001708984375, -1.01531982421875, -0.922637939453125, -0.8299560546875, -0.737274169921875, -0.64459228515625, -0.551910400390625, -0.459228515625, -0.366546630859375, -0.27386474609375, -0.181182861328125, -0.0885009765625, 0.004180908203125, 0.09686279296875, 0.189544677734375, 0.2822265625, 0.374908447265625, 0.46759033203125, 0.560272216796875, 0.6529541015625, 0.745635986328125, 0.83831787109375, 0.930999755859375, 1.023681640625, 1.116363525390625, 1.20904541015625, 1.301727294921875, 1.3944091796875, 1.487091064453125, 1.57977294921875, 1.672454833984375, 1.76513671875, 1.857818603515625, 1.95050048828125, 2.043182373046875, 2.1358642578125, 2.228546142578125, 2.32122802734375, 2.413909912109375, 2.506591796875, 2.599273681640625, 2.69195556640625, 2.784637451171875, 2.8773193359375, 2.970001220703125, 3.06268310546875, 3.155364990234375, 3.248046875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 12.0, 21.0, 46.0, 105.0, 234.0, 321.0, 154.0, 49.0, 31.0, 14.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.00021457672119140625, -0.0002103801816701889, -0.00020618364214897156, -0.0002019871026277542, -0.00019779056310653687, -0.00019359402358531952, -0.00018939748406410217, -0.00018520094454288483, -0.00018100440502166748, -0.00017680786550045013, -0.0001726113259792328, -0.00016841478645801544, -0.0001642182469367981, -0.00016002170741558075, -0.0001558251678943634, -0.00015162862837314606, -0.0001474320888519287, -0.00014323554933071136, -0.00013903900980949402, -0.00013484247028827667, -0.00013064593076705933, -0.00012644939124584198, -0.00012225285172462463, -0.00011805631220340729, -0.00011385977268218994, -0.0001096632331609726, -0.00010546669363975525, -0.0001012701541185379, -9.707361459732056e-05, -9.287707507610321e-05, -8.868053555488586e-05, -8.448399603366852e-05, -8.028745651245117e-05, -7.609091699123383e-05, -7.189437747001648e-05, -6.769783794879913e-05, -6.350129842758179e-05, -5.930475890636444e-05, -5.5108219385147095e-05, -5.091167986392975e-05, -4.67151403427124e-05, -4.2518600821495056e-05, -3.832206130027771e-05, -3.4125521779060364e-05, -2.9928982257843018e-05, -2.573244273662567e-05, -2.1535903215408325e-05, -1.733936369419098e-05, -1.3142824172973633e-05, -8.946284651756287e-06, -4.7497451305389404e-06, -5.532056093215942e-07, 3.643333911895752e-06, 7.839873433113098e-06, 1.2036412954330444e-05, 1.623295247554779e-05, 2.0429491996765137e-05, 2.4626031517982483e-05, 2.882257103919983e-05, 3.3019110560417175e-05, 3.721565008163452e-05, 4.141218960285187e-05, 4.5608729124069214e-05, 4.980526864528656e-05, 5.4001808166503906e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 7.0, 7.0, 15.0, 17.0, 19.0, 43.0, 99.0, 231.0, 542.0, 1676.0, 7820.0, 285273.0, 738818.0, 11145.0, 1799.0, 560.0, 249.0, 121.0, 50.0, 22.0, 14.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.728515625, -1.67108154296875, -1.6136474609375, -1.55621337890625, -1.498779296875, -1.44134521484375, -1.3839111328125, -1.32647705078125, -1.26904296875, -1.21160888671875, -1.1541748046875, -1.09674072265625, -1.039306640625, -0.98187255859375, -0.9244384765625, -0.86700439453125, -0.8095703125, -0.75213623046875, -0.6947021484375, -0.63726806640625, -0.579833984375, -0.52239990234375, -0.4649658203125, -0.40753173828125, -0.35009765625, -0.29266357421875, -0.2352294921875, -0.17779541015625, -0.120361328125, -0.06292724609375, -0.0054931640625, 0.05194091796875, 0.109375, 0.16680908203125, 0.2242431640625, 0.28167724609375, 0.339111328125, 0.39654541015625, 0.4539794921875, 0.51141357421875, 0.56884765625, 0.62628173828125, 0.6837158203125, 0.74114990234375, 0.798583984375, 0.85601806640625, 0.9134521484375, 0.97088623046875, 1.0283203125, 1.08575439453125, 1.1431884765625, 1.20062255859375, 1.258056640625, 1.31549072265625, 1.3729248046875, 1.43035888671875, 1.48779296875, 1.54522705078125, 1.6026611328125, 1.66009521484375, 1.717529296875, 1.77496337890625, 1.8323974609375, 1.88983154296875, 1.947265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 15.0, 25.0, 22.0, 44.0, 73.0, 135.0, 185.0, 183.0, 126.0, 63.0, 35.0, 32.0, 22.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.091796875, -1.0552978515625, -1.018798828125, -0.9822998046875, -0.94580078125, -0.9093017578125, -0.872802734375, -0.8363037109375, -0.7998046875, -0.7633056640625, -0.726806640625, -0.6903076171875, -0.65380859375, -0.6173095703125, -0.580810546875, -0.5443115234375, -0.5078125, -0.4713134765625, -0.434814453125, -0.3983154296875, -0.36181640625, -0.3253173828125, -0.288818359375, -0.2523193359375, -0.2158203125, -0.1793212890625, -0.142822265625, -0.1063232421875, -0.06982421875, -0.0333251953125, 0.003173828125, 0.0396728515625, 0.076171875, 0.1126708984375, 0.149169921875, 0.1856689453125, 0.22216796875, 0.2586669921875, 0.295166015625, 0.3316650390625, 0.3681640625, 0.4046630859375, 0.441162109375, 0.4776611328125, 0.51416015625, 0.5506591796875, 0.587158203125, 0.6236572265625, 0.66015625, 0.6966552734375, 0.733154296875, 0.7696533203125, 0.80615234375, 0.8426513671875, 0.879150390625, 0.9156494140625, 0.9521484375, 0.9886474609375, 1.025146484375, 1.0616455078125, 1.09814453125, 1.1346435546875, 1.171142578125, 1.2076416015625, 1.244140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 9.0, 75.0, 625.0, 247.0, 28.0, 12.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.03753662109375, -34.317893981933594, -33.59825134277344, -32.87860870361328, -32.15896987915039, -31.439327239990234, -30.719684600830078, -30.000041961669922, -29.280399322509766, -28.56075668334961, -27.841115951538086, -27.12147331237793, -26.401830673217773, -25.68218994140625, -24.962547302246094, -24.242904663085938, -23.523263931274414, -22.803621292114258, -22.083980560302734, -21.364337921142578, -20.644695281982422, -19.925052642822266, -19.205411911010742, -18.485769271850586, -17.766128540039062, -17.046485900878906, -16.326845169067383, -15.607202529907227, -14.88755989074707, -14.16791820526123, -13.44827651977539, -12.728633880615234, -12.008993148803711, -11.289351463317871, -10.569708824157715, -9.850067138671875, -9.130424499511719, -8.410782814025879, -7.691141128540039, -6.971498966217041, -6.251856803894043, -5.532214641571045, -4.812572479248047, -4.092930793762207, -3.373288631439209, -2.653646469116211, -1.934004783630371, -1.214362621307373, -0.494720458984375, 0.2249215841293335, 0.944563627243042, 1.664205551147461, 2.383847713470459, 3.103489875793457, 3.823131561279297, 4.542773723602295, 5.262415885925293, 5.982058048248291, 6.701700210571289, 7.421341896057129, 8.140983581542969, 8.860626220703125, 9.580267906188965, 10.299909591674805, 11.019552230834961]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 7.0, 11.0, 21.0, 21.0, 33.0, 50.0, 45.0, 58.0, 72.0, 88.0, 66.0, 84.0, 72.0, 65.0, 59.0, 57.0, 32.0, 35.0, 21.0, 12.0, 15.0, 11.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.706931114196777, -6.4611921310424805, -6.215453624725342, -5.969714641571045, -5.723975658416748, -5.478237152099609, -5.2324981689453125, -4.986759185791016, -4.741020202636719, -4.495281219482422, -4.249542713165283, -4.003803730010986, -3.7580647468566895, -3.5123260021209717, -3.266587257385254, -3.020848274230957, -2.7751095294952393, -2.5293707847595215, -2.2836318016052246, -2.037893056869507, -1.79215407371521, -1.5464153289794922, -1.3006764650344849, -1.0549376010894775, -0.8091987371444702, -0.5634598731994629, -0.31772103905677795, -0.07198220491409302, 0.1737566590309143, 0.41949546337127686, 0.6652343273162842, 0.9109731912612915, 1.1567120552062988, 1.4024509191513062, 1.6481897830963135, 1.8939285278320312, 2.139667510986328, 2.385406255722046, 2.6311450004577637, 2.8768839836120605, 3.1226229667663574, 3.368361711502075, 3.614100694656372, 3.85983943939209, 4.105578422546387, 4.351317405700684, 4.597055912017822, 4.842794895172119, 5.088533401489258, 5.334272384643555, 5.580010890960693, 5.82574987411499, 6.071488857269287, 6.317227363586426, 6.562966346740723, 6.8087053298950195, 7.054444313049316, 7.300183296203613, 7.545921802520752, 7.791660785675049, 8.037399291992188, 8.283138275146484, 8.528877258300781, 8.774616241455078, 9.020355224609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 0.0, 5.0, 2.0, 4.0, 5.0, 5.0, 4.0, 3.0, 7.0, 6.0, 3.0, 10.0, 11.0, 14.0, 16.0, 29.0, 30.0, 66.0, 100.0, 151.0, 274.0, 524.0, 941.0, 2183.0, 6783.0, 64035.0, 4089559.0, 22571.0, 3976.0, 1392.0, 663.0, 314.0, 181.0, 111.0, 81.0, 58.0, 34.0, 35.0, 30.0, 18.0, 17.0, 8.0, 10.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.76953125, -5.6190185546875, -5.468505859375, -5.3179931640625, -5.16748046875, -5.0169677734375, -4.866455078125, -4.7159423828125, -4.5654296875, -4.4149169921875, -4.264404296875, -4.1138916015625, -3.96337890625, -3.8128662109375, -3.662353515625, -3.5118408203125, -3.361328125, -3.2108154296875, -3.060302734375, -2.9097900390625, -2.75927734375, -2.6087646484375, -2.458251953125, -2.3077392578125, -2.1572265625, -2.0067138671875, -1.856201171875, -1.7056884765625, -1.55517578125, -1.4046630859375, -1.254150390625, -1.1036376953125, -0.953125, -0.8026123046875, -0.652099609375, -0.5015869140625, -0.35107421875, -0.2005615234375, -0.050048828125, 0.1004638671875, 0.2509765625, 0.4014892578125, 0.552001953125, 0.7025146484375, 0.85302734375, 1.0035400390625, 1.154052734375, 1.3045654296875, 1.455078125, 1.6055908203125, 1.756103515625, 1.9066162109375, 2.05712890625, 2.2076416015625, 2.358154296875, 2.5086669921875, 2.6591796875, 2.8096923828125, 2.960205078125, 3.1107177734375, 3.26123046875, 3.4117431640625, 3.562255859375, 3.7127685546875, 3.86328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 10.0, 17.0, 29.0, 49.0, 129.0, 298.0, 255.0, 107.0, 42.0, 23.0, 11.0, 7.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3964996337890625, -0.386016845703125, -0.3755340576171875, -0.36505126953125, -0.3545684814453125, -0.344085693359375, -0.3336029052734375, -0.3231201171875, -0.3126373291015625, -0.302154541015625, -0.2916717529296875, -0.28118896484375, -0.2707061767578125, -0.260223388671875, -0.2497406005859375, -0.2392578125, -0.2287750244140625, -0.218292236328125, -0.2078094482421875, -0.19732666015625, -0.1868438720703125, -0.176361083984375, -0.1658782958984375, -0.1553955078125, -0.1449127197265625, -0.134429931640625, -0.1239471435546875, -0.11346435546875, -0.1029815673828125, -0.092498779296875, -0.0820159912109375, -0.071533203125, -0.0610504150390625, -0.050567626953125, -0.0400848388671875, -0.02960205078125, -0.0191192626953125, -0.008636474609375, 0.0018463134765625, 0.0123291015625, 0.0228118896484375, 0.033294677734375, 0.0437774658203125, 0.05426025390625, 0.0647430419921875, 0.075225830078125, 0.0857086181640625, 0.09619140625, 0.1066741943359375, 0.117156982421875, 0.1276397705078125, 0.13812255859375, 0.1486053466796875, 0.159088134765625, 0.1695709228515625, 0.1800537109375, 0.1905364990234375, 0.201019287109375, 0.2115020751953125, 0.22198486328125, 0.2324676513671875, 0.242950439453125, 0.2534332275390625, 0.263916015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 9.0, 10.0, 9.0, 24.0, 23.0, 24.0, 51.0, 77.0, 126.0, 243.0, 541.0, 1692.0, 9150.0, 171983.0, 3962011.0, 41934.0, 4496.0, 1039.0, 397.0, 176.0, 83.0, 59.0, 33.0, 28.0, 13.0, 12.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.640625, -2.553497314453125, -2.46636962890625, -2.379241943359375, -2.2921142578125, -2.204986572265625, -2.11785888671875, -2.030731201171875, -1.943603515625, -1.856475830078125, -1.76934814453125, -1.682220458984375, -1.5950927734375, -1.507965087890625, -1.42083740234375, -1.333709716796875, -1.24658203125, -1.159454345703125, -1.07232666015625, -0.985198974609375, -0.8980712890625, -0.810943603515625, -0.72381591796875, -0.636688232421875, -0.549560546875, -0.462432861328125, -0.37530517578125, -0.288177490234375, -0.2010498046875, -0.113922119140625, -0.02679443359375, 0.060333251953125, 0.1474609375, 0.234588623046875, 0.32171630859375, 0.408843994140625, 0.4959716796875, 0.583099365234375, 0.67022705078125, 0.757354736328125, 0.844482421875, 0.931610107421875, 1.01873779296875, 1.105865478515625, 1.1929931640625, 1.280120849609375, 1.36724853515625, 1.454376220703125, 1.54150390625, 1.628631591796875, 1.71575927734375, 1.802886962890625, 1.8900146484375, 1.977142333984375, 2.06427001953125, 2.151397705078125, 2.238525390625, 2.325653076171875, 2.41278076171875, 2.499908447265625, 2.5870361328125, 2.674163818359375, 2.76129150390625, 2.848419189453125, 2.935546875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 1.0, 4.0, 9.0, 7.0, 19.0, 16.0, 21.0, 44.0, 64.0, 121.0, 174.0, 437.0, 1424.0, 827.0, 350.0, 204.0, 110.0, 52.0, 36.0, 38.0, 23.0, 22.0, 15.0, 9.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.29150390625, -0.2828826904296875, -0.274261474609375, -0.2656402587890625, -0.25701904296875, -0.2483978271484375, -0.239776611328125, -0.2311553955078125, -0.2225341796875, -0.2139129638671875, -0.205291748046875, -0.1966705322265625, -0.18804931640625, -0.1794281005859375, -0.170806884765625, -0.1621856689453125, -0.153564453125, -0.1449432373046875, -0.136322021484375, -0.1277008056640625, -0.11907958984375, -0.1104583740234375, -0.101837158203125, -0.0932159423828125, -0.0845947265625, -0.0759735107421875, -0.067352294921875, -0.0587310791015625, -0.05010986328125, -0.0414886474609375, -0.032867431640625, -0.0242462158203125, -0.015625, -0.0070037841796875, 0.001617431640625, 0.0102386474609375, 0.01885986328125, 0.0274810791015625, 0.036102294921875, 0.0447235107421875, 0.0533447265625, 0.0619659423828125, 0.070587158203125, 0.0792083740234375, 0.08782958984375, 0.0964508056640625, 0.105072021484375, 0.1136932373046875, 0.122314453125, 0.1309356689453125, 0.139556884765625, 0.1481781005859375, 0.15679931640625, 0.1654205322265625, 0.174041748046875, 0.1826629638671875, 0.1912841796875, 0.1999053955078125, 0.208526611328125, 0.2171478271484375, 0.22576904296875, 0.2343902587890625, 0.243011474609375, 0.2516326904296875, 0.26025390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 23.0, 85.0, 341.0, 361.0, 132.0, 35.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7346351146698, -3.6455018520355225, -3.556368350982666, -3.4672350883483887, -3.3781018257141113, -3.288968563079834, -3.1998353004455566, -3.1107017993927, -3.021568536758423, -2.9324352741241455, -2.843301773071289, -2.7541685104370117, -2.6650352478027344, -2.575901985168457, -2.4867687225341797, -2.3976352214813232, -2.308501958847046, -2.2193686962127686, -2.130235195159912, -2.0411019325256348, -1.9519686698913574, -1.86283540725708, -1.7737020254135132, -1.6845686435699463, -1.595435380935669, -1.5063021183013916, -1.4171687364578247, -1.3280353546142578, -1.2389020919799805, -1.1497688293457031, -1.0606354475021362, -0.9715021252632141, -0.8823685646057129, -0.7932352423667908, -0.7041019201278687, -0.6149685978889465, -0.5258352756500244, -0.4367019534111023, -0.3475686311721802, -0.25843530893325806, -0.16930198669433594, -0.08016866445541382, 0.0089646577835083, 0.09809798002243042, 0.18723130226135254, 0.27636462450027466, 0.3654979467391968, 0.4546312689781189, 0.543764591217041, 0.6328979134559631, 0.7220312356948853, 0.8111645579338074, 0.9002978801727295, 0.9894312024116516, 1.0785645246505737, 1.1676979064941406, 1.256831169128418, 1.3459644317626953, 1.4350978136062622, 1.524231195449829, 1.6133644580841064, 1.7024977207183838, 1.7916311025619507, 1.8807644844055176, 1.969897747039795]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 6.0, 11.0, 13.0, 16.0, 21.0, 23.0, 28.0, 26.0, 35.0, 38.0, 43.0, 44.0, 43.0, 46.0, 53.0, 67.0, 51.0, 45.0, 41.0, 47.0, 59.0, 32.0, 41.0, 24.0, 25.0, 17.0, 15.0, 11.0, 11.0, 8.0, 12.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.8824684619903564, -0.8533709645271301, -0.824273407459259, -0.7951759099960327, -0.7660783529281616, -0.7369808554649353, -0.707883358001709, -0.6787858009338379, -0.6496883034706116, -0.6205908060073853, -0.5914932489395142, -0.5623957514762878, -0.5332982540130615, -0.5042006969451904, -0.4751031994819641, -0.4460056722164154, -0.4169081449508667, -0.387810617685318, -0.3587130904197693, -0.32961559295654297, -0.30051806569099426, -0.27142053842544556, -0.24232302606105804, -0.21322551369667053, -0.18412798643112183, -0.15503045916557312, -0.1259329468011856, -0.0968354269862175, -0.06773790717124939, -0.038640379905700684, -0.009542867541313171, 0.01955464482307434, 0.04865217208862305, 0.07774969190359116, 0.10684721171855927, 0.13594472408294678, 0.16504225134849548, 0.1941397786140442, 0.2232372909784317, 0.2523348033428192, 0.2814323306083679, 0.3105298578739166, 0.33962738513946533, 0.36872488260269165, 0.39782240986824036, 0.42691993713378906, 0.4560174345970154, 0.4851149618625641, 0.5142124891281128, 0.5433099865913391, 0.5724075436592102, 0.6015050411224365, 0.6306025981903076, 0.6597000956535339, 0.6887975931167603, 0.7178951501846313, 0.7469926476478577, 0.776090145111084, 0.8051877021789551, 0.8342851996421814, 0.8633826971054077, 0.8924802541732788, 0.9215777516365051, 0.9506752490997314, 0.9797728061676025]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 4.0, 2.0, 12.0, 21.0, 33.0, 34.0, 64.0, 108.0, 190.0, 504.0, 1101.0, 3779.0, 31139.0, 958366.0, 46484.0, 4338.0, 1248.0, 536.0, 269.0, 135.0, 67.0, 38.0, 34.0, 13.0, 9.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.869140625, -2.772064208984375, -2.67498779296875, -2.577911376953125, -2.4808349609375, -2.383758544921875, -2.28668212890625, -2.189605712890625, -2.092529296875, -1.995452880859375, -1.89837646484375, -1.801300048828125, -1.7042236328125, -1.607147216796875, -1.51007080078125, -1.412994384765625, -1.31591796875, -1.218841552734375, -1.12176513671875, -1.024688720703125, -0.9276123046875, -0.830535888671875, -0.73345947265625, -0.636383056640625, -0.539306640625, -0.442230224609375, -0.34515380859375, -0.248077392578125, -0.1510009765625, -0.053924560546875, 0.04315185546875, 0.140228271484375, 0.2373046875, 0.334381103515625, 0.43145751953125, 0.528533935546875, 0.6256103515625, 0.722686767578125, 0.81976318359375, 0.916839599609375, 1.013916015625, 1.110992431640625, 1.20806884765625, 1.305145263671875, 1.4022216796875, 1.499298095703125, 1.59637451171875, 1.693450927734375, 1.79052734375, 1.887603759765625, 1.98468017578125, 2.081756591796875, 2.1788330078125, 2.275909423828125, 2.37298583984375, 2.470062255859375, 2.567138671875, 2.664215087890625, 2.76129150390625, 2.858367919921875, 2.9554443359375, 3.052520751953125, 3.14959716796875, 3.246673583984375, 3.34375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 17.0, 31.0, 63.0, 188.0, 293.0, 230.0, 102.0, 37.0, 9.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42578125, -0.4152965545654297, -0.4048118591308594, -0.39432716369628906, -0.38384246826171875, -0.37335777282714844, -0.3628730773925781, -0.3523883819580078, -0.3419036865234375, -0.3314189910888672, -0.3209342956542969, -0.31044960021972656, -0.29996490478515625, -0.28948020935058594, -0.2789955139160156, -0.2685108184814453, -0.258026123046875, -0.2475414276123047, -0.23705673217773438, -0.22657203674316406, -0.21608734130859375, -0.20560264587402344, -0.19511795043945312, -0.1846332550048828, -0.1741485595703125, -0.1636638641357422, -0.15317916870117188, -0.14269447326660156, -0.13220977783203125, -0.12172508239746094, -0.11124038696289062, -0.10075569152832031, -0.09027099609375, -0.07978630065917969, -0.06930160522460938, -0.05881690979003906, -0.04833221435546875, -0.03784751892089844, -0.027362823486328125, -0.016878128051757812, -0.0063934326171875, 0.0040912628173828125, 0.014575958251953125, 0.025060653686523438, 0.03554534912109375, 0.04603004455566406, 0.056514739990234375, 0.06699943542480469, 0.077484130859375, 0.08796882629394531, 0.09845352172851562, 0.10893821716308594, 0.11942291259765625, 0.12990760803222656, 0.14039230346679688, 0.1508769989013672, 0.1613616943359375, 0.1718463897705078, 0.18233108520507812, 0.19281578063964844, 0.20330047607421875, 0.21378517150878906, 0.22426986694335938, 0.2347545623779297, 0.2452392578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 10.0, 19.0, 19.0, 26.0, 28.0, 49.0, 76.0, 97.0, 124.0, 153.0, 258.0, 387.0, 518.0, 878.0, 1794.0, 4520.0, 17325.0, 91154.0, 594621.0, 280959.0, 40115.0, 9162.0, 2816.0, 1289.0, 699.0, 413.0, 283.0, 217.0, 127.0, 98.0, 81.0, 58.0, 40.0, 36.0, 29.0, 9.0, 12.0, 12.0, 7.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3036956787109375, -1.262664794921875, -1.2216339111328125, -1.18060302734375, -1.1395721435546875, -1.098541259765625, -1.0575103759765625, -1.0164794921875, -0.9754486083984375, -0.934417724609375, -0.8933868408203125, -0.85235595703125, -0.8113250732421875, -0.770294189453125, -0.7292633056640625, -0.688232421875, -0.6472015380859375, -0.606170654296875, -0.5651397705078125, -0.52410888671875, -0.4830780029296875, -0.442047119140625, -0.4010162353515625, -0.3599853515625, -0.3189544677734375, -0.277923583984375, -0.2368927001953125, -0.19586181640625, -0.1548309326171875, -0.113800048828125, -0.0727691650390625, -0.03173828125, 0.0092926025390625, 0.050323486328125, 0.0913543701171875, 0.13238525390625, 0.1734161376953125, 0.214447021484375, 0.2554779052734375, 0.2965087890625, 0.3375396728515625, 0.378570556640625, 0.4196014404296875, 0.46063232421875, 0.5016632080078125, 0.542694091796875, 0.5837249755859375, 0.624755859375, 0.6657867431640625, 0.706817626953125, 0.7478485107421875, 0.78887939453125, 0.8299102783203125, 0.870941162109375, 0.9119720458984375, 0.9530029296875, 0.9940338134765625, 1.035064697265625, 1.0760955810546875, 1.11712646484375, 1.1581573486328125, 1.199188232421875, 1.2402191162109375, 1.28125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 6.0, 8.0, 8.0, 10.0, 22.0, 13.0, 20.0, 23.0, 24.0, 25.0, 28.0, 26.0, 33.0, 28.0, 28.0, 37.0, 47.0, 39.0, 43.0, 45.0, 33.0, 50.0, 50.0, 31.0, 49.0, 29.0, 32.0, 35.0, 16.0, 30.0, 15.0, 17.0, 12.0, 11.0, 9.0, 11.0, 10.0, 10.0, 7.0, 4.0, 9.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.78515625, -0.7636032104492188, -0.7420501708984375, -0.7204971313476562, -0.698944091796875, -0.6773910522460938, -0.6558380126953125, -0.6342849731445312, -0.61273193359375, -0.5911788940429688, -0.5696258544921875, -0.5480728149414062, -0.526519775390625, -0.5049667358398438, -0.4834136962890625, -0.46186065673828125, -0.4403076171875, -0.41875457763671875, -0.3972015380859375, -0.37564849853515625, -0.354095458984375, -0.33254241943359375, -0.3109893798828125, -0.28943634033203125, -0.26788330078125, -0.24633026123046875, -0.2247772216796875, -0.20322418212890625, -0.181671142578125, -0.16011810302734375, -0.1385650634765625, -0.11701202392578125, -0.095458984375, -0.07390594482421875, -0.0523529052734375, -0.03079986572265625, -0.009246826171875, 0.01230621337890625, 0.0338592529296875, 0.05541229248046875, 0.07696533203125, 0.09851837158203125, 0.1200714111328125, 0.14162445068359375, 0.163177490234375, 0.18473052978515625, 0.2062835693359375, 0.22783660888671875, 0.2493896484375, 0.27094268798828125, 0.2924957275390625, 0.31404876708984375, 0.335601806640625, 0.35715484619140625, 0.3787078857421875, 0.40026092529296875, 0.42181396484375, 0.44336700439453125, 0.4649200439453125, 0.48647308349609375, 0.508026123046875, 0.5295791625976562, 0.5511322021484375, 0.5726852416992188, 0.59423828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 11.0, 6.0, 14.0, 26.0, 30.0, 45.0, 72.0, 133.0, 228.0, 480.0, 1184.0, 3991.0, 26229.0, 638219.0, 356519.0, 16455.0, 3026.0, 953.0, 436.0, 203.0, 92.0, 55.0, 49.0, 17.0, 14.0, 13.0, 16.0, 9.0, 6.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9453125, -0.915679931640625, -0.88604736328125, -0.856414794921875, -0.8267822265625, -0.797149658203125, -0.76751708984375, -0.737884521484375, -0.708251953125, -0.678619384765625, -0.64898681640625, -0.619354248046875, -0.5897216796875, -0.560089111328125, -0.53045654296875, -0.500823974609375, -0.47119140625, -0.441558837890625, -0.41192626953125, -0.382293701171875, -0.3526611328125, -0.323028564453125, -0.29339599609375, -0.263763427734375, -0.234130859375, -0.204498291015625, -0.17486572265625, -0.145233154296875, -0.1156005859375, -0.085968017578125, -0.05633544921875, -0.026702880859375, 0.0029296875, 0.032562255859375, 0.06219482421875, 0.091827392578125, 0.1214599609375, 0.151092529296875, 0.18072509765625, 0.210357666015625, 0.239990234375, 0.269622802734375, 0.29925537109375, 0.328887939453125, 0.3585205078125, 0.388153076171875, 0.41778564453125, 0.447418212890625, 0.47705078125, 0.506683349609375, 0.53631591796875, 0.565948486328125, 0.5955810546875, 0.625213623046875, 0.65484619140625, 0.684478759765625, 0.714111328125, 0.743743896484375, 0.77337646484375, 0.803009033203125, 0.8326416015625, 0.862274169921875, 0.89190673828125, 0.921539306640625, 0.951171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 16.0, 13.0, 17.0, 26.0, 30.0, 60.0, 74.0, 90.0, 116.0, 115.0, 105.0, 87.0, 60.0, 35.0, 33.0, 31.0, 11.0, 17.0, 12.0, 4.0, 9.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.374980926513672e-05, -4.194770008325577e-05, -4.014559090137482e-05, -3.8343481719493866e-05, -3.6541372537612915e-05, -3.4739263355731964e-05, -3.293715417385101e-05, -3.113504499197006e-05, -2.933293581008911e-05, -2.753082662820816e-05, -2.572871744632721e-05, -2.392660826444626e-05, -2.2124499082565308e-05, -2.0322389900684357e-05, -1.8520280718803406e-05, -1.6718171536922455e-05, -1.4916062355041504e-05, -1.3113953173160553e-05, -1.1311843991279602e-05, -9.509734809398651e-06, -7.7076256275177e-06, -5.905516445636749e-06, -4.103407263755798e-06, -2.3012980818748474e-06, -4.991888999938965e-07, 1.3029202818870544e-06, 3.1050294637680054e-06, 4.907138645648956e-06, 6.709247827529907e-06, 8.511357009410858e-06, 1.0313466191291809e-05, 1.211557537317276e-05, 1.3917684555053711e-05, 1.5719793736934662e-05, 1.7521902918815613e-05, 1.9324012100696564e-05, 2.1126121282577515e-05, 2.2928230464458466e-05, 2.4730339646339417e-05, 2.6532448828220367e-05, 2.833455801010132e-05, 3.013666719198227e-05, 3.193877637386322e-05, 3.374088555574417e-05, 3.554299473762512e-05, 3.734510391950607e-05, 3.9147213101387024e-05, 4.0949322283267975e-05, 4.2751431465148926e-05, 4.455354064702988e-05, 4.635564982891083e-05, 4.815775901079178e-05, 4.995986819267273e-05, 5.176197737455368e-05, 5.356408655643463e-05, 5.536619573831558e-05, 5.716830492019653e-05, 5.8970414102077484e-05, 6.0772523283958435e-05, 6.257463246583939e-05, 6.437674164772034e-05, 6.617885082960129e-05, 6.798096001148224e-05, 6.978306919336319e-05, 7.158517837524414e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 10.0, 12.0, 18.0, 17.0, 40.0, 65.0, 108.0, 153.0, 308.0, 591.0, 1378.0, 4242.0, 21432.0, 363264.0, 616129.0, 32161.0, 5401.0, 1667.0, 688.0, 323.0, 207.0, 105.0, 62.0, 51.0, 32.0, 25.0, 18.0, 13.0, 5.0, 7.0, 6.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9266433715820312, -0.8947906494140625, -0.8629379272460938, -0.831085205078125, -0.7992324829101562, -0.7673797607421875, -0.7355270385742188, -0.70367431640625, -0.6718215942382812, -0.6399688720703125, -0.6081161499023438, -0.576263427734375, -0.5444107055664062, -0.5125579833984375, -0.48070526123046875, -0.4488525390625, -0.41699981689453125, -0.3851470947265625, -0.35329437255859375, -0.321441650390625, -0.28958892822265625, -0.2577362060546875, -0.22588348388671875, -0.19403076171875, -0.16217803955078125, -0.1303253173828125, -0.09847259521484375, -0.066619873046875, -0.03476715087890625, -0.0029144287109375, 0.02893829345703125, 0.060791015625, 0.09264373779296875, 0.1244964599609375, 0.15634918212890625, 0.188201904296875, 0.22005462646484375, 0.2519073486328125, 0.28376007080078125, 0.31561279296875, 0.34746551513671875, 0.3793182373046875, 0.41117095947265625, 0.443023681640625, 0.47487640380859375, 0.5067291259765625, 0.5385818481445312, 0.5704345703125, 0.6022872924804688, 0.6341400146484375, 0.6659927368164062, 0.697845458984375, 0.7296981811523438, 0.7615509033203125, 0.7934036254882812, 0.82525634765625, 0.8571090698242188, 0.8889617919921875, 0.9208145141601562, 0.952667236328125, 0.9845199584960938, 1.0163726806640625, 1.0482254028320312, 1.080078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 3.0, 8.0, 9.0, 16.0, 18.0, 24.0, 38.0, 33.0, 49.0, 62.0, 85.0, 94.0, 97.0, 105.0, 74.0, 69.0, 53.0, 36.0, 35.0, 16.0, 14.0, 9.0, 10.0, 7.0, 9.0, 9.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.468017578125, -0.4548454284667969, -0.44167327880859375, -0.4285011291503906, -0.4153289794921875, -0.4021568298339844, -0.38898468017578125, -0.3758125305175781, -0.362640380859375, -0.3494682312011719, -0.33629608154296875, -0.3231239318847656, -0.3099517822265625, -0.2967796325683594, -0.28360748291015625, -0.2704353332519531, -0.25726318359375, -0.24409103393554688, -0.23091888427734375, -0.21774673461914062, -0.2045745849609375, -0.19140243530273438, -0.17823028564453125, -0.16505813598632812, -0.151885986328125, -0.13871383666992188, -0.12554168701171875, -0.11236953735351562, -0.0991973876953125, -0.08602523803710938, -0.07285308837890625, -0.059680938720703125, -0.0465087890625, -0.033336639404296875, -0.02016448974609375, -0.006992340087890625, 0.0061798095703125, 0.019351959228515625, 0.03252410888671875, 0.045696258544921875, 0.058868408203125, 0.07204055786132812, 0.08521270751953125, 0.09838485717773438, 0.1115570068359375, 0.12472915649414062, 0.13790130615234375, 0.15107345581054688, 0.16424560546875, 0.17741775512695312, 0.19058990478515625, 0.20376205444335938, 0.2169342041015625, 0.23010635375976562, 0.24327850341796875, 0.2564506530761719, 0.269622802734375, 0.2827949523925781, 0.29596710205078125, 0.3091392517089844, 0.3223114013671875, 0.3354835510253906, 0.34865570068359375, 0.3618278503417969, 0.375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 63.0, 550.0, 337.0, 29.0, 8.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-46.234886169433594, -45.391357421875, -44.547828674316406, -43.70429611206055, -42.86076736450195, -42.01723861694336, -41.173709869384766, -40.33018112182617, -39.48664855957031, -38.64311981201172, -37.799591064453125, -36.956058502197266, -36.11252975463867, -35.26900100708008, -34.425472259521484, -33.58194351196289, -32.7384147644043, -31.894886016845703, -31.051355361938477, -30.207826614379883, -29.364295959472656, -28.520767211914062, -27.67723846435547, -26.833707809448242, -25.990177154541016, -25.146648406982422, -24.303117752075195, -23.4595890045166, -22.616058349609375, -21.77252960205078, -20.929000854492188, -20.08547019958496, -19.241939544677734, -18.39841079711914, -17.554880142211914, -16.71135139465332, -15.86782169342041, -15.0242919921875, -14.18076229095459, -13.33723258972168, -12.493703842163086, -11.650174140930176, -10.806644439697266, -9.963115692138672, -9.119585990905762, -8.276056289672852, -7.432526588439941, -6.5889973640441895, -5.7454681396484375, -4.901938438415527, -4.058409214019775, -3.2148795127868652, -2.371350049972534, -1.5278205871582031, -0.684290885925293, 0.15923833847045898, 1.0027680397033691, 1.8462975025177002, 2.6898269653320312, 3.5333566665649414, 4.376886367797852, 5.2204155921936035, 6.063945293426514, 6.907474517822266, 7.751004219055176]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 1.0, 4.0, 11.0, 12.0, 19.0, 20.0, 29.0, 37.0, 58.0, 66.0, 109.0, 114.0, 99.0, 77.0, 71.0, 68.0, 54.0, 43.0, 40.0, 20.0, 20.0, 10.0, 11.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.965963363647461, -13.643281936645508, -13.320601463317871, -12.997920036315918, -12.675239562988281, -12.352558135986328, -12.029876708984375, -11.707195281982422, -11.384514808654785, -11.061833381652832, -10.739152908325195, -10.416471481323242, -10.093790054321289, -9.771109580993652, -9.4484281539917, -9.125747680664062, -8.80306625366211, -8.480384826660156, -8.15770435333252, -7.835022926330566, -7.5123419761657715, -7.189661026000977, -6.866979598999023, -6.5442986488342285, -6.221617698669434, -5.898936748504639, -5.576255798339844, -5.253574371337891, -4.930893421173096, -4.608212471008301, -4.285531044006348, -3.9628500938415527, -3.6401681900024414, -3.3174872398376465, -2.9948060512542725, -2.6721248626708984, -2.3494439125061035, -2.0267629623413086, -1.7040817737579346, -1.3814005851745605, -1.0587196350097656, -0.7360385656356812, -0.4133574962615967, -0.09067642688751221, 0.23200464248657227, 0.5546857118606567, 0.8773667812347412, 1.2000479698181152, 1.5227289199829102, 1.8454099893569946, 2.168091058731079, 2.490772247314453, 2.813453197479248, 3.136134147644043, 3.458815336227417, 3.781496524810791, 4.104177474975586, 4.426858425140381, 4.749539375305176, 5.072220802307129, 5.394901752471924, 5.717582702636719, 6.040264129638672, 6.362945079803467, 6.685626029968262]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 21.0, 25.0, 94.0, 219.0, 1158.0, 3879492.0, 312215.0, 748.0, 172.0, 76.0, 24.0, 11.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-20.9375, -20.4385986328125, -19.939697265625, -19.4407958984375, -18.94189453125, -18.4429931640625, -17.944091796875, -17.4451904296875, -16.9462890625, -16.4473876953125, -15.948486328125, -15.4495849609375, -14.95068359375, -14.4517822265625, -13.952880859375, -13.4539794921875, -12.955078125, -12.4561767578125, -11.957275390625, -11.4583740234375, -10.95947265625, -10.4605712890625, -9.961669921875, -9.4627685546875, -8.9638671875, -8.4649658203125, -7.966064453125, -7.4671630859375, -6.96826171875, -6.4693603515625, -5.970458984375, -5.4715576171875, -4.97265625, -4.4737548828125, -3.974853515625, -3.4759521484375, -2.97705078125, -2.4781494140625, -1.979248046875, -1.4803466796875, -0.9814453125, -0.4825439453125, 0.016357421875, 0.5152587890625, 1.01416015625, 1.5130615234375, 2.011962890625, 2.5108642578125, 3.009765625, 3.5086669921875, 4.007568359375, 4.5064697265625, 5.00537109375, 5.5042724609375, 6.003173828125, 6.5020751953125, 7.0009765625, 7.4998779296875, 7.998779296875, 8.4976806640625, 8.99658203125, 9.4954833984375, 9.994384765625, 10.4932861328125, 10.9921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 31.0, 68.0, 149.0, 220.0, 234.0, 147.0, 77.0, 25.0, 17.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.58740234375, -0.5734062194824219, -0.5594100952148438, -0.5454139709472656, -0.5314178466796875, -0.5174217224121094, -0.5034255981445312, -0.4894294738769531, -0.475433349609375, -0.4614372253417969, -0.44744110107421875, -0.4334449768066406, -0.4194488525390625, -0.4054527282714844, -0.39145660400390625, -0.3774604797363281, -0.36346435546875, -0.3494682312011719, -0.33547210693359375, -0.3214759826660156, -0.3074798583984375, -0.2934837341308594, -0.27948760986328125, -0.2654914855957031, -0.251495361328125, -0.23749923706054688, -0.22350311279296875, -0.20950698852539062, -0.1955108642578125, -0.18151473999023438, -0.16751861572265625, -0.15352249145507812, -0.1395263671875, -0.12553024291992188, -0.11153411865234375, -0.09753799438476562, -0.0835418701171875, -0.06954574584960938, -0.05554962158203125, -0.041553497314453125, -0.027557373046875, -0.013561248779296875, 0.00043487548828125, 0.014430999755859375, 0.0284271240234375, 0.042423248291015625, 0.05641937255859375, 0.07041549682617188, 0.08441162109375, 0.09840774536132812, 0.11240386962890625, 0.12639999389648438, 0.1403961181640625, 0.15439224243164062, 0.16838836669921875, 0.18238449096679688, 0.196380615234375, 0.21037673950195312, 0.22437286376953125, 0.23836898803710938, 0.2523651123046875, 0.2663612365722656, 0.28035736083984375, 0.2943534851074219, 0.308349609375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 10.0, 15.0, 26.0, 37.0, 73.0, 123.0, 242.0, 414.0, 892.0, 2468.0, 10227.0, 88301.0, 3750747.0, 314346.0, 19920.0, 3936.0, 1251.0, 525.0, 272.0, 179.0, 97.0, 58.0, 31.0, 14.0, 20.0, 10.0, 11.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4140625, -1.356781005859375, -1.29949951171875, -1.242218017578125, -1.1849365234375, -1.127655029296875, -1.07037353515625, -1.013092041015625, -0.955810546875, -0.898529052734375, -0.84124755859375, -0.783966064453125, -0.7266845703125, -0.669403076171875, -0.61212158203125, -0.554840087890625, -0.49755859375, -0.440277099609375, -0.38299560546875, -0.325714111328125, -0.2684326171875, -0.211151123046875, -0.15386962890625, -0.096588134765625, -0.039306640625, 0.017974853515625, 0.07525634765625, 0.132537841796875, 0.1898193359375, 0.247100830078125, 0.30438232421875, 0.361663818359375, 0.4189453125, 0.476226806640625, 0.53350830078125, 0.590789794921875, 0.6480712890625, 0.705352783203125, 0.76263427734375, 0.819915771484375, 0.877197265625, 0.934478759765625, 0.99176025390625, 1.049041748046875, 1.1063232421875, 1.163604736328125, 1.22088623046875, 1.278167724609375, 1.33544921875, 1.392730712890625, 1.45001220703125, 1.507293701171875, 1.5645751953125, 1.621856689453125, 1.67913818359375, 1.736419677734375, 1.793701171875, 1.850982666015625, 1.90826416015625, 1.965545654296875, 2.0228271484375, 2.080108642578125, 2.13739013671875, 2.194671630859375, 2.251953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 8.0, 12.0, 18.0, 22.0, 23.0, 35.0, 58.0, 70.0, 91.0, 171.0, 316.0, 766.0, 1246.0, 518.0, 265.0, 133.0, 88.0, 61.0, 46.0, 25.0, 18.0, 16.0, 13.0, 6.0, 7.0, 4.0, 3.0, 0.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.296875, -0.28820037841796875, -0.2795257568359375, -0.27085113525390625, -0.262176513671875, -0.25350189208984375, -0.2448272705078125, -0.23615264892578125, -0.22747802734375, -0.21880340576171875, -0.2101287841796875, -0.20145416259765625, -0.192779541015625, -0.18410491943359375, -0.1754302978515625, -0.16675567626953125, -0.1580810546875, -0.14940643310546875, -0.1407318115234375, -0.13205718994140625, -0.123382568359375, -0.11470794677734375, -0.1060333251953125, -0.09735870361328125, -0.08868408203125, -0.08000946044921875, -0.0713348388671875, -0.06266021728515625, -0.053985595703125, -0.04531097412109375, -0.0366363525390625, -0.02796173095703125, -0.019287109375, -0.01061248779296875, -0.0019378662109375, 0.00673675537109375, 0.015411376953125, 0.02408599853515625, 0.0327606201171875, 0.04143524169921875, 0.05010986328125, 0.05878448486328125, 0.0674591064453125, 0.07613372802734375, 0.084808349609375, 0.09348297119140625, 0.1021575927734375, 0.11083221435546875, 0.1195068359375, 0.12818145751953125, 0.1368560791015625, 0.14553070068359375, 0.154205322265625, 0.16287994384765625, 0.1715545654296875, 0.18022918701171875, 0.18890380859375, 0.19757843017578125, 0.2062530517578125, 0.21492767333984375, 0.223602294921875, 0.23227691650390625, 0.2409515380859375, 0.24962615966796875, 0.25830078125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 13.0, 34.0, 123.0, 325.0, 332.0, 124.0, 36.0, 8.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2764358520507812, -2.1725354194641113, -2.0686349868774414, -1.964734435081482, -1.8608338832855225, -1.7569334506988525, -1.6530330181121826, -1.5491325855255127, -1.4452320337295532, -1.3413316011428833, -1.2374310493469238, -1.133530616760254, -1.029630184173584, -0.9257296323776245, -0.8218291997909546, -0.7179287075996399, -0.6140282154083252, -0.5101277232170105, -0.4062272608280182, -0.3023267984390259, -0.19842630624771118, -0.09452581405639648, 0.009374618530273438, 0.11327511072158813, 0.21717560291290283, 0.32107609510421753, 0.42497655749320984, 0.5288770198822021, 0.6327775120735168, 0.7366780042648315, 0.8405784368515015, 0.9444789290428162, 1.0483794212341309, 1.1522798538208008, 1.2561804056167603, 1.3600808382034302, 1.4639813899993896, 1.5678818225860596, 1.6717822551727295, 1.7756826877593994, 1.8795832395553589, 1.9834836721420288, 2.0873842239379883, 2.191284656524658, 2.295185089111328, 2.399085521697998, 2.502985954284668, 2.606886625289917, 2.710787057876587, 2.814687490463257, 2.9185879230499268, 3.022488594055176, 3.1263890266418457, 3.2302894592285156, 3.3341898918151855, 3.4380903244018555, 3.5419907569885254, 3.6458911895751953, 3.7497916221618652, 3.853692054748535, 3.957592725753784, 4.061492919921875, 4.165393829345703, 4.269294261932373, 4.373194694519043]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 0.0, 4.0, 3.0, 8.0, 5.0, 5.0, 10.0, 11.0, 5.0, 13.0, 17.0, 25.0, 23.0, 26.0, 30.0, 33.0, 30.0, 42.0, 42.0, 37.0, 41.0, 44.0, 46.0, 34.0, 34.0, 50.0, 27.0, 42.0, 45.0, 32.0, 33.0, 27.0, 27.0, 16.0, 21.0, 26.0, 16.0, 9.0, 13.0, 15.0, 9.0, 6.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.8889794945716858, -0.8624259829521179, -0.83587247133255, -0.809319019317627, -0.7827655076980591, -0.7562119960784912, -0.7296584844589233, -0.7031049728393555, -0.6765514612197876, -0.6499979496002197, -0.6234444379806519, -0.596890926361084, -0.5703374743461609, -0.543783962726593, -0.5172304511070251, -0.4906769394874573, -0.4641234874725342, -0.4375699758529663, -0.4110164940357208, -0.38446298241615295, -0.35790950059890747, -0.3313559889793396, -0.30480247735977173, -0.27824896574020386, -0.2516954839229584, -0.2251419872045517, -0.19858849048614502, -0.17203497886657715, -0.14548148214817047, -0.1189279854297638, -0.09237447381019592, -0.06582097709178925, -0.03926748037338257, -0.012713979929685593, 0.013839520514011383, 0.04039302468299866, 0.06694652140140533, 0.09350001811981201, 0.12005352973937988, 0.14660702645778656, 0.17316052317619324, 0.19971401989459991, 0.2262675166130066, 0.25282102823257446, 0.27937453985214233, 0.3059280216693878, 0.3324815332889557, 0.35903501510620117, 0.38558852672576904, 0.4121420383453369, 0.4386955201625824, 0.46524903178215027, 0.49180251359939575, 0.5183560252189636, 0.5449095368385315, 0.5714630484580994, 0.5980165004730225, 0.6245700120925903, 0.6511235237121582, 0.6776770353317261, 0.7042304873466492, 0.730783998966217, 0.7573375105857849, 0.7838910222053528, 0.8104445338249207]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 16.0, 20.0, 39.0, 52.0, 98.0, 233.0, 582.0, 1740.0, 7455.0, 555539.0, 473178.0, 6919.0, 1636.0, 565.0, 230.0, 114.0, 39.0, 28.0, 23.0, 8.0, 9.0, 8.0, 3.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66796875, -3.5567626953125, -3.445556640625, -3.3343505859375, -3.22314453125, -3.1119384765625, -3.000732421875, -2.8895263671875, -2.7783203125, -2.6671142578125, -2.555908203125, -2.4447021484375, -2.33349609375, -2.2222900390625, -2.111083984375, -1.9998779296875, -1.888671875, -1.7774658203125, -1.666259765625, -1.5550537109375, -1.44384765625, -1.3326416015625, -1.221435546875, -1.1102294921875, -0.9990234375, -0.8878173828125, -0.776611328125, -0.6654052734375, -0.55419921875, -0.4429931640625, -0.331787109375, -0.2205810546875, -0.109375, 0.0018310546875, 0.113037109375, 0.2242431640625, 0.33544921875, 0.4466552734375, 0.557861328125, 0.6690673828125, 0.7802734375, 0.8914794921875, 1.002685546875, 1.1138916015625, 1.22509765625, 1.3363037109375, 1.447509765625, 1.5587158203125, 1.669921875, 1.7811279296875, 1.892333984375, 2.0035400390625, 2.11474609375, 2.2259521484375, 2.337158203125, 2.4483642578125, 2.5595703125, 2.6707763671875, 2.781982421875, 2.8931884765625, 3.00439453125, 3.1156005859375, 3.226806640625, 3.3380126953125, 3.44921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 13.0, 27.0, 89.0, 164.0, 224.0, 228.0, 142.0, 65.0, 23.0, 11.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.61083984375, -0.5968894958496094, -0.5829391479492188, -0.5689888000488281, -0.5550384521484375, -0.5410881042480469, -0.5271377563476562, -0.5131874084472656, -0.499237060546875, -0.4852867126464844, -0.47133636474609375, -0.4573860168457031, -0.4434356689453125, -0.4294853210449219, -0.41553497314453125, -0.4015846252441406, -0.38763427734375, -0.3736839294433594, -0.35973358154296875, -0.3457832336425781, -0.3318328857421875, -0.3178825378417969, -0.30393218994140625, -0.2899818420410156, -0.276031494140625, -0.2620811462402344, -0.24813079833984375, -0.23418045043945312, -0.2202301025390625, -0.20627975463867188, -0.19232940673828125, -0.17837905883789062, -0.1644287109375, -0.15047836303710938, -0.13652801513671875, -0.12257766723632812, -0.1086273193359375, -0.09467697143554688, -0.08072662353515625, -0.06677627563476562, -0.052825927734375, -0.038875579833984375, -0.02492523193359375, -0.010974884033203125, 0.0029754638671875, 0.016925811767578125, 0.03087615966796875, 0.044826507568359375, 0.05877685546875, 0.07272720336914062, 0.08667755126953125, 0.10062789916992188, 0.1145782470703125, 0.12852859497070312, 0.14247894287109375, 0.15642929077148438, 0.170379638671875, 0.18432998657226562, 0.19828033447265625, 0.21223068237304688, 0.2261810302734375, 0.24013137817382812, 0.25408172607421875, 0.2680320739746094, 0.281982421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 4.0, 9.0, 17.0, 17.0, 26.0, 35.0, 48.0, 77.0, 103.0, 144.0, 209.0, 323.0, 450.0, 681.0, 1303.0, 2708.0, 7501.0, 30143.0, 180184.0, 586512.0, 192437.0, 31776.0, 7790.0, 2681.0, 1276.0, 721.0, 436.0, 310.0, 181.0, 115.0, 87.0, 80.0, 39.0, 35.0, 23.0, 23.0, 11.0, 7.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0732421875, -1.035614013671875, -0.99798583984375, -0.960357666015625, -0.9227294921875, -0.885101318359375, -0.84747314453125, -0.809844970703125, -0.772216796875, -0.734588623046875, -0.69696044921875, -0.659332275390625, -0.6217041015625, -0.584075927734375, -0.54644775390625, -0.508819580078125, -0.47119140625, -0.433563232421875, -0.39593505859375, -0.358306884765625, -0.3206787109375, -0.283050537109375, -0.24542236328125, -0.207794189453125, -0.170166015625, -0.132537841796875, -0.09490966796875, -0.057281494140625, -0.0196533203125, 0.017974853515625, 0.05560302734375, 0.093231201171875, 0.130859375, 0.168487548828125, 0.20611572265625, 0.243743896484375, 0.2813720703125, 0.319000244140625, 0.35662841796875, 0.394256591796875, 0.431884765625, 0.469512939453125, 0.50714111328125, 0.544769287109375, 0.5823974609375, 0.620025634765625, 0.65765380859375, 0.695281982421875, 0.73291015625, 0.770538330078125, 0.80816650390625, 0.845794677734375, 0.8834228515625, 0.921051025390625, 0.95867919921875, 0.996307373046875, 1.033935546875, 1.071563720703125, 1.10919189453125, 1.146820068359375, 1.1844482421875, 1.222076416015625, 1.25970458984375, 1.297332763671875, 1.3349609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 1.0, 8.0, 11.0, 14.0, 8.0, 12.0, 15.0, 22.0, 22.0, 30.0, 30.0, 35.0, 36.0, 37.0, 42.0, 40.0, 46.0, 52.0, 44.0, 45.0, 54.0, 28.0, 48.0, 39.0, 38.0, 33.0, 28.0, 24.0, 26.0, 18.0, 14.0, 11.0, 13.0, 13.0, 8.0, 8.0, 6.0, 4.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.84326171875, -0.81719970703125, -0.7911376953125, -0.76507568359375, -0.739013671875, -0.71295166015625, -0.6868896484375, -0.66082763671875, -0.634765625, -0.60870361328125, -0.5826416015625, -0.55657958984375, -0.530517578125, -0.50445556640625, -0.4783935546875, -0.45233154296875, -0.42626953125, -0.40020751953125, -0.3741455078125, -0.34808349609375, -0.322021484375, -0.29595947265625, -0.2698974609375, -0.24383544921875, -0.2177734375, -0.19171142578125, -0.1656494140625, -0.13958740234375, -0.113525390625, -0.08746337890625, -0.0614013671875, -0.03533935546875, -0.00927734375, 0.01678466796875, 0.0428466796875, 0.06890869140625, 0.094970703125, 0.12103271484375, 0.1470947265625, 0.17315673828125, 0.19921875, 0.22528076171875, 0.2513427734375, 0.27740478515625, 0.303466796875, 0.32952880859375, 0.3555908203125, 0.38165283203125, 0.40771484375, 0.43377685546875, 0.4598388671875, 0.48590087890625, 0.511962890625, 0.53802490234375, 0.5640869140625, 0.59014892578125, 0.6162109375, 0.64227294921875, 0.6683349609375, 0.69439697265625, 0.720458984375, 0.74652099609375, 0.7725830078125, 0.79864501953125, 0.82470703125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 18.0, 30.0, 106.0, 288.0, 1088.0, 14380.0, 1003668.0, 26957.0, 1393.0, 367.0, 126.0, 44.0, 28.0, 20.0, 7.0, 1.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.17578125, -2.12078857421875, -2.0657958984375, -2.01080322265625, -1.955810546875, -1.90081787109375, -1.8458251953125, -1.79083251953125, -1.73583984375, -1.68084716796875, -1.6258544921875, -1.57086181640625, -1.515869140625, -1.46087646484375, -1.4058837890625, -1.35089111328125, -1.2958984375, -1.24090576171875, -1.1859130859375, -1.13092041015625, -1.075927734375, -1.02093505859375, -0.9659423828125, -0.91094970703125, -0.85595703125, -0.80096435546875, -0.7459716796875, -0.69097900390625, -0.635986328125, -0.58099365234375, -0.5260009765625, -0.47100830078125, -0.416015625, -0.36102294921875, -0.3060302734375, -0.25103759765625, -0.196044921875, -0.14105224609375, -0.0860595703125, -0.03106689453125, 0.02392578125, 0.07891845703125, 0.1339111328125, 0.18890380859375, 0.243896484375, 0.29888916015625, 0.3538818359375, 0.40887451171875, 0.4638671875, 0.51885986328125, 0.5738525390625, 0.62884521484375, 0.683837890625, 0.73883056640625, 0.7938232421875, 0.84881591796875, 0.90380859375, 0.95880126953125, 1.0137939453125, 1.06878662109375, 1.123779296875, 1.17877197265625, 1.2337646484375, 1.28875732421875, 1.34375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 14.0, 10.0, 24.0, 47.0, 82.0, 106.0, 181.0, 166.0, 130.0, 93.0, 59.0, 27.0, 24.0, 9.0, 9.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5789947509765625e-05, -5.314406007528305e-05, -5.0498172640800476e-05, -4.78522852063179e-05, -4.520639777183533e-05, -4.256051033735275e-05, -3.991462290287018e-05, -3.7268735468387604e-05, -3.462284803390503e-05, -3.1976960599422455e-05, -2.933107316493988e-05, -2.6685185730457306e-05, -2.403929829597473e-05, -2.1393410861492157e-05, -1.8747523427009583e-05, -1.6101635992527008e-05, -1.3455748558044434e-05, -1.0809861123561859e-05, -8.163973689079285e-06, -5.51808625459671e-06, -2.8721988201141357e-06, -2.2631138563156128e-07, 2.419576048851013e-06, 5.065463483333588e-06, 7.711350917816162e-06, 1.0357238352298737e-05, 1.3003125786781311e-05, 1.5649013221263885e-05, 1.829490065574646e-05, 2.0940788090229034e-05, 2.358667552471161e-05, 2.6232562959194183e-05, 2.8878450393676758e-05, 3.152433782815933e-05, 3.417022526264191e-05, 3.681611269712448e-05, 3.9462000131607056e-05, 4.210788756608963e-05, 4.4753775000572205e-05, 4.739966243505478e-05, 5.0045549869537354e-05, 5.269143730401993e-05, 5.53373247385025e-05, 5.798321217298508e-05, 6.062909960746765e-05, 6.327498704195023e-05, 6.59208744764328e-05, 6.856676191091537e-05, 7.121264934539795e-05, 7.385853677988052e-05, 7.65044242143631e-05, 7.915031164884567e-05, 8.179619908332825e-05, 8.444208651781082e-05, 8.70879739522934e-05, 8.973386138677597e-05, 9.237974882125854e-05, 9.502563625574112e-05, 9.76715236902237e-05, 0.00010031741112470627, 0.00010296329855918884, 0.00010560918599367142, 0.00010825507342815399, 0.00011090096086263657, 0.00011354684829711914]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 0.0, 4.0, 3.0, 3.0, 8.0, 14.0, 23.0, 33.0, 37.0, 70.0, 121.0, 196.0, 348.0, 732.0, 1697.0, 5167.0, 29044.0, 411715.0, 550770.0, 38774.0, 6137.0, 1955.0, 811.0, 387.0, 168.0, 125.0, 63.0, 41.0, 30.0, 22.0, 18.0, 12.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.78759765625, -0.7637786865234375, -0.739959716796875, -0.7161407470703125, -0.69232177734375, -0.6685028076171875, -0.644683837890625, -0.6208648681640625, -0.5970458984375, -0.5732269287109375, -0.549407958984375, -0.5255889892578125, -0.50177001953125, -0.4779510498046875, -0.454132080078125, -0.4303131103515625, -0.406494140625, -0.3826751708984375, -0.358856201171875, -0.3350372314453125, -0.31121826171875, -0.2873992919921875, -0.263580322265625, -0.2397613525390625, -0.2159423828125, -0.1921234130859375, -0.168304443359375, -0.1444854736328125, -0.12066650390625, -0.0968475341796875, -0.073028564453125, -0.0492095947265625, -0.025390625, -0.0015716552734375, 0.022247314453125, 0.0460662841796875, 0.06988525390625, 0.0937042236328125, 0.117523193359375, 0.1413421630859375, 0.1651611328125, 0.1889801025390625, 0.212799072265625, 0.2366180419921875, 0.26043701171875, 0.2842559814453125, 0.308074951171875, 0.3318939208984375, 0.355712890625, 0.3795318603515625, 0.403350830078125, 0.4271697998046875, 0.45098876953125, 0.4748077392578125, 0.498626708984375, 0.5224456787109375, 0.5462646484375, 0.5700836181640625, 0.593902587890625, 0.6177215576171875, 0.64154052734375, 0.6653594970703125, 0.689178466796875, 0.7129974365234375, 0.73681640625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 9.0, 16.0, 18.0, 27.0, 30.0, 33.0, 47.0, 53.0, 80.0, 84.0, 79.0, 94.0, 84.0, 79.0, 71.0, 50.0, 32.0, 29.0, 12.0, 7.0, 18.0, 5.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4786643981933594, -0.46538543701171875, -0.4521064758300781, -0.4388275146484375, -0.4255485534667969, -0.41226959228515625, -0.3989906311035156, -0.385711669921875, -0.3724327087402344, -0.35915374755859375, -0.3458747863769531, -0.3325958251953125, -0.3193168640136719, -0.30603790283203125, -0.2927589416503906, -0.27947998046875, -0.2662010192871094, -0.25292205810546875, -0.23964309692382812, -0.2263641357421875, -0.21308517456054688, -0.19980621337890625, -0.18652725219726562, -0.173248291015625, -0.15996932983398438, -0.14669036865234375, -0.13341140747070312, -0.1201324462890625, -0.10685348510742188, -0.09357452392578125, -0.08029556274414062, -0.0670166015625, -0.053737640380859375, -0.04045867919921875, -0.027179718017578125, -0.0139007568359375, -0.000621795654296875, 0.01265716552734375, 0.025936126708984375, 0.039215087890625, 0.052494049072265625, 0.06577301025390625, 0.07905197143554688, 0.0923309326171875, 0.10560989379882812, 0.11888885498046875, 0.13216781616210938, 0.14544677734375, 0.15872573852539062, 0.17200469970703125, 0.18528366088867188, 0.1985626220703125, 0.21184158325195312, 0.22512054443359375, 0.23839950561523438, 0.251678466796875, 0.2649574279785156, 0.27823638916015625, 0.2915153503417969, 0.3047943115234375, 0.3180732727050781, 0.33135223388671875, 0.3446311950683594, 0.35791015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 52.0, 617.0, 310.0, 20.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.89696502685547, -55.858402252197266, -54.81983947753906, -53.781272888183594, -52.74271011352539, -51.70414733886719, -50.665584564208984, -49.62702178955078, -48.58845901489258, -47.549896240234375, -46.51133346557617, -45.47277069091797, -44.4342041015625, -43.3956413269043, -42.357078552246094, -41.31851577758789, -40.27995300292969, -39.241390228271484, -38.20282745361328, -37.16426086425781, -36.12569808959961, -35.087135314941406, -34.0485725402832, -33.010009765625, -31.97144317626953, -30.932880401611328, -29.894315719604492, -28.85575294494629, -27.817190170288086, -26.77862548828125, -25.740062713623047, -24.701499938964844, -23.662935256958008, -22.624372482299805, -21.58580780029297, -20.547245025634766, -19.508682250976562, -18.47011947631836, -17.431554794311523, -16.39299201965332, -15.3544282913208, -14.315864562988281, -13.277301788330078, -12.238738059997559, -11.200174331665039, -10.161611557006836, -9.123047828674316, -8.084484100341797, -7.045921325683594, -6.007358074188232, -4.968794822692871, -3.9302310943603516, -2.8916678428649902, -1.853104591369629, -0.8145408630371094, 0.22402238845825195, 1.2625856399536133, 2.3011488914489746, 3.339712381362915, 4.3782758712768555, 5.416839122772217, 6.455402374267578, 7.493966102600098, 8.532529830932617, 9.57109260559082]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 6.0, 11.0, 8.0, 12.0, 16.0, 17.0, 22.0, 24.0, 35.0, 36.0, 38.0, 43.0, 51.0, 54.0, 53.0, 53.0, 75.0, 47.0, 59.0, 57.0, 42.0, 26.0, 33.0, 40.0, 29.0, 24.0, 15.0, 18.0, 13.0, 12.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.507131099700928, -7.302495002746582, -7.097858905792236, -6.893222808837891, -6.688587188720703, -6.483950614929199, -6.279314994812012, -6.074678897857666, -5.87004280090332, -5.665406703948975, -5.460770606994629, -5.256134510040283, -5.0514984130859375, -4.84686279296875, -4.642226696014404, -4.437590599060059, -4.232954502105713, -4.028318405151367, -3.8236823081970215, -3.619046449661255, -3.414410352706909, -3.2097742557525635, -3.005138397216797, -2.800502300262451, -2.5958662033081055, -2.3912301063537598, -2.186594009399414, -1.9819581508636475, -1.7773220539093018, -1.572685956954956, -1.3680499792099, -1.1634140014648438, -0.958777904510498, -0.7541418671607971, -0.5495058298110962, -0.34486979246139526, -0.14023375511169434, 0.06440234184265137, 0.2690383195877075, 0.47367429733276367, 0.6783103942871094, 0.8829464316368103, 1.0875824689865112, 1.2922184467315674, 1.496854543685913, 1.7014906406402588, 1.906126618385315, 2.110762596130371, 2.315398693084717, 2.5200347900390625, 2.724670886993408, 2.929306745529175, 3.1339428424835205, 3.338578939437866, 3.543214797973633, 3.7478508949279785, 3.952486991882324, 4.15712308883667, 4.361759185791016, 4.566395282745361, 4.771031379699707, 4.9756669998168945, 5.18030309677124, 5.384939193725586, 5.589575290679932]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 8.0, 1.0, 5.0, 10.0, 9.0, 21.0, 32.0, 39.0, 72.0, 106.0, 204.0, 499.0, 1282.0, 5247.0, 90323.0, 4070113.0, 22348.0, 2699.0, 729.0, 263.0, 121.0, 63.0, 26.0, 23.0, 13.0, 5.0, 9.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.412750244140625, -4.30596923828125, -4.199188232421875, -4.0924072265625, -3.985626220703125, -3.87884521484375, -3.772064208984375, -3.665283203125, -3.558502197265625, -3.45172119140625, -3.344940185546875, -3.2381591796875, -3.131378173828125, -3.02459716796875, -2.917816162109375, -2.81103515625, -2.704254150390625, -2.59747314453125, -2.490692138671875, -2.3839111328125, -2.277130126953125, -2.17034912109375, -2.063568115234375, -1.956787109375, -1.850006103515625, -1.74322509765625, -1.636444091796875, -1.5296630859375, -1.422882080078125, -1.31610107421875, -1.209320068359375, -1.1025390625, -0.995758056640625, -0.88897705078125, -0.782196044921875, -0.6754150390625, -0.568634033203125, -0.46185302734375, -0.355072021484375, -0.248291015625, -0.141510009765625, -0.03472900390625, 0.072052001953125, 0.1788330078125, 0.285614013671875, 0.39239501953125, 0.499176025390625, 0.60595703125, 0.712738037109375, 0.81951904296875, 0.926300048828125, 1.0330810546875, 1.139862060546875, 1.24664306640625, 1.353424072265625, 1.460205078125, 1.566986083984375, 1.67376708984375, 1.780548095703125, 1.8873291015625, 1.994110107421875, 2.10089111328125, 2.207672119140625, 2.314453125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 18.0, 33.0, 66.0, 104.0, 148.0, 170.0, 153.0, 147.0, 75.0, 37.0, 17.0, 14.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.623046875, -0.6087684631347656, -0.5944900512695312, -0.5802116394042969, -0.5659332275390625, -0.5516548156738281, -0.5373764038085938, -0.5230979919433594, -0.508819580078125, -0.4945411682128906, -0.48026275634765625, -0.4659843444824219, -0.4517059326171875, -0.4374275207519531, -0.42314910888671875, -0.4088706970214844, -0.39459228515625, -0.3803138732910156, -0.36603546142578125, -0.3517570495605469, -0.3374786376953125, -0.3232002258300781, -0.30892181396484375, -0.2946434020996094, -0.280364990234375, -0.2660865783691406, -0.25180816650390625, -0.23752975463867188, -0.2232513427734375, -0.20897293090820312, -0.19469451904296875, -0.18041610717773438, -0.1661376953125, -0.15185928344726562, -0.13758087158203125, -0.12330245971679688, -0.1090240478515625, -0.09474563598632812, -0.08046722412109375, -0.06618881225585938, -0.051910400390625, -0.037631988525390625, -0.02335357666015625, -0.009075164794921875, 0.0052032470703125, 0.019481658935546875, 0.03376007080078125, 0.048038482666015625, 0.06231689453125, 0.07659530639648438, 0.09087371826171875, 0.10515213012695312, 0.1194305419921875, 0.13370895385742188, 0.14798736572265625, 0.16226577758789062, 0.176544189453125, 0.19082260131835938, 0.20510101318359375, 0.21937942504882812, 0.2336578369140625, 0.24793624877929688, 0.26221466064453125, 0.2764930725097656, 0.290771484375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 2.0, 9.0, 16.0, 25.0, 26.0, 30.0, 56.0, 82.0, 160.0, 293.0, 666.0, 1483.0, 4489.0, 18710.0, 188098.0, 3792547.0, 165492.0, 16342.0, 3634.0, 1198.0, 491.0, 197.0, 84.0, 56.0, 31.0, 13.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.8056182861328125, -1.758697509765625, -1.7117767333984375, -1.66485595703125, -1.6179351806640625, -1.571014404296875, -1.5240936279296875, -1.4771728515625, -1.4302520751953125, -1.383331298828125, -1.3364105224609375, -1.28948974609375, -1.2425689697265625, -1.195648193359375, -1.1487274169921875, -1.101806640625, -1.0548858642578125, -1.007965087890625, -0.9610443115234375, -0.91412353515625, -0.8672027587890625, -0.820281982421875, -0.7733612060546875, -0.7264404296875, -0.6795196533203125, -0.632598876953125, -0.5856781005859375, -0.53875732421875, -0.4918365478515625, -0.444915771484375, -0.3979949951171875, -0.35107421875, -0.3041534423828125, -0.257232666015625, -0.2103118896484375, -0.16339111328125, -0.1164703369140625, -0.069549560546875, -0.0226287841796875, 0.0242919921875, 0.0712127685546875, 0.118133544921875, 0.1650543212890625, 0.21197509765625, 0.2588958740234375, 0.305816650390625, 0.3527374267578125, 0.399658203125, 0.4465789794921875, 0.493499755859375, 0.5404205322265625, 0.58734130859375, 0.6342620849609375, 0.681182861328125, 0.7281036376953125, 0.7750244140625, 0.8219451904296875, 0.868865966796875, 0.9157867431640625, 0.96270751953125, 1.0096282958984375, 1.056549072265625, 1.1034698486328125, 1.150390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 11.0, 17.0, 14.0, 26.0, 36.0, 53.0, 85.0, 138.0, 320.0, 849.0, 1501.0, 527.0, 212.0, 116.0, 42.0, 49.0, 15.0, 18.0, 12.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5068359375, -0.4945335388183594, -0.48223114013671875, -0.4699287414550781, -0.4576263427734375, -0.4453239440917969, -0.43302154541015625, -0.4207191467285156, -0.408416748046875, -0.3961143493652344, -0.38381195068359375, -0.3715095520019531, -0.3592071533203125, -0.3469047546386719, -0.33460235595703125, -0.3222999572753906, -0.30999755859375, -0.2976951599121094, -0.28539276123046875, -0.2730903625488281, -0.2607879638671875, -0.24848556518554688, -0.23618316650390625, -0.22388076782226562, -0.211578369140625, -0.19927597045898438, -0.18697357177734375, -0.17467117309570312, -0.1623687744140625, -0.15006637573242188, -0.13776397705078125, -0.12546157836914062, -0.1131591796875, -0.10085678100585938, -0.08855438232421875, -0.07625198364257812, -0.0639495849609375, -0.051647186279296875, -0.03934478759765625, -0.027042388916015625, -0.014739990234375, -0.002437591552734375, 0.00986480712890625, 0.022167205810546875, 0.0344696044921875, 0.046772003173828125, 0.05907440185546875, 0.07137680053710938, 0.08367919921875, 0.09598159790039062, 0.10828399658203125, 0.12058639526367188, 0.1328887939453125, 0.14519119262695312, 0.15749359130859375, 0.16979598999023438, 0.182098388671875, 0.19440078735351562, 0.20670318603515625, 0.21900558471679688, 0.2313079833984375, 0.24361038208007812, 0.25591278076171875, 0.2682151794433594, 0.280517578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 47.0, 242.0, 488.0, 186.0, 32.0, 8.0, 0.0, 2.0], "bins": [-9.454107284545898, -9.292083740234375, -9.130060195922852, -8.968036651611328, -8.806012153625488, -8.643988609313965, -8.481965065002441, -8.319941520690918, -8.157917976379395, -7.995894432067871, -7.8338704109191895, -7.671846866607666, -7.509823322296143, -7.347799301147461, -7.1857757568359375, -7.023752212524414, -6.861728191375732, -6.699704647064209, -6.537680625915527, -6.375657081604004, -6.2136335372924805, -6.051609992980957, -5.889585971832275, -5.727562427520752, -5.56553840637207, -5.403514862060547, -5.241490840911865, -5.079467296600342, -4.917443752288818, -4.755419731140137, -4.593396186828613, -4.43137264251709, -4.269349098205566, -4.107325553894043, -3.9453017711639404, -3.783277988433838, -3.6212544441223145, -3.459230661392212, -3.2972068786621094, -3.135183334350586, -2.9731593132019043, -2.8111355304718018, -2.6491119861602783, -2.487088203430176, -2.3250646591186523, -2.16304087638855, -2.0010170936584473, -1.8389934301376343, -1.6769698858261108, -1.5149462223052979, -1.3529224395751953, -1.1908987760543823, -1.0288751125335693, -0.8668514490127563, -0.7048277258872986, -0.5428040027618408, -0.38078033924102783, -0.21875664591789246, -0.05673295259475708, 0.1052907407283783, 0.26731443405151367, 0.42933809757232666, 0.5913618206977844, 0.7533855438232422, 0.9154092073440552]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 8.0, 5.0, 12.0, 15.0, 16.0, 17.0, 16.0, 23.0, 23.0, 33.0, 39.0, 37.0, 47.0, 41.0, 58.0, 39.0, 52.0, 46.0, 46.0, 34.0, 43.0, 41.0, 47.0, 46.0, 38.0, 23.0, 31.0, 25.0, 19.0, 18.0, 13.0, 10.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.303438425064087, -1.2693150043487549, -1.2351917028427124, -1.2010682821273804, -1.1669448614120483, -1.1328215599060059, -1.0986981391906738, -1.0645747184753418, -1.0304512977600098, -0.9963279366493225, -0.9622045159339905, -0.9280811548233032, -0.8939577341079712, -0.8598343729972839, -0.8257110118865967, -0.7915875911712646, -0.7574642896652222, -0.7233409285545349, -0.6892175078392029, -0.6550941467285156, -0.6209707260131836, -0.5868473649024963, -0.5527240037918091, -0.518600583076477, -0.4844772219657898, -0.45035383105278015, -0.4162304401397705, -0.38210707902908325, -0.3479836881160736, -0.31386029720306396, -0.2797369360923767, -0.24561354517936707, -0.21149015426635742, -0.17736676335334778, -0.14324338734149933, -0.10912000387907028, -0.07499662041664124, -0.04087322950363159, -0.006749853491783142, 0.027373522520065308, 0.06149691343307495, 0.095620296895504, 0.12974368035793304, 0.1638670563697815, 0.19799044728279114, 0.23211383819580078, 0.26623719930648804, 0.3003605902194977, 0.3344839811325073, 0.36860737204551697, 0.4027307629585266, 0.43685412406921387, 0.4709775149822235, 0.5051009058952332, 0.5392242670059204, 0.5733476877212524, 0.6074710488319397, 0.641594409942627, 0.675717830657959, 0.7098411917686462, 0.7439645528793335, 0.7780879735946655, 0.8122113347053528, 0.84633469581604, 0.8804581165313721]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 10.0, 13.0, 10.0, 19.0, 30.0, 37.0, 49.0, 64.0, 90.0, 148.0, 231.0, 350.0, 555.0, 900.0, 1612.0, 3539.0, 11610.0, 67344.0, 474776.0, 414380.0, 55444.0, 10018.0, 3295.0, 1547.0, 908.0, 534.0, 342.0, 229.0, 165.0, 93.0, 62.0, 39.0, 21.0, 31.0, 12.0, 17.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.01171875, -0.97552490234375, -0.9393310546875, -0.90313720703125, -0.866943359375, -0.83074951171875, -0.7945556640625, -0.75836181640625, -0.72216796875, -0.68597412109375, -0.6497802734375, -0.61358642578125, -0.577392578125, -0.54119873046875, -0.5050048828125, -0.46881103515625, -0.4326171875, -0.39642333984375, -0.3602294921875, -0.32403564453125, -0.287841796875, -0.25164794921875, -0.2154541015625, -0.17926025390625, -0.14306640625, -0.10687255859375, -0.0706787109375, -0.03448486328125, 0.001708984375, 0.03790283203125, 0.0740966796875, 0.11029052734375, 0.146484375, 0.18267822265625, 0.2188720703125, 0.25506591796875, 0.291259765625, 0.32745361328125, 0.3636474609375, 0.39984130859375, 0.43603515625, 0.47222900390625, 0.5084228515625, 0.54461669921875, 0.580810546875, 0.61700439453125, 0.6531982421875, 0.68939208984375, 0.7255859375, 0.76177978515625, 0.7979736328125, 0.83416748046875, 0.870361328125, 0.90655517578125, 0.9427490234375, 0.97894287109375, 1.01513671875, 1.05133056640625, 1.0875244140625, 1.12371826171875, 1.159912109375, 1.19610595703125, 1.2322998046875, 1.26849365234375, 1.3046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 17.0, 34.0, 61.0, 112.0, 149.0, 170.0, 172.0, 119.0, 76.0, 45.0, 17.0, 10.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6083984375, -0.5941200256347656, -0.5798416137695312, -0.5655632019042969, -0.5512847900390625, -0.5370063781738281, -0.5227279663085938, -0.5084495544433594, -0.494171142578125, -0.4798927307128906, -0.46561431884765625, -0.4513359069824219, -0.4370574951171875, -0.4227790832519531, -0.40850067138671875, -0.3942222595214844, -0.37994384765625, -0.3656654357910156, -0.35138702392578125, -0.3371086120605469, -0.3228302001953125, -0.3085517883300781, -0.29427337646484375, -0.2799949645996094, -0.265716552734375, -0.2514381408691406, -0.23715972900390625, -0.22288131713867188, -0.2086029052734375, -0.19432449340820312, -0.18004608154296875, -0.16576766967773438, -0.1514892578125, -0.13721084594726562, -0.12293243408203125, -0.10865402221679688, -0.0943756103515625, -0.08009719848632812, -0.06581878662109375, -0.051540374755859375, -0.037261962890625, -0.022983551025390625, -0.00870513916015625, 0.005573272705078125, 0.0198516845703125, 0.034130096435546875, 0.04840850830078125, 0.06268692016601562, 0.07696533203125, 0.09124374389648438, 0.10552215576171875, 0.11980056762695312, 0.1340789794921875, 0.14835739135742188, 0.16263580322265625, 0.17691421508789062, 0.191192626953125, 0.20547103881835938, 0.21974945068359375, 0.23402786254882812, 0.2483062744140625, 0.2625846862792969, 0.27686309814453125, 0.2911415100097656, 0.305419921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 9.0, 10.0, 14.0, 18.0, 24.0, 35.0, 48.0, 74.0, 121.0, 174.0, 218.0, 327.0, 504.0, 891.0, 1574.0, 3119.0, 8001.0, 24631.0, 99735.0, 411115.0, 374681.0, 87318.0, 21970.0, 7158.0, 2919.0, 1456.0, 865.0, 481.0, 318.0, 198.0, 164.0, 105.0, 78.0, 49.0, 37.0, 36.0, 23.0, 16.0, 7.0, 5.0, 3.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.0400390625, -1.0074920654296875, -0.974945068359375, -0.9423980712890625, -0.90985107421875, -0.8773040771484375, -0.844757080078125, -0.8122100830078125, -0.7796630859375, -0.7471160888671875, -0.714569091796875, -0.6820220947265625, -0.64947509765625, -0.6169281005859375, -0.584381103515625, -0.5518341064453125, -0.519287109375, -0.4867401123046875, -0.454193115234375, -0.4216461181640625, -0.38909912109375, -0.3565521240234375, -0.324005126953125, -0.2914581298828125, -0.2589111328125, -0.2263641357421875, -0.193817138671875, -0.1612701416015625, -0.12872314453125, -0.0961761474609375, -0.063629150390625, -0.0310821533203125, 0.00146484375, 0.0340118408203125, 0.066558837890625, 0.0991058349609375, 0.13165283203125, 0.1641998291015625, 0.196746826171875, 0.2292938232421875, 0.2618408203125, 0.2943878173828125, 0.326934814453125, 0.3594818115234375, 0.39202880859375, 0.4245758056640625, 0.457122802734375, 0.4896697998046875, 0.522216796875, 0.5547637939453125, 0.587310791015625, 0.6198577880859375, 0.65240478515625, 0.6849517822265625, 0.717498779296875, 0.7500457763671875, 0.7825927734375, 0.8151397705078125, 0.847686767578125, 0.8802337646484375, 0.91278076171875, 0.9453277587890625, 0.977874755859375, 1.0104217529296875, 1.04296875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 4.0, 6.0, 16.0, 20.0, 14.0, 12.0, 25.0, 34.0, 29.0, 42.0, 38.0, 41.0, 55.0, 45.0, 57.0, 58.0, 60.0, 56.0, 49.0, 46.0, 33.0, 56.0, 30.0, 28.0, 33.0, 28.0, 17.0, 11.0, 14.0, 7.0, 11.0, 8.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3095703125, -1.2720489501953125, -1.234527587890625, -1.1970062255859375, -1.15948486328125, -1.1219635009765625, -1.084442138671875, -1.0469207763671875, -1.0093994140625, -0.9718780517578125, -0.934356689453125, -0.8968353271484375, -0.85931396484375, -0.8217926025390625, -0.784271240234375, -0.7467498779296875, -0.709228515625, -0.6717071533203125, -0.634185791015625, -0.5966644287109375, -0.55914306640625, -0.5216217041015625, -0.484100341796875, -0.4465789794921875, -0.4090576171875, -0.3715362548828125, -0.334014892578125, -0.2964935302734375, -0.25897216796875, -0.2214508056640625, -0.183929443359375, -0.1464080810546875, -0.10888671875, -0.0713653564453125, -0.033843994140625, 0.0036773681640625, 0.04119873046875, 0.0787200927734375, 0.116241455078125, 0.1537628173828125, 0.1912841796875, 0.2288055419921875, 0.266326904296875, 0.3038482666015625, 0.34136962890625, 0.3788909912109375, 0.416412353515625, 0.4539337158203125, 0.491455078125, 0.5289764404296875, 0.566497802734375, 0.6040191650390625, 0.64154052734375, 0.6790618896484375, 0.716583251953125, 0.7541046142578125, 0.7916259765625, 0.8291473388671875, 0.866668701171875, 0.9041900634765625, 0.94171142578125, 0.9792327880859375, 1.016754150390625, 1.0542755126953125, 1.091796875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 9.0, 8.0, 16.0, 42.0, 110.0, 273.0, 1053.0, 7735.0, 583130.0, 447973.0, 6853.0, 924.0, 255.0, 94.0, 44.0, 16.0, 11.0, 7.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0245361328125, -0.991455078125, -0.9583740234375, -0.92529296875, -0.8922119140625, -0.859130859375, -0.8260498046875, -0.79296875, -0.7598876953125, -0.726806640625, -0.6937255859375, -0.66064453125, -0.6275634765625, -0.594482421875, -0.5614013671875, -0.5283203125, -0.4952392578125, -0.462158203125, -0.4290771484375, -0.39599609375, -0.3629150390625, -0.329833984375, -0.2967529296875, -0.263671875, -0.2305908203125, -0.197509765625, -0.1644287109375, -0.13134765625, -0.0982666015625, -0.065185546875, -0.0321044921875, 0.0009765625, 0.0340576171875, 0.067138671875, 0.1002197265625, 0.13330078125, 0.1663818359375, 0.199462890625, 0.2325439453125, 0.265625, 0.2987060546875, 0.331787109375, 0.3648681640625, 0.39794921875, 0.4310302734375, 0.464111328125, 0.4971923828125, 0.5302734375, 0.5633544921875, 0.596435546875, 0.6295166015625, 0.66259765625, 0.6956787109375, 0.728759765625, 0.7618408203125, 0.794921875, 0.8280029296875, 0.861083984375, 0.8941650390625, 0.92724609375, 0.9603271484375, 0.993408203125, 1.0264892578125, 1.0595703125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 4.0, 7.0, 7.0, 12.0, 19.0, 12.0, 33.0, 28.0, 39.0, 56.0, 55.0, 80.0, 91.0, 107.0, 91.0, 73.0, 78.0, 64.0, 45.0, 21.0, 18.0, 25.0, 14.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.357099533081055e-05, -4.216376692056656e-05, -4.075653851032257e-05, -3.934931010007858e-05, -3.7942081689834595e-05, -3.653485327959061e-05, -3.512762486934662e-05, -3.372039645910263e-05, -3.231316804885864e-05, -3.0905939638614655e-05, -2.9498711228370667e-05, -2.809148281812668e-05, -2.668425440788269e-05, -2.5277025997638702e-05, -2.3869797587394714e-05, -2.2462569177150726e-05, -2.1055340766906738e-05, -1.964811235666275e-05, -1.8240883946418762e-05, -1.6833655536174774e-05, -1.5426427125930786e-05, -1.4019198715686798e-05, -1.261197030544281e-05, -1.1204741895198822e-05, -9.797513484954834e-06, -8.390285074710846e-06, -6.983056664466858e-06, -5.57582825422287e-06, -4.168599843978882e-06, -2.761371433734894e-06, -1.3541430234909058e-06, 5.3085386753082275e-08, 1.4603137969970703e-06, 2.8675422072410583e-06, 4.274770617485046e-06, 5.6819990277290344e-06, 7.0892274379730225e-06, 8.49645584821701e-06, 9.903684258460999e-06, 1.1310912668704987e-05, 1.2718141078948975e-05, 1.4125369489192963e-05, 1.553259789943695e-05, 1.693982630968094e-05, 1.8347054719924927e-05, 1.9754283130168915e-05, 2.1161511540412903e-05, 2.256873995065689e-05, 2.397596836090088e-05, 2.5383196771144867e-05, 2.6790425181388855e-05, 2.8197653591632843e-05, 2.960488200187683e-05, 3.101211041212082e-05, 3.241933882236481e-05, 3.3826567232608795e-05, 3.523379564285278e-05, 3.664102405309677e-05, 3.804825246334076e-05, 3.945548087358475e-05, 4.0862709283828735e-05, 4.2269937694072723e-05, 4.367716610431671e-05, 4.50843945145607e-05, 4.649162292480469e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 13.0, 28.0, 44.0, 86.0, 182.0, 441.0, 1572.0, 8858.0, 239519.0, 769523.0, 24283.0, 2799.0, 697.0, 259.0, 105.0, 49.0, 38.0, 14.0, 14.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7238388061523438, -0.6981658935546875, -0.6724929809570312, -0.646820068359375, -0.6211471557617188, -0.5954742431640625, -0.5698013305664062, -0.54412841796875, -0.5184555053710938, -0.4927825927734375, -0.46710968017578125, -0.441436767578125, -0.41576385498046875, -0.3900909423828125, -0.36441802978515625, -0.3387451171875, -0.31307220458984375, -0.2873992919921875, -0.26172637939453125, -0.236053466796875, -0.21038055419921875, -0.1847076416015625, -0.15903472900390625, -0.13336181640625, -0.10768890380859375, -0.0820159912109375, -0.05634307861328125, -0.030670166015625, -0.00499725341796875, 0.0206756591796875, 0.04634857177734375, 0.072021484375, 0.09769439697265625, 0.1233673095703125, 0.14904022216796875, 0.174713134765625, 0.20038604736328125, 0.2260589599609375, 0.25173187255859375, 0.27740478515625, 0.30307769775390625, 0.3287506103515625, 0.35442352294921875, 0.380096435546875, 0.40576934814453125, 0.4314422607421875, 0.45711517333984375, 0.4827880859375, 0.5084609985351562, 0.5341339111328125, 0.5598068237304688, 0.585479736328125, 0.6111526489257812, 0.6368255615234375, 0.6624984741210938, 0.68817138671875, 0.7138442993164062, 0.7395172119140625, 0.7651901245117188, 0.790863037109375, 0.8165359497070312, 0.8422088623046875, 0.8678817749023438, 0.8935546875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 11.0, 20.0, 24.0, 47.0, 66.0, 119.0, 153.0, 146.0, 128.0, 122.0, 68.0, 33.0, 22.0, 22.0, 10.0, 9.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.215545654296875, -0.19818115234375, -0.180816650390625, -0.1634521484375, -0.146087646484375, -0.12872314453125, -0.111358642578125, -0.093994140625, -0.076629638671875, -0.05926513671875, -0.041900634765625, -0.0245361328125, -0.007171630859375, 0.01019287109375, 0.027557373046875, 0.044921875, 0.062286376953125, 0.07965087890625, 0.097015380859375, 0.1143798828125, 0.131744384765625, 0.14910888671875, 0.166473388671875, 0.183837890625, 0.201202392578125, 0.21856689453125, 0.235931396484375, 0.2532958984375, 0.270660400390625, 0.28802490234375, 0.305389404296875, 0.32275390625, 0.340118408203125, 0.35748291015625, 0.374847412109375, 0.3922119140625, 0.409576416015625, 0.42694091796875, 0.444305419921875, 0.461669921875, 0.479034423828125, 0.49639892578125, 0.513763427734375, 0.5311279296875, 0.548492431640625, 0.56585693359375, 0.583221435546875, 0.6005859375, 0.617950439453125, 0.63531494140625, 0.652679443359375, 0.6700439453125, 0.687408447265625, 0.70477294921875, 0.722137451171875, 0.739501953125, 0.756866455078125, 0.77423095703125, 0.791595458984375, 0.8089599609375, 0.826324462890625, 0.84368896484375, 0.861053466796875, 0.87841796875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 36.0, 287.0, 520.0, 123.0, 28.0, 10.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.64372253417969, -39.88019943237305, -39.11667251586914, -38.3531494140625, -37.589622497558594, -36.82609939575195, -36.06257629394531, -35.299049377441406, -34.535526275634766, -33.772003173828125, -33.00847625732422, -32.24495315551758, -31.481428146362305, -30.71790313720703, -29.954378128051758, -29.190853118896484, -28.427330017089844, -27.66380500793457, -26.900279998779297, -26.136756896972656, -25.373231887817383, -24.60970687866211, -23.846181869506836, -23.082656860351562, -22.31913185119629, -21.555606842041016, -20.792081832885742, -20.0285587310791, -19.265033721923828, -18.501508712768555, -17.73798370361328, -16.97446060180664, -16.210935592651367, -15.447410583496094, -14.683886528015137, -13.920361518859863, -13.156837463378906, -12.393312454223633, -11.62978744506836, -10.866263389587402, -10.102739334106445, -9.339214324951172, -8.575690269470215, -7.812165260314941, -7.048641204833984, -6.285116195678711, -5.521591663360596, -4.7580671310424805, -3.994542121887207, -3.231017589569092, -2.4674930572509766, -1.7039682865142822, -0.940443754196167, -0.17691922187805176, 0.5866055488586426, 1.3501300811767578, 2.113654613494873, 2.8771791458129883, 3.6407036781311035, 4.404228210449219, 5.167753219604492, 5.931277275085449, 6.694802284240723, 7.458326816558838, 8.221851348876953]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 5.0, 8.0, 6.0, 10.0, 10.0, 15.0, 8.0, 14.0, 24.0, 25.0, 26.0, 15.0, 30.0, 30.0, 31.0, 40.0, 36.0, 37.0, 46.0, 63.0, 50.0, 50.0, 42.0, 36.0, 41.0, 35.0, 39.0, 24.0, 27.0, 17.0, 30.0, 18.0, 11.0, 12.0, 16.0, 14.0, 11.0, 8.0, 5.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.682868957519531, -5.49736213684082, -5.311855316162109, -5.126348495483398, -4.9408416748046875, -4.755334854125977, -4.569828033447266, -4.384321212768555, -4.198814392089844, -4.013307571411133, -3.827800750732422, -3.642293930053711, -3.456787109375, -3.271280288696289, -3.085773229598999, -2.900266408920288, -2.714759349822998, -2.529252529144287, -2.343745708465576, -2.1582388877868652, -1.9727319478988647, -1.7872251272201538, -1.6017181873321533, -1.4162113666534424, -1.2307045459747314, -1.0451977252960205, -0.8596908450126648, -0.6741839647293091, -0.48867714405059814, -0.3031703233718872, -0.11766338348388672, 0.06784343719482422, 0.25335025787353516, 0.4388571083545685, 0.6243639588356018, 0.8098708391189575, 0.9953776597976685, 1.1808844804763794, 1.3663914203643799, 1.5518982410430908, 1.7374050617218018, 1.9229118824005127, 2.1084187030792236, 2.2939257621765137, 2.4794325828552246, 2.6649394035339355, 2.8504462242126465, 3.0359530448913574, 3.2214598655700684, 3.4069666862487793, 3.5924735069274902, 3.777980327606201, 3.963487148284912, 4.148993968963623, 4.334501266479492, 4.520008087158203, 4.705514907836914, 4.891021728515625, 5.076528549194336, 5.262035369873047, 5.447542190551758, 5.633049011230469, 5.81855583190918, 6.004062652587891, 6.189569473266602]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 9.0, 8.0, 11.0, 10.0, 17.0, 18.0, 43.0, 62.0, 106.0, 192.0, 378.0, 1135.0, 4979.0, 72184.0, 4086295.0, 24465.0, 2990.0, 787.0, 282.0, 140.0, 79.0, 43.0, 22.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.33984375, -3.260986328125, -3.18212890625, -3.103271484375, -3.0244140625, -2.945556640625, -2.86669921875, -2.787841796875, -2.708984375, -2.630126953125, -2.55126953125, -2.472412109375, -2.3935546875, -2.314697265625, -2.23583984375, -2.156982421875, -2.078125, -1.999267578125, -1.92041015625, -1.841552734375, -1.7626953125, -1.683837890625, -1.60498046875, -1.526123046875, -1.447265625, -1.368408203125, -1.28955078125, -1.210693359375, -1.1318359375, -1.052978515625, -0.97412109375, -0.895263671875, -0.81640625, -0.737548828125, -0.65869140625, -0.579833984375, -0.5009765625, -0.422119140625, -0.34326171875, -0.264404296875, -0.185546875, -0.106689453125, -0.02783203125, 0.051025390625, 0.1298828125, 0.208740234375, 0.28759765625, 0.366455078125, 0.4453125, 0.524169921875, 0.60302734375, 0.681884765625, 0.7607421875, 0.839599609375, 0.91845703125, 0.997314453125, 1.076171875, 1.155029296875, 1.23388671875, 1.312744140625, 1.3916015625, 1.470458984375, 1.54931640625, 1.628173828125, 1.70703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 12.0, 25.0, 51.0, 68.0, 89.0, 133.0, 120.0, 149.0, 119.0, 74.0, 56.0, 45.0, 23.0, 10.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.6103515625, -0.5967369079589844, -0.5831222534179688, -0.5695075988769531, -0.5558929443359375, -0.5422782897949219, -0.5286636352539062, -0.5150489807128906, -0.501434326171875, -0.4878196716308594, -0.47420501708984375, -0.4605903625488281, -0.4469757080078125, -0.4333610534667969, -0.41974639892578125, -0.4061317443847656, -0.39251708984375, -0.3789024353027344, -0.36528778076171875, -0.3516731262207031, -0.3380584716796875, -0.3244438171386719, -0.31082916259765625, -0.2972145080566406, -0.283599853515625, -0.2699851989746094, -0.25637054443359375, -0.24275588989257812, -0.2291412353515625, -0.21552658081054688, -0.20191192626953125, -0.18829727172851562, -0.1746826171875, -0.16106796264648438, -0.14745330810546875, -0.13383865356445312, -0.1202239990234375, -0.10660934448242188, -0.09299468994140625, -0.07938003540039062, -0.065765380859375, -0.052150726318359375, -0.03853607177734375, -0.024921417236328125, -0.0113067626953125, 0.002307891845703125, 0.01592254638671875, 0.029537200927734375, 0.04315185546875, 0.056766510009765625, 0.07038116455078125, 0.08399581909179688, 0.0976104736328125, 0.11122512817382812, 0.12483978271484375, 0.13845443725585938, 0.152069091796875, 0.16568374633789062, 0.17929840087890625, 0.19291305541992188, 0.2065277099609375, 0.22014236450195312, 0.23375701904296875, 0.24737167358398438, 0.260986328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 2.0, 5.0, 7.0, 7.0, 3.0, 8.0, 16.0, 19.0, 34.0, 56.0, 95.0, 159.0, 260.0, 515.0, 1192.0, 3077.0, 10207.0, 72444.0, 3811471.0, 270304.0, 17585.0, 3986.0, 1419.0, 652.0, 316.0, 195.0, 101.0, 60.0, 30.0, 20.0, 19.0, 7.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3046875, -1.2607421875, -1.216796875, -1.1728515625, -1.12890625, -1.0849609375, -1.041015625, -0.9970703125, -0.953125, -0.9091796875, -0.865234375, -0.8212890625, -0.77734375, -0.7333984375, -0.689453125, -0.6455078125, -0.6015625, -0.5576171875, -0.513671875, -0.4697265625, -0.42578125, -0.3818359375, -0.337890625, -0.2939453125, -0.25, -0.2060546875, -0.162109375, -0.1181640625, -0.07421875, -0.0302734375, 0.013671875, 0.0576171875, 0.1015625, 0.1455078125, 0.189453125, 0.2333984375, 0.27734375, 0.3212890625, 0.365234375, 0.4091796875, 0.453125, 0.4970703125, 0.541015625, 0.5849609375, 0.62890625, 0.6728515625, 0.716796875, 0.7607421875, 0.8046875, 0.8486328125, 0.892578125, 0.9365234375, 0.98046875, 1.0244140625, 1.068359375, 1.1123046875, 1.15625, 1.2001953125, 1.244140625, 1.2880859375, 1.33203125, 1.3759765625, 1.419921875, 1.4638671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 0.0, 5.0, 6.0, 6.0, 10.0, 9.0, 13.0, 24.0, 30.0, 91.0, 185.0, 626.0, 2148.0, 568.0, 174.0, 85.0, 38.0, 16.0, 18.0, 6.0, 4.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4150390625, -0.40093994140625, -0.3868408203125, -0.37274169921875, -0.358642578125, -0.34454345703125, -0.3304443359375, -0.31634521484375, -0.30224609375, -0.28814697265625, -0.2740478515625, -0.25994873046875, -0.245849609375, -0.23175048828125, -0.2176513671875, -0.20355224609375, -0.189453125, -0.17535400390625, -0.1612548828125, -0.14715576171875, -0.133056640625, -0.11895751953125, -0.1048583984375, -0.09075927734375, -0.07666015625, -0.06256103515625, -0.0484619140625, -0.03436279296875, -0.020263671875, -0.00616455078125, 0.0079345703125, 0.02203369140625, 0.0361328125, 0.05023193359375, 0.0643310546875, 0.07843017578125, 0.092529296875, 0.10662841796875, 0.1207275390625, 0.13482666015625, 0.14892578125, 0.16302490234375, 0.1771240234375, 0.19122314453125, 0.205322265625, 0.21942138671875, 0.2335205078125, 0.24761962890625, 0.26171875, 0.27581787109375, 0.2899169921875, 0.30401611328125, 0.318115234375, 0.33221435546875, 0.3463134765625, 0.36041259765625, 0.37451171875, 0.38861083984375, 0.4027099609375, 0.41680908203125, 0.430908203125, 0.44500732421875, 0.4591064453125, 0.47320556640625, 0.4873046875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 57.0, 358.0, 487.0, 86.0, 13.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.768314361572266, -7.610096454620361, -7.451878547668457, -7.2936601638793945, -7.13544225692749, -6.977224349975586, -6.819005966186523, -6.660788059234619, -6.502570152282715, -6.3443522453308105, -6.186134338378906, -6.027915954589844, -5.8696980476379395, -5.711480140686035, -5.553261756896973, -5.395043849945068, -5.236825942993164, -5.07860803604126, -4.9203901290893555, -4.762171745300293, -4.603953838348389, -4.445735931396484, -4.287517547607422, -4.129299640655518, -3.9710817337036133, -3.812863826751709, -3.6546456813812256, -3.496427536010742, -3.338209629058838, -3.1799917221069336, -3.02177357673645, -2.863555431365967, -2.7053372859954834, -2.547119140625, -2.3889012336730957, -2.2306833267211914, -2.072465181350708, -1.9142471551895142, -1.7560291290283203, -1.5978111028671265, -1.4395930767059326, -1.2813750505447388, -1.123157024383545, -0.9649389982223511, -0.8067209720611572, -0.6485029458999634, -0.49028491973876953, -0.3320668935775757, -0.17384886741638184, -0.01563084125518799, 0.14258718490600586, 0.3008052110671997, 0.45902323722839355, 0.6172412633895874, 0.7754592895507812, 0.9336773157119751, 1.091895341873169, 1.2501133680343628, 1.4083313941955566, 1.5665494203567505, 1.7247674465179443, 1.8829854726791382, 2.041203498840332, 2.1994214057922363, 2.3576395511627197]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 5.0, 14.0, 10.0, 12.0, 19.0, 18.0, 20.0, 22.0, 28.0, 30.0, 25.0, 33.0, 38.0, 39.0, 51.0, 48.0, 58.0, 49.0, 48.0, 48.0, 40.0, 38.0, 42.0, 29.0, 36.0, 26.0, 18.0, 17.0, 18.0, 15.0, 16.0, 12.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8638261556625366, -0.8372650146484375, -0.8107039332389832, -0.7841428518295288, -0.7575817108154297, -0.7310205698013306, -0.7044594883918762, -0.6778984069824219, -0.6513372659683228, -0.6247761249542236, -0.5982150435447693, -0.5716539621353149, -0.5450928211212158, -0.5185316801071167, -0.49197059869766235, -0.4654094874858856, -0.4388483762741089, -0.41228726506233215, -0.3857261538505554, -0.3591650426387787, -0.33260393142700195, -0.3060428202152252, -0.2794817090034485, -0.25292059779167175, -0.22635948657989502, -0.1997983753681183, -0.17323726415634155, -0.14667615294456482, -0.12011504173278809, -0.09355393052101135, -0.06699281930923462, -0.040431708097457886, -0.013870596885681152, 0.012690514326095581, 0.039251625537872314, 0.06581273674964905, 0.09237384796142578, 0.11893495917320251, 0.14549607038497925, 0.17205718159675598, 0.19861829280853271, 0.22517940402030945, 0.2517405152320862, 0.2783016264438629, 0.30486273765563965, 0.3314238488674164, 0.3579849600791931, 0.38454607129096985, 0.4111071825027466, 0.4376682937145233, 0.46422940492630005, 0.4907905161380768, 0.5173516273498535, 0.5439127683639526, 0.570473849773407, 0.5970349311828613, 0.6235960721969604, 0.6501572132110596, 0.6767182946205139, 0.7032793760299683, 0.7298405170440674, 0.7564016580581665, 0.7829627394676208, 0.8095238208770752, 0.8360849618911743]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 8.0, 15.0, 15.0, 20.0, 37.0, 50.0, 60.0, 99.0, 174.0, 254.0, 459.0, 902.0, 1747.0, 4566.0, 17977.0, 129592.0, 648839.0, 207382.0, 26088.0, 5814.0, 2108.0, 970.0, 524.0, 330.0, 179.0, 114.0, 67.0, 39.0, 31.0, 24.0, 20.0, 13.0, 10.0, 10.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.69921875, -1.6573715209960938, -1.6155242919921875, -1.5736770629882812, -1.531829833984375, -1.4899826049804688, -1.4481353759765625, -1.4062881469726562, -1.36444091796875, -1.3225936889648438, -1.2807464599609375, -1.2388992309570312, -1.197052001953125, -1.1552047729492188, -1.1133575439453125, -1.0715103149414062, -1.0296630859375, -0.9878158569335938, -0.9459686279296875, -0.9041213989257812, -0.862274169921875, -0.8204269409179688, -0.7785797119140625, -0.7367324829101562, -0.69488525390625, -0.6530380249023438, -0.6111907958984375, -0.5693435668945312, -0.527496337890625, -0.48564910888671875, -0.4438018798828125, -0.40195465087890625, -0.360107421875, -0.31826019287109375, -0.2764129638671875, -0.23456573486328125, -0.192718505859375, -0.15087127685546875, -0.1090240478515625, -0.06717681884765625, -0.02532958984375, 0.01651763916015625, 0.0583648681640625, 0.10021209716796875, 0.142059326171875, 0.18390655517578125, 0.2257537841796875, 0.26760101318359375, 0.3094482421875, 0.35129547119140625, 0.3931427001953125, 0.43498992919921875, 0.476837158203125, 0.5186843872070312, 0.5605316162109375, 0.6023788452148438, 0.64422607421875, 0.6860733032226562, 0.7279205322265625, 0.7697677612304688, 0.811614990234375, 0.8534622192382812, 0.8953094482421875, 0.9371566772460938, 0.97900390625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 10.0, 17.0, 57.0, 72.0, 82.0, 112.0, 143.0, 134.0, 133.0, 74.0, 60.0, 49.0, 23.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.615234375, -0.6015548706054688, -0.5878753662109375, -0.5741958618164062, -0.560516357421875, -0.5468368530273438, -0.5331573486328125, -0.5194778442382812, -0.50579833984375, -0.49211883544921875, -0.4784393310546875, -0.46475982666015625, -0.451080322265625, -0.43740081787109375, -0.4237213134765625, -0.41004180908203125, -0.3963623046875, -0.38268280029296875, -0.3690032958984375, -0.35532379150390625, -0.341644287109375, -0.32796478271484375, -0.3142852783203125, -0.30060577392578125, -0.28692626953125, -0.27324676513671875, -0.2595672607421875, -0.24588775634765625, -0.232208251953125, -0.21852874755859375, -0.2048492431640625, -0.19116973876953125, -0.177490234375, -0.16381072998046875, -0.1501312255859375, -0.13645172119140625, -0.122772216796875, -0.10909271240234375, -0.0954132080078125, -0.08173370361328125, -0.06805419921875, -0.05437469482421875, -0.0406951904296875, -0.02701568603515625, -0.013336181640625, 0.00034332275390625, 0.0140228271484375, 0.02770233154296875, 0.0413818359375, 0.05506134033203125, 0.0687408447265625, 0.08242034912109375, 0.096099853515625, 0.10977935791015625, 0.1234588623046875, 0.13713836669921875, 0.15081787109375, 0.16449737548828125, 0.1781768798828125, 0.19185638427734375, 0.205535888671875, 0.21921539306640625, 0.2328948974609375, 0.24657440185546875, 0.26025390625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 8.0, 12.0, 14.0, 11.0, 22.0, 26.0, 43.0, 72.0, 86.0, 124.0, 159.0, 230.0, 373.0, 628.0, 951.0, 1715.0, 3501.0, 8433.0, 24902.0, 90635.0, 344409.0, 404513.0, 117361.0, 31235.0, 10171.0, 4055.0, 1957.0, 1026.0, 612.0, 382.0, 233.0, 183.0, 132.0, 94.0, 64.0, 51.0, 37.0, 27.0, 14.0, 11.0, 10.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.8037109375, -0.7751007080078125, -0.746490478515625, -0.7178802490234375, -0.68927001953125, -0.6606597900390625, -0.632049560546875, -0.6034393310546875, -0.5748291015625, -0.5462188720703125, -0.517608642578125, -0.4889984130859375, -0.46038818359375, -0.4317779541015625, -0.403167724609375, -0.3745574951171875, -0.345947265625, -0.3173370361328125, -0.288726806640625, -0.2601165771484375, -0.23150634765625, -0.2028961181640625, -0.174285888671875, -0.1456756591796875, -0.1170654296875, -0.0884552001953125, -0.059844970703125, -0.0312347412109375, -0.00262451171875, 0.0259857177734375, 0.054595947265625, 0.0832061767578125, 0.11181640625, 0.1404266357421875, 0.169036865234375, 0.1976470947265625, 0.22625732421875, 0.2548675537109375, 0.283477783203125, 0.3120880126953125, 0.3406982421875, 0.3693084716796875, 0.397918701171875, 0.4265289306640625, 0.45513916015625, 0.4837493896484375, 0.512359619140625, 0.5409698486328125, 0.569580078125, 0.5981903076171875, 0.626800537109375, 0.6554107666015625, 0.68402099609375, 0.7126312255859375, 0.741241455078125, 0.7698516845703125, 0.7984619140625, 0.8270721435546875, 0.855682373046875, 0.8842926025390625, 0.91290283203125, 0.9415130615234375, 0.970123291015625, 0.9987335205078125, 1.02734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 5.0, 17.0, 17.0, 17.0, 20.0, 24.0, 24.0, 22.0, 39.0, 33.0, 41.0, 47.0, 44.0, 46.0, 56.0, 39.0, 43.0, 49.0, 45.0, 53.0, 42.0, 26.0, 30.0, 27.0, 35.0, 20.0, 21.0, 20.0, 16.0, 18.0, 15.0, 8.0, 10.0, 3.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93994140625, -0.9080581665039062, -0.8761749267578125, -0.8442916870117188, -0.812408447265625, -0.7805252075195312, -0.7486419677734375, -0.7167587280273438, -0.68487548828125, -0.6529922485351562, -0.6211090087890625, -0.5892257690429688, -0.557342529296875, -0.5254592895507812, -0.4935760498046875, -0.46169281005859375, -0.4298095703125, -0.39792633056640625, -0.3660430908203125, -0.33415985107421875, -0.302276611328125, -0.27039337158203125, -0.2385101318359375, -0.20662689208984375, -0.17474365234375, -0.14286041259765625, -0.1109771728515625, -0.07909393310546875, -0.047210693359375, -0.01532745361328125, 0.0165557861328125, 0.04843902587890625, 0.080322265625, 0.11220550537109375, 0.1440887451171875, 0.17597198486328125, 0.207855224609375, 0.23973846435546875, 0.2716217041015625, 0.30350494384765625, 0.33538818359375, 0.36727142333984375, 0.3991546630859375, 0.43103790283203125, 0.462921142578125, 0.49480438232421875, 0.5266876220703125, 0.5585708618164062, 0.5904541015625, 0.6223373413085938, 0.6542205810546875, 0.6861038208007812, 0.717987060546875, 0.7498703002929688, 0.7817535400390625, 0.8136367797851562, 0.84552001953125, 0.8774032592773438, 0.9092864990234375, 0.9411697387695312, 0.973052978515625, 1.0049362182617188, 1.0368194580078125, 1.0687026977539062, 1.1005859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 15.0, 16.0, 45.0, 97.0, 245.0, 729.0, 3385.0, 50112.0, 927427.0, 61520.0, 3767.0, 787.0, 231.0, 92.0, 45.0, 17.0, 5.0, 11.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8165130615234375, -0.789764404296875, -0.7630157470703125, -0.73626708984375, -0.7095184326171875, -0.682769775390625, -0.6560211181640625, -0.6292724609375, -0.6025238037109375, -0.575775146484375, -0.5490264892578125, -0.52227783203125, -0.4955291748046875, -0.468780517578125, -0.4420318603515625, -0.415283203125, -0.3885345458984375, -0.361785888671875, -0.3350372314453125, -0.30828857421875, -0.2815399169921875, -0.254791259765625, -0.2280426025390625, -0.2012939453125, -0.1745452880859375, -0.147796630859375, -0.1210479736328125, -0.09429931640625, -0.0675506591796875, -0.040802001953125, -0.0140533447265625, 0.0126953125, 0.0394439697265625, 0.066192626953125, 0.0929412841796875, 0.11968994140625, 0.1464385986328125, 0.173187255859375, 0.1999359130859375, 0.2266845703125, 0.2534332275390625, 0.280181884765625, 0.3069305419921875, 0.33367919921875, 0.3604278564453125, 0.387176513671875, 0.4139251708984375, 0.440673828125, 0.4674224853515625, 0.494171142578125, 0.5209197998046875, 0.54766845703125, 0.5744171142578125, 0.601165771484375, 0.6279144287109375, 0.6546630859375, 0.6814117431640625, 0.708160400390625, 0.7349090576171875, 0.76165771484375, 0.7884063720703125, 0.815155029296875, 0.8419036865234375, 0.86865234375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 6.0, 7.0, 5.0, 7.0, 12.0, 18.0, 26.0, 31.0, 44.0, 52.0, 60.0, 82.0, 91.0, 108.0, 93.0, 70.0, 74.0, 62.0, 33.0, 36.0, 15.0, 14.0, 11.0, 10.0, 7.0, 10.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.62396240234375e-05, -3.47113236784935e-05, -3.31830233335495e-05, -3.16547229886055e-05, -3.01264226436615e-05, -2.85981222987175e-05, -2.70698219537735e-05, -2.5541521608829498e-05, -2.4013221263885498e-05, -2.2484920918941498e-05, -2.0956620573997498e-05, -1.9428320229053497e-05, -1.7900019884109497e-05, -1.6371719539165497e-05, -1.4843419194221497e-05, -1.3315118849277496e-05, -1.1786818504333496e-05, -1.0258518159389496e-05, -8.730217814445496e-06, -7.201917469501495e-06, -5.673617124557495e-06, -4.145316779613495e-06, -2.6170164346694946e-06, -1.0887160897254944e-06, 4.3958425521850586e-07, 1.967884600162506e-06, 3.4961849451065063e-06, 5.024485290050507e-06, 6.552785634994507e-06, 8.081085979938507e-06, 9.609386324882507e-06, 1.1137686669826508e-05, 1.2665987014770508e-05, 1.4194287359714508e-05, 1.5722587704658508e-05, 1.725088804960251e-05, 1.877918839454651e-05, 2.030748873949051e-05, 2.183578908443451e-05, 2.336408942937851e-05, 2.489238977432251e-05, 2.642069011926651e-05, 2.794899046421051e-05, 2.947729080915451e-05, 3.100559115409851e-05, 3.253389149904251e-05, 3.406219184398651e-05, 3.559049218893051e-05, 3.711879253387451e-05, 3.864709287881851e-05, 4.017539322376251e-05, 4.170369356870651e-05, 4.323199391365051e-05, 4.476029425859451e-05, 4.628859460353851e-05, 4.7816894948482513e-05, 4.9345195293426514e-05, 5.0873495638370514e-05, 5.2401795983314514e-05, 5.3930096328258514e-05, 5.5458396673202515e-05, 5.6986697018146515e-05, 5.8514997363090515e-05, 6.0043297708034515e-05, 6.157159805297852e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 9.0, 7.0, 8.0, 8.0, 18.0, 17.0, 36.0, 47.0, 100.0, 181.0, 346.0, 701.0, 1942.0, 8175.0, 89252.0, 830869.0, 104134.0, 9044.0, 2067.0, 815.0, 321.0, 210.0, 89.0, 63.0, 37.0, 14.0, 10.0, 12.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58251953125, -0.5627899169921875, -0.543060302734375, -0.5233306884765625, -0.50360107421875, -0.4838714599609375, -0.464141845703125, -0.4444122314453125, -0.4246826171875, -0.4049530029296875, -0.385223388671875, -0.3654937744140625, -0.34576416015625, -0.3260345458984375, -0.306304931640625, -0.2865753173828125, -0.266845703125, -0.2471160888671875, -0.227386474609375, -0.2076568603515625, -0.18792724609375, -0.1681976318359375, -0.148468017578125, -0.1287384033203125, -0.1090087890625, -0.0892791748046875, -0.069549560546875, -0.0498199462890625, -0.03009033203125, -0.0103607177734375, 0.009368896484375, 0.0290985107421875, 0.048828125, 0.0685577392578125, 0.088287353515625, 0.1080169677734375, 0.12774658203125, 0.1474761962890625, 0.167205810546875, 0.1869354248046875, 0.2066650390625, 0.2263946533203125, 0.246124267578125, 0.2658538818359375, 0.28558349609375, 0.3053131103515625, 0.325042724609375, 0.3447723388671875, 0.364501953125, 0.3842315673828125, 0.403961181640625, 0.4236907958984375, 0.44342041015625, 0.4631500244140625, 0.482879638671875, 0.5026092529296875, 0.5223388671875, 0.5420684814453125, 0.561798095703125, 0.5815277099609375, 0.60125732421875, 0.6209869384765625, 0.640716552734375, 0.6604461669921875, 0.68017578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 15.0, 23.0, 30.0, 55.0, 100.0, 140.0, 174.0, 154.0, 130.0, 79.0, 47.0, 20.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452392578125, -0.4333076477050781, -0.41422271728515625, -0.3951377868652344, -0.3760528564453125, -0.3569679260253906, -0.33788299560546875, -0.3187980651855469, -0.299713134765625, -0.2806282043457031, -0.26154327392578125, -0.24245834350585938, -0.2233734130859375, -0.20428848266601562, -0.18520355224609375, -0.16611862182617188, -0.14703369140625, -0.12794876098632812, -0.10886383056640625, -0.08977890014648438, -0.0706939697265625, -0.051609039306640625, -0.03252410888671875, -0.013439178466796875, 0.005645751953125, 0.024730682373046875, 0.04381561279296875, 0.06290054321289062, 0.0819854736328125, 0.10107040405273438, 0.12015533447265625, 0.13924026489257812, 0.1583251953125, 0.17741012573242188, 0.19649505615234375, 0.21557998657226562, 0.2346649169921875, 0.2537498474121094, 0.27283477783203125, 0.2919197082519531, 0.311004638671875, 0.3300895690917969, 0.34917449951171875, 0.3682594299316406, 0.3873443603515625, 0.4064292907714844, 0.42551422119140625, 0.4445991516113281, 0.46368408203125, 0.4827690124511719, 0.5018539428710938, 0.5209388732910156, 0.5400238037109375, 0.5591087341308594, 0.5781936645507812, 0.5972785949707031, 0.616363525390625, 0.6354484558105469, 0.6545333862304688, 0.6736183166503906, 0.6927032470703125, 0.7117881774902344, 0.7308731079101562, 0.7499580383300781, 0.76904296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 20.0, 84.0, 247.0, 389.0, 178.0, 49.0, 17.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.617172241210938, -24.128032684326172, -23.63889503479004, -23.149755477905273, -22.660615921020508, -22.171476364135742, -21.68233871459961, -21.193199157714844, -20.704059600830078, -20.214920043945312, -19.72578239440918, -19.236642837524414, -18.74750328063965, -18.258363723754883, -17.76922607421875, -17.280086517333984, -16.79094696044922, -16.301807403564453, -15.812668800354004, -15.323530197143555, -14.834390640258789, -14.34525203704834, -13.856112480163574, -13.366973876953125, -12.877835273742676, -12.388696670532227, -11.899557113647461, -11.410418510437012, -10.921278953552246, -10.432140350341797, -9.943000793457031, -9.453862190246582, -8.964722633361816, -8.475584030151367, -7.986444473266602, -7.497305393218994, -7.008166313171387, -6.5190277099609375, -6.029888153076172, -5.540749549865723, -5.051609992980957, -4.56247091293335, -4.073331832885742, -3.5841927528381348, -3.0950536727905273, -2.605914831161499, -2.1167757511138916, -1.6276366710662842, -1.1384978294372559, -0.6493587493896484, -0.1602197289466858, 0.32891929149627686, 0.8180583715438843, 1.3071973323822021, 1.7963364124298096, 2.285475492477417, 2.7746145725250244, 3.263753652572632, 3.7528927326202393, 4.242031574249268, 4.731170654296875, 5.220309734344482, 5.70944881439209, 6.198587894439697, 6.687726974487305]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 19.0, 12.0, 15.0, 21.0, 20.0, 35.0, 42.0, 51.0, 40.0, 59.0, 61.0, 70.0, 62.0, 58.0, 66.0, 58.0, 56.0, 49.0, 31.0, 33.0, 24.0, 35.0, 24.0, 18.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.508939266204834, -7.276609897613525, -7.044280052185059, -6.81195068359375, -6.579621315002441, -6.347291946411133, -6.114962577819824, -5.882632732391357, -5.650303363800049, -5.41797399520874, -5.185644149780273, -4.953314781188965, -4.720985412597656, -4.488656044006348, -4.256326675415039, -4.023996829986572, -3.7916674613952637, -3.559338092803955, -3.3270084857940674, -3.0946788787841797, -2.862349510192871, -2.6300201416015625, -2.397690534591675, -2.165360927581787, -1.9330315589904785, -1.7007020711898804, -1.4683725833892822, -1.236043095588684, -1.003713607788086, -0.7713841199874878, -0.5390546321868896, -0.3067251443862915, -0.07439613342285156, 0.15793335437774658, 0.3902628421783447, 0.6225923299789429, 0.854921817779541, 1.0872513055801392, 1.3195807933807373, 1.5519102811813354, 1.7842397689819336, 2.016569137573242, 2.24889874458313, 2.4812283515930176, 2.713557720184326, 2.9458870887756348, 3.1782166957855225, 3.41054630279541, 3.6428756713867188, 3.8752050399780273, 4.107534408569336, 4.339864253997803, 4.572193622589111, 4.80452299118042, 5.036852836608887, 5.269182205200195, 5.501511573791504, 5.7338409423828125, 5.966170310974121, 6.198500156402588, 6.4308295249938965, 6.663158893585205, 6.895488739013672, 7.1278181076049805, 7.360147476196289]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 9.0, 6.0, 11.0, 6.0, 10.0, 24.0, 25.0, 36.0, 35.0, 74.0, 115.0, 169.0, 334.0, 575.0, 1140.0, 3200.0, 13507.0, 169427.0, 3925360.0, 68287.0, 8297.0, 2095.0, 804.0, 331.0, 172.0, 99.0, 50.0, 24.0, 21.0, 12.0, 6.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 4.0], "bins": [-2.48828125, -2.43218994140625, -2.3760986328125, -2.32000732421875, -2.263916015625, -2.20782470703125, -2.1517333984375, -2.09564208984375, -2.03955078125, -1.98345947265625, -1.9273681640625, -1.87127685546875, -1.815185546875, -1.75909423828125, -1.7030029296875, -1.64691162109375, -1.5908203125, -1.53472900390625, -1.4786376953125, -1.42254638671875, -1.366455078125, -1.31036376953125, -1.2542724609375, -1.19818115234375, -1.14208984375, -1.08599853515625, -1.0299072265625, -0.97381591796875, -0.917724609375, -0.86163330078125, -0.8055419921875, -0.74945068359375, -0.693359375, -0.63726806640625, -0.5811767578125, -0.52508544921875, -0.468994140625, -0.41290283203125, -0.3568115234375, -0.30072021484375, -0.24462890625, -0.18853759765625, -0.1324462890625, -0.07635498046875, -0.020263671875, 0.03582763671875, 0.0919189453125, 0.14801025390625, 0.2041015625, 0.26019287109375, 0.3162841796875, 0.37237548828125, 0.428466796875, 0.48455810546875, 0.5406494140625, 0.59674072265625, 0.65283203125, 0.70892333984375, 0.7650146484375, 0.82110595703125, 0.877197265625, 0.93328857421875, 0.9893798828125, 1.04547119140625, 1.1015625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 32.0, 35.0, 64.0, 100.0, 120.0, 130.0, 142.0, 123.0, 90.0, 67.0, 36.0, 21.0, 10.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.646484375, -0.6317558288574219, -0.6170272827148438, -0.6022987365722656, -0.5875701904296875, -0.5728416442871094, -0.5581130981445312, -0.5433845520019531, -0.528656005859375, -0.5139274597167969, -0.49919891357421875, -0.4844703674316406, -0.4697418212890625, -0.4550132751464844, -0.44028472900390625, -0.4255561828613281, -0.41082763671875, -0.3960990905761719, -0.38137054443359375, -0.3666419982910156, -0.3519134521484375, -0.3371849060058594, -0.32245635986328125, -0.3077278137207031, -0.292999267578125, -0.2782707214355469, -0.26354217529296875, -0.24881362915039062, -0.2340850830078125, -0.21935653686523438, -0.20462799072265625, -0.18989944458007812, -0.1751708984375, -0.16044235229492188, -0.14571380615234375, -0.13098526000976562, -0.1162567138671875, -0.10152816772460938, -0.08679962158203125, -0.07207107543945312, -0.057342529296875, -0.042613983154296875, -0.02788543701171875, -0.013156890869140625, 0.0015716552734375, 0.016300201416015625, 0.03102874755859375, 0.045757293701171875, 0.06048583984375, 0.07521438598632812, 0.08994293212890625, 0.10467147827148438, 0.1194000244140625, 0.13412857055664062, 0.14885711669921875, 0.16358566284179688, 0.178314208984375, 0.19304275512695312, 0.20777130126953125, 0.22249984741210938, 0.2372283935546875, 0.2519569396972656, 0.26668548583984375, 0.2814140319824219, 0.296142578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 12.0, 5.0, 15.0, 24.0, 26.0, 37.0, 84.0, 153.0, 263.0, 620.0, 1397.0, 3956.0, 14827.0, 105520.0, 3586890.0, 439121.0, 30645.0, 6542.0, 2216.0, 915.0, 445.0, 255.0, 106.0, 74.0, 32.0, 27.0, 20.0, 9.0, 7.0, 6.0, 2.0, 2.0, 7.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.18359375, -1.1450653076171875, -1.106536865234375, -1.0680084228515625, -1.02947998046875, -0.9909515380859375, -0.952423095703125, -0.9138946533203125, -0.8753662109375, -0.8368377685546875, -0.798309326171875, -0.7597808837890625, -0.72125244140625, -0.6827239990234375, -0.644195556640625, -0.6056671142578125, -0.567138671875, -0.5286102294921875, -0.490081787109375, -0.4515533447265625, -0.41302490234375, -0.3744964599609375, -0.335968017578125, -0.2974395751953125, -0.2589111328125, -0.2203826904296875, -0.181854248046875, -0.1433258056640625, -0.10479736328125, -0.0662689208984375, -0.027740478515625, 0.0107879638671875, 0.04931640625, 0.0878448486328125, 0.126373291015625, 0.1649017333984375, 0.20343017578125, 0.2419586181640625, 0.280487060546875, 0.3190155029296875, 0.3575439453125, 0.3960723876953125, 0.434600830078125, 0.4731292724609375, 0.51165771484375, 0.5501861572265625, 0.588714599609375, 0.6272430419921875, 0.665771484375, 0.7042999267578125, 0.742828369140625, 0.7813568115234375, 0.81988525390625, 0.8584136962890625, 0.896942138671875, 0.9354705810546875, 0.9739990234375, 1.0125274658203125, 1.051055908203125, 1.0895843505859375, 1.12811279296875, 1.1666412353515625, 1.205169677734375, 1.2436981201171875, 1.2822265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 7.0, 7.0, 6.0, 19.0, 16.0, 26.0, 46.0, 65.0, 117.0, 205.0, 445.0, 1216.0, 1063.0, 404.0, 163.0, 94.0, 57.0, 33.0, 15.0, 16.0, 14.0, 5.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427978515625, -0.4131813049316406, -0.39838409423828125, -0.3835868835449219, -0.3687896728515625, -0.3539924621582031, -0.33919525146484375, -0.3243980407714844, -0.309600830078125, -0.2948036193847656, -0.28000640869140625, -0.2652091979980469, -0.2504119873046875, -0.23561477661132812, -0.22081756591796875, -0.20602035522460938, -0.19122314453125, -0.17642593383789062, -0.16162872314453125, -0.14683151245117188, -0.1320343017578125, -0.11723709106445312, -0.10243988037109375, -0.08764266967773438, -0.072845458984375, -0.058048248291015625, -0.04325103759765625, -0.028453826904296875, -0.0136566162109375, 0.001140594482421875, 0.01593780517578125, 0.030735015869140625, 0.0455322265625, 0.060329437255859375, 0.07512664794921875, 0.08992385864257812, 0.1047210693359375, 0.11951828002929688, 0.13431549072265625, 0.14911270141601562, 0.163909912109375, 0.17870712280273438, 0.19350433349609375, 0.20830154418945312, 0.2230987548828125, 0.23789596557617188, 0.25269317626953125, 0.2674903869628906, 0.28228759765625, 0.2970848083496094, 0.31188201904296875, 0.3266792297363281, 0.3414764404296875, 0.3562736511230469, 0.37107086181640625, 0.3858680725097656, 0.400665283203125, 0.4154624938964844, 0.43025970458984375, 0.4450569152832031, 0.4598541259765625, 0.4746513366699219, 0.48944854736328125, 0.5042457580566406, 0.51904296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 6.0, 39.0, 105.0, 258.0, 343.0, 170.0, 50.0, 13.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.707042217254639, -6.545083999633789, -6.3831257820129395, -6.22116756439209, -6.059208869934082, -5.897250652313232, -5.735292434692383, -5.573334217071533, -5.411375999450684, -5.249417781829834, -5.087459564208984, -4.925500869750977, -4.763542652130127, -4.601584434509277, -4.439626216888428, -4.277667999267578, -4.11570930480957, -3.9537510871887207, -3.791792631149292, -3.6298344135284424, -3.4678761959075928, -3.305917739868164, -3.1439595222473145, -2.982001304626465, -2.8200430870056152, -2.6580848693847656, -2.496126413345337, -2.3341681957244873, -2.1722099781036377, -2.010251522064209, -1.8482933044433594, -1.6863350868225098, -1.5243768692016602, -1.362418532371521, -1.2004603147506714, -1.0385019779205322, -0.8765437006950378, -0.7145854234695435, -0.5526270866394043, -0.3906688690185547, -0.22871053218841553, -0.06675224006175995, 0.09520605206489563, 0.2571643590927124, 0.4191226363182068, 0.5810809135437012, 0.7430392503738403, 0.9049974679946899, 1.066955804824829, 1.2289141416549683, 1.3908723592758179, 1.552830696105957, 1.7147889137268066, 1.8767472505569458, 2.038705587387085, 2.2006638050079346, 2.3626222610473633, 2.524580478668213, 2.6865389347076416, 2.848497152328491, 3.010455369949341, 3.1724138259887695, 3.334372043609619, 3.4963302612304688, 3.6582884788513184]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 8.0, 13.0, 12.0, 15.0, 13.0, 27.0, 28.0, 45.0, 35.0, 42.0, 60.0, 41.0, 54.0, 48.0, 57.0, 53.0, 55.0, 41.0, 57.0, 52.0, 45.0, 31.0, 43.0, 30.0, 20.0, 17.0, 9.0, 12.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.59987473487854, -1.5462814569473267, -1.4926881790161133, -1.4390947818756104, -1.385501503944397, -1.3319082260131836, -1.2783149480819702, -1.2247216701507568, -1.171128273010254, -1.1175349950790405, -1.0639417171478271, -1.0103483200073242, -0.9567550420761108, -0.9031617641448975, -0.8495684862136841, -0.7959751486778259, -0.7423818707466125, -0.6887885928153992, -0.635195255279541, -0.5816019773483276, -0.5280086398124695, -0.4744153618812561, -0.42082205414772034, -0.36722874641418457, -0.3136354386806488, -0.26004213094711304, -0.20644882321357727, -0.1528555303812027, -0.09926222264766693, -0.04566892981529236, 0.007924377918243408, 0.061517685651779175, 0.11511099338531494, 0.1687043011188507, 0.22229760885238647, 0.27589088678359985, 0.329484224319458, 0.3830775022506714, 0.43667080998420715, 0.4902641177177429, 0.5438574552536011, 0.5974507331848145, 0.6510440707206726, 0.704637348651886, 0.7582306861877441, 0.8118239641189575, 0.8654172420501709, 0.919010579586029, 0.9726038575172424, 1.0261971950531006, 1.079790472984314, 1.1333837509155273, 1.1869770288467407, 1.240570306777954, 1.294163703918457, 1.3477569818496704, 1.4013502597808838, 1.4549435377120972, 1.5085368156433105, 1.5621302127838135, 1.6157234907150269, 1.6693167686462402, 1.7229100465774536, 1.776503324508667, 1.83009672164917]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 3.0, 4.0, 7.0, 16.0, 15.0, 30.0, 41.0, 77.0, 121.0, 165.0, 295.0, 533.0, 1081.0, 2530.0, 7820.0, 55770.0, 645521.0, 301992.0, 23992.0, 4814.0, 1762.0, 820.0, 440.0, 284.0, 146.0, 83.0, 55.0, 35.0, 34.0, 27.0, 10.0, 9.0, 5.0, 3.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.564453125, -1.508209228515625, -1.45196533203125, -1.395721435546875, -1.3394775390625, -1.283233642578125, -1.22698974609375, -1.170745849609375, -1.114501953125, -1.058258056640625, -1.00201416015625, -0.945770263671875, -0.8895263671875, -0.833282470703125, -0.77703857421875, -0.720794677734375, -0.66455078125, -0.608306884765625, -0.55206298828125, -0.495819091796875, -0.4395751953125, -0.383331298828125, -0.32708740234375, -0.270843505859375, -0.214599609375, -0.158355712890625, -0.10211181640625, -0.045867919921875, 0.0103759765625, 0.066619873046875, 0.12286376953125, 0.179107666015625, 0.2353515625, 0.291595458984375, 0.34783935546875, 0.404083251953125, 0.4603271484375, 0.516571044921875, 0.57281494140625, 0.629058837890625, 0.685302734375, 0.741546630859375, 0.79779052734375, 0.854034423828125, 0.9102783203125, 0.966522216796875, 1.02276611328125, 1.079010009765625, 1.13525390625, 1.191497802734375, 1.24774169921875, 1.303985595703125, 1.3602294921875, 1.416473388671875, 1.47271728515625, 1.528961181640625, 1.585205078125, 1.641448974609375, 1.69769287109375, 1.753936767578125, 1.8101806640625, 1.866424560546875, 1.92266845703125, 1.978912353515625, 2.03515625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 13.0, 24.0, 50.0, 80.0, 119.0, 145.0, 132.0, 147.0, 103.0, 72.0, 64.0, 21.0, 12.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6865234375, -0.6710624694824219, -0.6556015014648438, -0.6401405334472656, -0.6246795654296875, -0.6092185974121094, -0.5937576293945312, -0.5782966613769531, -0.562835693359375, -0.5473747253417969, -0.5319137573242188, -0.5164527893066406, -0.5009918212890625, -0.4855308532714844, -0.47006988525390625, -0.4546089172363281, -0.43914794921875, -0.4236869812011719, -0.40822601318359375, -0.3927650451660156, -0.3773040771484375, -0.3618431091308594, -0.34638214111328125, -0.3309211730957031, -0.315460205078125, -0.2999992370605469, -0.28453826904296875, -0.2690773010253906, -0.2536163330078125, -0.23815536499023438, -0.22269439697265625, -0.20723342895507812, -0.1917724609375, -0.17631149291992188, -0.16085052490234375, -0.14538955688476562, -0.1299285888671875, -0.11446762084960938, -0.09900665283203125, -0.08354568481445312, -0.068084716796875, -0.052623748779296875, -0.03716278076171875, -0.021701812744140625, -0.0062408447265625, 0.009220123291015625, 0.02468109130859375, 0.040142059326171875, 0.05560302734375, 0.07106399536132812, 0.08652496337890625, 0.10198593139648438, 0.1174468994140625, 0.13290786743164062, 0.14836883544921875, 0.16382980346679688, 0.179290771484375, 0.19475173950195312, 0.21021270751953125, 0.22567367553710938, 0.2411346435546875, 0.2565956115722656, 0.27205657958984375, 0.2875175476074219, 0.302978515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 10.0, 16.0, 20.0, 33.0, 58.0, 88.0, 192.0, 390.0, 761.0, 1991.0, 6143.0, 27479.0, 217329.0, 654952.0, 114340.0, 17377.0, 4513.0, 1558.0, 635.0, 308.0, 165.0, 68.0, 40.0, 27.0, 16.0, 9.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5558929443359375, -1.509246826171875, -1.4626007080078125, -1.41595458984375, -1.3693084716796875, -1.322662353515625, -1.2760162353515625, -1.2293701171875, -1.1827239990234375, -1.136077880859375, -1.0894317626953125, -1.04278564453125, -0.9961395263671875, -0.949493408203125, -0.9028472900390625, -0.856201171875, -0.8095550537109375, -0.762908935546875, -0.7162628173828125, -0.66961669921875, -0.6229705810546875, -0.576324462890625, -0.5296783447265625, -0.4830322265625, -0.4363861083984375, -0.389739990234375, -0.3430938720703125, -0.29644775390625, -0.2498016357421875, -0.203155517578125, -0.1565093994140625, -0.10986328125, -0.0632171630859375, -0.016571044921875, 0.0300750732421875, 0.07672119140625, 0.1233673095703125, 0.170013427734375, 0.2166595458984375, 0.2633056640625, 0.3099517822265625, 0.356597900390625, 0.4032440185546875, 0.44989013671875, 0.4965362548828125, 0.543182373046875, 0.5898284912109375, 0.636474609375, 0.6831207275390625, 0.729766845703125, 0.7764129638671875, 0.82305908203125, 0.8697052001953125, 0.916351318359375, 0.9629974365234375, 1.0096435546875, 1.0562896728515625, 1.102935791015625, 1.1495819091796875, 1.19622802734375, 1.2428741455078125, 1.289520263671875, 1.3361663818359375, 1.3828125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 6.0, 7.0, 9.0, 6.0, 18.0, 18.0, 17.0, 23.0, 31.0, 44.0, 39.0, 53.0, 47.0, 56.0, 50.0, 67.0, 48.0, 50.0, 57.0, 63.0, 44.0, 40.0, 46.0, 25.0, 26.0, 23.0, 28.0, 12.0, 10.0, 8.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2919921875, -1.2544708251953125, -1.216949462890625, -1.1794281005859375, -1.14190673828125, -1.1043853759765625, -1.066864013671875, -1.0293426513671875, -0.9918212890625, -0.9542999267578125, -0.916778564453125, -0.8792572021484375, -0.84173583984375, -0.8042144775390625, -0.766693115234375, -0.7291717529296875, -0.691650390625, -0.6541290283203125, -0.616607666015625, -0.5790863037109375, -0.54156494140625, -0.5040435791015625, -0.466522216796875, -0.4290008544921875, -0.3914794921875, -0.3539581298828125, -0.316436767578125, -0.2789154052734375, -0.24139404296875, -0.2038726806640625, -0.166351318359375, -0.1288299560546875, -0.09130859375, -0.0537872314453125, -0.016265869140625, 0.0212554931640625, 0.05877685546875, 0.0962982177734375, 0.133819580078125, 0.1713409423828125, 0.2088623046875, 0.2463836669921875, 0.283905029296875, 0.3214263916015625, 0.35894775390625, 0.3964691162109375, 0.433990478515625, 0.4715118408203125, 0.509033203125, 0.5465545654296875, 0.584075927734375, 0.6215972900390625, 0.65911865234375, 0.6966400146484375, 0.734161376953125, 0.7716827392578125, 0.8092041015625, 0.8467254638671875, 0.884246826171875, 0.9217681884765625, 0.95928955078125, 0.9968109130859375, 1.034332275390625, 1.0718536376953125, 1.109375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 3.0, 0.0, 4.0, 5.0, 5.0, 9.0, 9.0, 18.0, 24.0, 32.0, 72.0, 89.0, 176.0, 330.0, 605.0, 1380.0, 3916.0, 15230.0, 163396.0, 794950.0, 54761.0, 8891.0, 2556.0, 973.0, 461.0, 252.0, 151.0, 80.0, 62.0, 34.0, 30.0, 25.0, 13.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445556640625, -0.4255943298339844, -0.40563201904296875, -0.3856697082519531, -0.3657073974609375, -0.3457450866699219, -0.32578277587890625, -0.3058204650878906, -0.285858154296875, -0.2658958435058594, -0.24593353271484375, -0.22597122192382812, -0.2060089111328125, -0.18604660034179688, -0.16608428955078125, -0.14612197875976562, -0.12615966796875, -0.10619735717773438, -0.08623504638671875, -0.06627273559570312, -0.0463104248046875, -0.026348114013671875, -0.00638580322265625, 0.013576507568359375, 0.033538818359375, 0.053501129150390625, 0.07346343994140625, 0.09342575073242188, 0.1133880615234375, 0.13335037231445312, 0.15331268310546875, 0.17327499389648438, 0.1932373046875, 0.21319961547851562, 0.23316192626953125, 0.2531242370605469, 0.2730865478515625, 0.2930488586425781, 0.31301116943359375, 0.3329734802246094, 0.352935791015625, 0.3728981018066406, 0.39286041259765625, 0.4128227233886719, 0.4327850341796875, 0.4527473449707031, 0.47270965576171875, 0.4926719665527344, 0.51263427734375, 0.5325965881347656, 0.5525588989257812, 0.5725212097167969, 0.5924835205078125, 0.6124458312988281, 0.6324081420898438, 0.6523704528808594, 0.672332763671875, 0.6922950744628906, 0.7122573852539062, 0.7322196960449219, 0.7521820068359375, 0.7721443176269531, 0.7921066284179688, 0.8120689392089844, 0.83203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 4.0, 4.0, 8.0, 12.0, 21.0, 35.0, 43.0, 66.0, 108.0, 129.0, 140.0, 125.0, 105.0, 71.0, 41.0, 27.0, 18.0, 17.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.973743438720703e-05, -6.771180778741837e-05, -6.56861811876297e-05, -6.366055458784103e-05, -6.163492798805237e-05, -5.96093013882637e-05, -5.758367478847504e-05, -5.555804818868637e-05, -5.3532421588897705e-05, -5.150679498910904e-05, -4.9481168389320374e-05, -4.745554178953171e-05, -4.542991518974304e-05, -4.3404288589954376e-05, -4.137866199016571e-05, -3.9353035390377045e-05, -3.732740879058838e-05, -3.530178219079971e-05, -3.327615559101105e-05, -3.125052899122238e-05, -2.9224902391433716e-05, -2.719927579164505e-05, -2.5173649191856384e-05, -2.314802259206772e-05, -2.1122395992279053e-05, -1.9096769392490387e-05, -1.707114279270172e-05, -1.5045516192913055e-05, -1.301988959312439e-05, -1.0994262993335724e-05, -8.968636393547058e-06, -6.943009793758392e-06, -4.9173831939697266e-06, -2.891756594181061e-06, -8.66129994392395e-07, 1.1594966053962708e-06, 3.1851232051849365e-06, 5.210749804973602e-06, 7.236376404762268e-06, 9.262003004550934e-06, 1.12876296043396e-05, 1.3313256204128265e-05, 1.533888280391693e-05, 1.7364509403705597e-05, 1.9390136003494263e-05, 2.141576260328293e-05, 2.3441389203071594e-05, 2.546701580286026e-05, 2.7492642402648926e-05, 2.951826900243759e-05, 3.154389560222626e-05, 3.356952220201492e-05, 3.559514880180359e-05, 3.7620775401592255e-05, 3.964640200138092e-05, 4.1672028601169586e-05, 4.369765520095825e-05, 4.572328180074692e-05, 4.7748908400535583e-05, 4.977453500032425e-05, 5.1800161600112915e-05, 5.382578819990158e-05, 5.5851414799690247e-05, 5.787704139947891e-05, 5.990266799926758e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 3.0, 9.0, 11.0, 14.0, 19.0, 24.0, 43.0, 58.0, 89.0, 159.0, 286.0, 448.0, 832.0, 1925.0, 4437.0, 12350.0, 45578.0, 271916.0, 553489.0, 119243.0, 24126.0, 7561.0, 2989.0, 1332.0, 705.0, 327.0, 193.0, 143.0, 74.0, 43.0, 32.0, 27.0, 15.0, 18.0, 10.0, 11.0, 3.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.318603515625, -0.30841827392578125, -0.2982330322265625, -0.28804779052734375, -0.277862548828125, -0.26767730712890625, -0.2574920654296875, -0.24730682373046875, -0.23712158203125, -0.22693634033203125, -0.2167510986328125, -0.20656585693359375, -0.196380615234375, -0.18619537353515625, -0.1760101318359375, -0.16582489013671875, -0.1556396484375, -0.14545440673828125, -0.1352691650390625, -0.12508392333984375, -0.114898681640625, -0.10471343994140625, -0.0945281982421875, -0.08434295654296875, -0.07415771484375, -0.06397247314453125, -0.0537872314453125, -0.04360198974609375, -0.033416748046875, -0.02323150634765625, -0.0130462646484375, -0.00286102294921875, 0.00732421875, 0.01750946044921875, 0.0276947021484375, 0.03787994384765625, 0.048065185546875, 0.05825042724609375, 0.0684356689453125, 0.07862091064453125, 0.08880615234375, 0.09899139404296875, 0.1091766357421875, 0.11936187744140625, 0.129547119140625, 0.13973236083984375, 0.1499176025390625, 0.16010284423828125, 0.1702880859375, 0.18047332763671875, 0.1906585693359375, 0.20084381103515625, 0.211029052734375, 0.22121429443359375, 0.2313995361328125, 0.24158477783203125, 0.25177001953125, 0.26195526123046875, 0.2721405029296875, 0.28232574462890625, 0.292510986328125, 0.30269622802734375, 0.3128814697265625, 0.32306671142578125, 0.333251953125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 2.0, 9.0, 12.0, 18.0, 28.0, 33.0, 31.0, 53.0, 66.0, 78.0, 110.0, 96.0, 111.0, 79.0, 66.0, 46.0, 28.0, 28.0, 24.0, 13.0, 15.0, 9.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.339599609375, -0.3299713134765625, -0.320343017578125, -0.3107147216796875, -0.30108642578125, -0.2914581298828125, -0.281829833984375, -0.2722015380859375, -0.2625732421875, -0.2529449462890625, -0.243316650390625, -0.2336883544921875, -0.22406005859375, -0.2144317626953125, -0.204803466796875, -0.1951751708984375, -0.185546875, -0.1759185791015625, -0.166290283203125, -0.1566619873046875, -0.14703369140625, -0.1374053955078125, -0.127777099609375, -0.1181488037109375, -0.1085205078125, -0.0988922119140625, -0.089263916015625, -0.0796356201171875, -0.07000732421875, -0.0603790283203125, -0.050750732421875, -0.0411224365234375, -0.031494140625, -0.0218658447265625, -0.012237548828125, -0.0026092529296875, 0.00701904296875, 0.0166473388671875, 0.026275634765625, 0.0359039306640625, 0.0455322265625, 0.0551605224609375, 0.064788818359375, 0.0744171142578125, 0.08404541015625, 0.0936737060546875, 0.103302001953125, 0.1129302978515625, 0.12255859375, 0.1321868896484375, 0.141815185546875, 0.1514434814453125, 0.16107177734375, 0.1707000732421875, 0.180328369140625, 0.1899566650390625, 0.1995849609375, 0.2092132568359375, 0.218841552734375, 0.2284698486328125, 0.23809814453125, 0.2477264404296875, 0.257354736328125, 0.2669830322265625, 0.276611328125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 4.0, 13.0, 19.0, 32.0, 30.0, 73.0, 102.0, 142.0, 158.0, 148.0, 96.0, 73.0, 43.0, 31.0, 12.0, 11.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11306619644165, -6.905798435211182, -6.698530197143555, -6.491262435913086, -6.283994674682617, -6.07672643661499, -5.8694586753845215, -5.6621904373168945, -5.454922676086426, -5.247654914855957, -5.04038667678833, -4.833118915557861, -4.625850677490234, -4.418582916259766, -4.211315155029297, -4.004047393798828, -3.796779155731201, -3.5895111560821533, -3.3822431564331055, -3.1749753952026367, -2.967707395553589, -2.760439395904541, -2.5531716346740723, -2.3459036350250244, -2.1386356353759766, -1.9313676357269287, -1.7240997552871704, -1.516831874847412, -1.3095638751983643, -1.1022958755493164, -0.8950279951095581, -0.6877601146697998, -0.48049163818359375, -0.2732236981391907, -0.0659557580947876, 0.14131218194961548, 0.34858012199401855, 0.5558481216430664, 0.7631160020828247, 0.970383882522583, 1.1776518821716309, 1.3849198818206787, 1.592187762260437, 1.7994556427001953, 2.006723642349243, 2.213991641998291, 2.4212594032287598, 2.6285274028778076, 2.8357954025268555, 3.0430634021759033, 3.250331401824951, 3.45759916305542, 3.6648671627044678, 3.8721351623535156, 4.079402923583984, 4.286670684814453, 4.49393892288208, 4.701206684112549, 4.908474922180176, 5.1157426834106445, 5.323010444641113, 5.53027868270874, 5.737546443939209, 5.944814682006836, 6.152082443237305]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 8.0, 15.0, 11.0, 19.0, 28.0, 23.0, 27.0, 31.0, 34.0, 41.0, 44.0, 45.0, 40.0, 52.0, 58.0, 56.0, 52.0, 56.0, 43.0, 57.0, 32.0, 44.0, 32.0, 22.0, 24.0, 19.0, 14.0, 9.0, 11.0, 16.0, 13.0, 6.0, 5.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.602704048156738, -7.400277137756348, -7.197849750518799, -6.99542236328125, -6.792995452880859, -6.590568542480469, -6.38814115524292, -6.185713768005371, -5.9832868576049805, -5.78085994720459, -5.578432559967041, -5.376005172729492, -5.173578262329102, -4.971151351928711, -4.768723964691162, -4.566296577453613, -4.363869667053223, -4.161442756652832, -3.959015369415283, -3.7565882205963135, -3.5541610717773438, -3.351733922958374, -3.1493067741394043, -2.9468796253204346, -2.744452476501465, -2.542025327682495, -2.3395981788635254, -2.1371710300445557, -1.934743881225586, -1.7323167324066162, -1.5298895835876465, -1.3274624347686768, -1.1250348091125488, -0.9226076602935791, -0.7201805114746094, -0.5177533626556396, -0.3153262138366699, -0.1128990650177002, 0.08952808380126953, 0.29195523262023926, 0.494382381439209, 0.6968095302581787, 0.8992366790771484, 1.1016638278961182, 1.304090976715088, 1.5065181255340576, 1.7089452743530273, 1.911372423171997, 2.113799571990967, 2.3162267208099365, 2.5186538696289062, 2.721081018447876, 2.9235081672668457, 3.1259353160858154, 3.328362464904785, 3.530789613723755, 3.7332167625427246, 3.9356439113616943, 4.138071060180664, 4.340497970581055, 4.5429253578186035, 4.745352745056152, 4.947779655456543, 5.150206565856934, 5.352633953094482]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 9.0, 5.0, 13.0, 26.0, 23.0, 34.0, 36.0, 72.0, 100.0, 183.0, 280.0, 584.0, 1499.0, 4875.0, 28371.0, 3810622.0, 328618.0, 14329.0, 2875.0, 939.0, 395.0, 177.0, 66.0, 48.0, 36.0, 19.0, 16.0, 6.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.369140625, -2.311126708984375, -2.25311279296875, -2.195098876953125, -2.1370849609375, -2.079071044921875, -2.02105712890625, -1.963043212890625, -1.905029296875, -1.847015380859375, -1.78900146484375, -1.730987548828125, -1.6729736328125, -1.614959716796875, -1.55694580078125, -1.498931884765625, -1.44091796875, -1.382904052734375, -1.32489013671875, -1.266876220703125, -1.2088623046875, -1.150848388671875, -1.09283447265625, -1.034820556640625, -0.976806640625, -0.918792724609375, -0.86077880859375, -0.802764892578125, -0.7447509765625, -0.686737060546875, -0.62872314453125, -0.570709228515625, -0.5126953125, -0.454681396484375, -0.39666748046875, -0.338653564453125, -0.2806396484375, -0.222625732421875, -0.16461181640625, -0.106597900390625, -0.048583984375, 0.009429931640625, 0.06744384765625, 0.125457763671875, 0.1834716796875, 0.241485595703125, 0.29949951171875, 0.357513427734375, 0.41552734375, 0.473541259765625, 0.53155517578125, 0.589569091796875, 0.6475830078125, 0.705596923828125, 0.76361083984375, 0.821624755859375, 0.879638671875, 0.937652587890625, 0.99566650390625, 1.053680419921875, 1.1116943359375, 1.169708251953125, 1.22772216796875, 1.285736083984375, 1.34375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 13.0, 21.0, 32.0, 49.0, 86.0, 108.0, 138.0, 137.0, 118.0, 111.0, 83.0, 43.0, 23.0, 15.0, 12.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.703125, -0.6864967346191406, -0.6698684692382812, -0.6532402038574219, -0.6366119384765625, -0.6199836730957031, -0.6033554077148438, -0.5867271423339844, -0.570098876953125, -0.5534706115722656, -0.5368423461914062, -0.5202140808105469, -0.5035858154296875, -0.4869575500488281, -0.47032928466796875, -0.4537010192871094, -0.43707275390625, -0.4204444885253906, -0.40381622314453125, -0.3871879577636719, -0.3705596923828125, -0.3539314270019531, -0.33730316162109375, -0.3206748962402344, -0.304046630859375, -0.2874183654785156, -0.27079010009765625, -0.2541618347167969, -0.2375335693359375, -0.22090530395507812, -0.20427703857421875, -0.18764877319335938, -0.1710205078125, -0.15439224243164062, -0.13776397705078125, -0.12113571166992188, -0.1045074462890625, -0.08787918090820312, -0.07125091552734375, -0.054622650146484375, -0.037994384765625, -0.021366119384765625, -0.00473785400390625, 0.011890411376953125, 0.0285186767578125, 0.045146942138671875, 0.06177520751953125, 0.07840347290039062, 0.09503173828125, 0.11166000366210938, 0.12828826904296875, 0.14491653442382812, 0.1615447998046875, 0.17817306518554688, 0.19480133056640625, 0.21142959594726562, 0.228057861328125, 0.24468612670898438, 0.26131439208984375, 0.2779426574707031, 0.2945709228515625, 0.3111991882324219, 0.32782745361328125, 0.3444557189941406, 0.361083984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 11.0, 6.0, 25.0, 36.0, 71.0, 134.0, 239.0, 387.0, 778.0, 1589.0, 3898.0, 12071.0, 74746.0, 3509090.0, 546960.0, 32045.0, 7264.0, 2579.0, 1143.0, 560.0, 289.0, 148.0, 85.0, 46.0, 29.0, 15.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2353515625, -1.19769287109375, -1.1600341796875, -1.12237548828125, -1.084716796875, -1.04705810546875, -1.0093994140625, -0.97174072265625, -0.93408203125, -0.89642333984375, -0.8587646484375, -0.82110595703125, -0.783447265625, -0.74578857421875, -0.7081298828125, -0.67047119140625, -0.6328125, -0.59515380859375, -0.5574951171875, -0.51983642578125, -0.482177734375, -0.44451904296875, -0.4068603515625, -0.36920166015625, -0.33154296875, -0.29388427734375, -0.2562255859375, -0.21856689453125, -0.180908203125, -0.14324951171875, -0.1055908203125, -0.06793212890625, -0.0302734375, 0.00738525390625, 0.0450439453125, 0.08270263671875, 0.120361328125, 0.15802001953125, 0.1956787109375, 0.23333740234375, 0.27099609375, 0.30865478515625, 0.3463134765625, 0.38397216796875, 0.421630859375, 0.45928955078125, 0.4969482421875, 0.53460693359375, 0.572265625, 0.60992431640625, 0.6475830078125, 0.68524169921875, 0.722900390625, 0.76055908203125, 0.7982177734375, 0.83587646484375, 0.87353515625, 0.91119384765625, 0.9488525390625, 0.98651123046875, 1.024169921875, 1.06182861328125, 1.0994873046875, 1.13714599609375, 1.1748046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 6.0, 11.0, 21.0, 28.0, 38.0, 85.0, 165.0, 542.0, 2078.0, 683.0, 200.0, 93.0, 33.0, 23.0, 17.0, 10.0, 4.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.634429931640625, -0.61798095703125, -0.601531982421875, -0.5850830078125, -0.568634033203125, -0.55218505859375, -0.535736083984375, -0.519287109375, -0.502838134765625, -0.48638916015625, -0.469940185546875, -0.4534912109375, -0.437042236328125, -0.42059326171875, -0.404144287109375, -0.3876953125, -0.371246337890625, -0.35479736328125, -0.338348388671875, -0.3218994140625, -0.305450439453125, -0.28900146484375, -0.272552490234375, -0.256103515625, -0.239654541015625, -0.22320556640625, -0.206756591796875, -0.1903076171875, -0.173858642578125, -0.15740966796875, -0.140960693359375, -0.12451171875, -0.108062744140625, -0.09161376953125, -0.075164794921875, -0.0587158203125, -0.042266845703125, -0.02581787109375, -0.009368896484375, 0.007080078125, 0.023529052734375, 0.03997802734375, 0.056427001953125, 0.0728759765625, 0.089324951171875, 0.10577392578125, 0.122222900390625, 0.138671875, 0.155120849609375, 0.17156982421875, 0.188018798828125, 0.2044677734375, 0.220916748046875, 0.23736572265625, 0.253814697265625, 0.270263671875, 0.286712646484375, 0.30316162109375, 0.319610595703125, 0.3360595703125, 0.352508544921875, 0.36895751953125, 0.385406494140625, 0.40185546875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 13.0, 29.0, 91.0, 270.0, 349.0, 182.0, 48.0, 16.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.683925151824951, -6.545823097229004, -6.407721519470215, -6.269619941711426, -6.1315178871154785, -5.993415832519531, -5.855314254760742, -5.717212677001953, -5.579110622406006, -5.441008567810059, -5.3029069900512695, -5.1648054122924805, -5.026703357696533, -4.888601303100586, -4.750499725341797, -4.612398147583008, -4.4742960929870605, -4.336194038391113, -4.198092460632324, -4.059990882873535, -3.921888828277588, -3.7837870121002197, -3.6456851959228516, -3.5075833797454834, -3.3694815635681152, -3.231379747390747, -3.093277931213379, -2.9551761150360107, -2.8170742988586426, -2.6789724826812744, -2.5408706665039062, -2.402768850326538, -2.264667510986328, -2.12656569480896, -1.9884638786315918, -1.8503620624542236, -1.7122602462768555, -1.5741584300994873, -1.4360566139221191, -1.297954797744751, -1.1598529815673828, -1.0217511653900146, -0.8836493492126465, -0.7455475330352783, -0.6074457168579102, -0.469343900680542, -0.33124208450317383, -0.19314026832580566, -0.0550384521484375, 0.08306336402893066, 0.22116518020629883, 0.359266996383667, 0.49736881256103516, 0.6354706287384033, 0.7735724449157715, 0.9116742610931396, 1.0497760772705078, 1.187877893447876, 1.3259797096252441, 1.4640815258026123, 1.6021833419799805, 1.7402851581573486, 1.8783869743347168, 2.016488790512085, 2.154590606689453]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 5.0, 10.0, 6.0, 9.0, 11.0, 14.0, 15.0, 29.0, 27.0, 28.0, 35.0, 47.0, 45.0, 53.0, 54.0, 53.0, 59.0, 57.0, 37.0, 57.0, 58.0, 62.0, 40.0, 40.0, 26.0, 28.0, 17.0, 23.0, 12.0, 11.0, 13.0, 5.0, 3.0, 5.0, 2.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3751063346862793, -1.328284502029419, -1.2814627885818481, -1.2346409559249878, -1.187819242477417, -1.1409974098205566, -1.0941755771636963, -1.047353744506836, -1.0005320310592651, -0.9537102580070496, -0.906888484954834, -0.8600666522979736, -0.8132448792457581, -0.7664231061935425, -0.7196012735366821, -0.6727795004844666, -0.625957727432251, -0.5791359543800354, -0.5323141813278198, -0.4854923486709595, -0.4386705756187439, -0.3918488025665283, -0.34502699971199036, -0.2982051968574524, -0.2513834238052368, -0.20456163585186005, -0.15773984789848328, -0.1109180599451065, -0.06409627199172974, -0.017274484038352966, 0.029547303915023804, 0.07636910676956177, 0.12319076061248779, 0.17001254856586456, 0.21683433651924133, 0.2636561393737793, 0.3104779124259949, 0.35729968547821045, 0.4041214883327484, 0.4509432911872864, 0.49776506423950195, 0.5445868372917175, 0.5914086103439331, 0.6382304430007935, 0.685052216053009, 0.7318739891052246, 0.778695821762085, 0.8255175948143005, 0.8723393678665161, 0.9191611409187317, 0.9659829139709473, 1.0128047466278076, 1.059626579284668, 1.1064482927322388, 1.1532701253890991, 1.20009183883667, 1.2469136714935303, 1.2937355041503906, 1.3405572175979614, 1.3873790502548218, 1.4342007637023926, 1.481022596359253, 1.5278444290161133, 1.5746662616729736, 1.6214879751205444]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 6.0, 13.0, 22.0, 33.0, 40.0, 73.0, 106.0, 161.0, 288.0, 420.0, 804.0, 1721.0, 4538.0, 19685.0, 168441.0, 695852.0, 132214.0, 16731.0, 4100.0, 1491.0, 734.0, 395.0, 232.0, 150.0, 92.0, 73.0, 40.0, 34.0, 24.0, 10.0, 5.0, 9.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.79296875, -1.7340850830078125, -1.675201416015625, -1.6163177490234375, -1.55743408203125, -1.4985504150390625, -1.439666748046875, -1.3807830810546875, -1.3218994140625, -1.2630157470703125, -1.204132080078125, -1.1452484130859375, -1.08636474609375, -1.0274810791015625, -0.968597412109375, -0.9097137451171875, -0.850830078125, -0.7919464111328125, -0.733062744140625, -0.6741790771484375, -0.61529541015625, -0.5564117431640625, -0.497528076171875, -0.4386444091796875, -0.3797607421875, -0.3208770751953125, -0.261993408203125, -0.2031097412109375, -0.14422607421875, -0.0853424072265625, -0.026458740234375, 0.0324249267578125, 0.09130859375, 0.1501922607421875, 0.209075927734375, 0.2679595947265625, 0.32684326171875, 0.3857269287109375, 0.444610595703125, 0.5034942626953125, 0.5623779296875, 0.6212615966796875, 0.680145263671875, 0.7390289306640625, 0.79791259765625, 0.8567962646484375, 0.915679931640625, 0.9745635986328125, 1.033447265625, 1.0923309326171875, 1.151214599609375, 1.2100982666015625, 1.26898193359375, 1.3278656005859375, 1.386749267578125, 1.4456329345703125, 1.5045166015625, 1.5634002685546875, 1.622283935546875, 1.6811676025390625, 1.74005126953125, 1.7989349365234375, 1.857818603515625, 1.9167022705078125, 1.9755859375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 12.0, 19.0, 45.0, 69.0, 95.0, 138.0, 126.0, 144.0, 112.0, 93.0, 74.0, 24.0, 18.0, 17.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69873046875, -0.681610107421875, -0.66448974609375, -0.647369384765625, -0.6302490234375, -0.613128662109375, -0.59600830078125, -0.578887939453125, -0.561767578125, -0.544647216796875, -0.52752685546875, -0.510406494140625, -0.4932861328125, -0.476165771484375, -0.45904541015625, -0.441925048828125, -0.4248046875, -0.407684326171875, -0.39056396484375, -0.373443603515625, -0.3563232421875, -0.339202880859375, -0.32208251953125, -0.304962158203125, -0.287841796875, -0.270721435546875, -0.25360107421875, -0.236480712890625, -0.2193603515625, -0.202239990234375, -0.18511962890625, -0.167999267578125, -0.15087890625, -0.133758544921875, -0.11663818359375, -0.099517822265625, -0.0823974609375, -0.065277099609375, -0.04815673828125, -0.031036376953125, -0.013916015625, 0.003204345703125, 0.02032470703125, 0.037445068359375, 0.0545654296875, 0.071685791015625, 0.08880615234375, 0.105926513671875, 0.123046875, 0.140167236328125, 0.15728759765625, 0.174407958984375, 0.1915283203125, 0.208648681640625, 0.22576904296875, 0.242889404296875, 0.260009765625, 0.277130126953125, 0.29425048828125, 0.311370849609375, 0.3284912109375, 0.345611572265625, 0.36273193359375, 0.379852294921875, 0.39697265625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 8.0, 14.0, 18.0, 14.0, 29.0, 39.0, 49.0, 74.0, 67.0, 149.0, 200.0, 322.0, 485.0, 844.0, 1657.0, 3538.0, 9046.0, 26909.0, 96452.0, 341704.0, 393334.0, 121407.0, 32868.0, 10854.0, 4058.0, 1887.0, 870.0, 567.0, 331.0, 235.0, 147.0, 106.0, 74.0, 53.0, 40.0, 25.0, 26.0, 17.0, 5.0, 7.0, 4.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.93603515625, -0.9068603515625, -0.877685546875, -0.8485107421875, -0.8193359375, -0.7901611328125, -0.760986328125, -0.7318115234375, -0.70263671875, -0.6734619140625, -0.644287109375, -0.6151123046875, -0.5859375, -0.5567626953125, -0.527587890625, -0.4984130859375, -0.46923828125, -0.4400634765625, -0.410888671875, -0.3817138671875, -0.3525390625, -0.3233642578125, -0.294189453125, -0.2650146484375, -0.23583984375, -0.2066650390625, -0.177490234375, -0.1483154296875, -0.119140625, -0.0899658203125, -0.060791015625, -0.0316162109375, -0.00244140625, 0.0267333984375, 0.055908203125, 0.0850830078125, 0.1142578125, 0.1434326171875, 0.172607421875, 0.2017822265625, 0.23095703125, 0.2601318359375, 0.289306640625, 0.3184814453125, 0.34765625, 0.3768310546875, 0.406005859375, 0.4351806640625, 0.46435546875, 0.4935302734375, 0.522705078125, 0.5518798828125, 0.5810546875, 0.6102294921875, 0.639404296875, 0.6685791015625, 0.69775390625, 0.7269287109375, 0.756103515625, 0.7852783203125, 0.814453125, 0.8436279296875, 0.872802734375, 0.9019775390625, 0.93115234375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 15.0, 16.0, 14.0, 11.0, 28.0, 34.0, 26.0, 30.0, 39.0, 38.0, 35.0, 42.0, 44.0, 33.0, 49.0, 56.0, 55.0, 45.0, 43.0, 43.0, 38.0, 43.0, 32.0, 31.0, 22.0, 23.0, 21.0, 11.0, 16.0, 14.0, 10.0, 9.0, 6.0, 3.0, 3.0, 9.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1240234375, -1.0903778076171875, -1.056732177734375, -1.0230865478515625, -0.98944091796875, -0.9557952880859375, -0.922149658203125, -0.8885040283203125, -0.8548583984375, -0.8212127685546875, -0.787567138671875, -0.7539215087890625, -0.72027587890625, -0.6866302490234375, -0.652984619140625, -0.6193389892578125, -0.585693359375, -0.5520477294921875, -0.518402099609375, -0.4847564697265625, -0.45111083984375, -0.4174652099609375, -0.383819580078125, -0.3501739501953125, -0.3165283203125, -0.2828826904296875, -0.249237060546875, -0.2155914306640625, -0.18194580078125, -0.1483001708984375, -0.114654541015625, -0.0810089111328125, -0.04736328125, -0.0137176513671875, 0.019927978515625, 0.0535736083984375, 0.08721923828125, 0.1208648681640625, 0.154510498046875, 0.1881561279296875, 0.2218017578125, 0.2554473876953125, 0.289093017578125, 0.3227386474609375, 0.35638427734375, 0.3900299072265625, 0.423675537109375, 0.4573211669921875, 0.490966796875, 0.5246124267578125, 0.558258056640625, 0.5919036865234375, 0.62554931640625, 0.6591949462890625, 0.692840576171875, 0.7264862060546875, 0.7601318359375, 0.7937774658203125, 0.827423095703125, 0.8610687255859375, 0.89471435546875, 0.9283599853515625, 0.962005615234375, 0.9956512451171875, 1.029296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 10.0, 18.0, 32.0, 54.0, 103.0, 221.0, 410.0, 837.0, 2239.0, 7692.0, 43191.0, 391707.0, 525617.0, 61758.0, 10006.0, 2709.0, 964.0, 423.0, 231.0, 138.0, 65.0, 36.0, 29.0, 14.0, 13.0, 8.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55517578125, -0.5402069091796875, -0.525238037109375, -0.5102691650390625, -0.49530029296875, -0.4803314208984375, -0.465362548828125, -0.4503936767578125, -0.4354248046875, -0.4204559326171875, -0.405487060546875, -0.3905181884765625, -0.37554931640625, -0.3605804443359375, -0.345611572265625, -0.3306427001953125, -0.315673828125, -0.3007049560546875, -0.285736083984375, -0.2707672119140625, -0.25579833984375, -0.2408294677734375, -0.225860595703125, -0.2108917236328125, -0.1959228515625, -0.1809539794921875, -0.165985107421875, -0.1510162353515625, -0.13604736328125, -0.1210784912109375, -0.106109619140625, -0.0911407470703125, -0.076171875, -0.0612030029296875, -0.046234130859375, -0.0312652587890625, -0.01629638671875, -0.0013275146484375, 0.013641357421875, 0.0286102294921875, 0.0435791015625, 0.0585479736328125, 0.073516845703125, 0.0884857177734375, 0.10345458984375, 0.1184234619140625, 0.133392333984375, 0.1483612060546875, 0.163330078125, 0.1782989501953125, 0.193267822265625, 0.2082366943359375, 0.22320556640625, 0.2381744384765625, 0.253143310546875, 0.2681121826171875, 0.2830810546875, 0.2980499267578125, 0.313018798828125, 0.3279876708984375, 0.34295654296875, 0.3579254150390625, 0.372894287109375, 0.3878631591796875, 0.40283203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 8.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 10.0, 13.0, 9.0, 20.0, 22.0, 32.0, 36.0, 29.0, 38.0, 57.0, 64.0, 57.0, 52.0, 68.0, 73.0, 51.0, 52.0, 50.0, 34.0, 33.0, 34.0, 22.0, 18.0, 17.0, 9.0, 16.0, 9.0, 6.0, 7.0, 7.0, 8.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.855062484741211e-05, -2.75392085313797e-05, -2.652779221534729e-05, -2.551637589931488e-05, -2.450495958328247e-05, -2.349354326725006e-05, -2.248212695121765e-05, -2.1470710635185242e-05, -2.0459294319152832e-05, -1.9447878003120422e-05, -1.8436461687088013e-05, -1.7425045371055603e-05, -1.6413629055023193e-05, -1.5402212738990784e-05, -1.4390796422958374e-05, -1.3379380106925964e-05, -1.2367963790893555e-05, -1.1356547474861145e-05, -1.0345131158828735e-05, -9.333714842796326e-06, -8.322298526763916e-06, -7.310882210731506e-06, -6.299465894699097e-06, -5.288049578666687e-06, -4.276633262634277e-06, -3.2652169466018677e-06, -2.253800630569458e-06, -1.2423843145370483e-06, -2.3096799850463867e-07, 7.80448317527771e-07, 1.7918646335601807e-06, 2.8032809495925903e-06, 3.814697265625e-06, 4.82611358165741e-06, 5.837529897689819e-06, 6.848946213722229e-06, 7.860362529754639e-06, 8.871778845787048e-06, 9.883195161819458e-06, 1.0894611477851868e-05, 1.1906027793884277e-05, 1.2917444109916687e-05, 1.3928860425949097e-05, 1.4940276741981506e-05, 1.5951693058013916e-05, 1.6963109374046326e-05, 1.7974525690078735e-05, 1.8985942006111145e-05, 1.9997358322143555e-05, 2.1008774638175964e-05, 2.2020190954208374e-05, 2.3031607270240784e-05, 2.4043023586273193e-05, 2.5054439902305603e-05, 2.6065856218338013e-05, 2.7077272534370422e-05, 2.8088688850402832e-05, 2.9100105166435242e-05, 3.011152148246765e-05, 3.112293779850006e-05, 3.213435411453247e-05, 3.314577043056488e-05, 3.415718674659729e-05, 3.51686030626297e-05, 3.618001937866211e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 10.0, 7.0, 11.0, 13.0, 27.0, 22.0, 25.0, 41.0, 58.0, 105.0, 177.0, 265.0, 421.0, 666.0, 1165.0, 2389.0, 4909.0, 13323.0, 43157.0, 175347.0, 475388.0, 242874.0, 58530.0, 17165.0, 6352.0, 2679.0, 1389.0, 770.0, 391.0, 248.0, 174.0, 131.0, 99.0, 54.0, 51.0, 24.0, 25.0, 9.0, 15.0, 10.0, 8.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.25927734375, -0.2505226135253906, -0.24176788330078125, -0.23301315307617188, -0.2242584228515625, -0.21550369262695312, -0.20674896240234375, -0.19799423217773438, -0.189239501953125, -0.18048477172851562, -0.17173004150390625, -0.16297531127929688, -0.1542205810546875, -0.14546585083007812, -0.13671112060546875, -0.12795639038085938, -0.11920166015625, -0.11044692993164062, -0.10169219970703125, -0.09293746948242188, -0.0841827392578125, -0.07542800903320312, -0.06667327880859375, -0.057918548583984375, -0.049163818359375, -0.040409088134765625, -0.03165435791015625, -0.022899627685546875, -0.0141448974609375, -0.005390167236328125, 0.00336456298828125, 0.012119293212890625, 0.0208740234375, 0.029628753662109375, 0.03838348388671875, 0.047138214111328125, 0.0558929443359375, 0.06464767456054688, 0.07340240478515625, 0.08215713500976562, 0.090911865234375, 0.09966659545898438, 0.10842132568359375, 0.11717605590820312, 0.1259307861328125, 0.13468551635742188, 0.14344024658203125, 0.15219497680664062, 0.16094970703125, 0.16970443725585938, 0.17845916748046875, 0.18721389770507812, 0.1959686279296875, 0.20472335815429688, 0.21347808837890625, 0.22223281860351562, 0.230987548828125, 0.23974227905273438, 0.24849700927734375, 0.2572517395019531, 0.2660064697265625, 0.2747611999511719, 0.28351593017578125, 0.2922706604003906, 0.301025390625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 8.0, 10.0, 11.0, 14.0, 14.0, 14.0, 28.0, 32.0, 47.0, 32.0, 63.0, 60.0, 75.0, 74.0, 66.0, 72.0, 72.0, 63.0, 45.0, 42.0, 29.0, 31.0, 23.0, 16.0, 10.0, 6.0, 7.0, 5.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28369140625, -0.2751617431640625, -0.266632080078125, -0.2581024169921875, -0.24957275390625, -0.2410430908203125, -0.232513427734375, -0.2239837646484375, -0.2154541015625, -0.2069244384765625, -0.198394775390625, -0.1898651123046875, -0.18133544921875, -0.1728057861328125, -0.164276123046875, -0.1557464599609375, -0.147216796875, -0.1386871337890625, -0.130157470703125, -0.1216278076171875, -0.11309814453125, -0.1045684814453125, -0.096038818359375, -0.0875091552734375, -0.0789794921875, -0.0704498291015625, -0.061920166015625, -0.0533905029296875, -0.04486083984375, -0.0363311767578125, -0.027801513671875, -0.0192718505859375, -0.0107421875, -0.0022125244140625, 0.006317138671875, 0.0148468017578125, 0.02337646484375, 0.0319061279296875, 0.040435791015625, 0.0489654541015625, 0.0574951171875, 0.0660247802734375, 0.074554443359375, 0.0830841064453125, 0.09161376953125, 0.1001434326171875, 0.108673095703125, 0.1172027587890625, 0.125732421875, 0.1342620849609375, 0.142791748046875, 0.1513214111328125, 0.15985107421875, 0.1683807373046875, 0.176910400390625, 0.1854400634765625, 0.1939697265625, 0.2024993896484375, 0.211029052734375, 0.2195587158203125, 0.22808837890625, 0.2366180419921875, 0.245147705078125, 0.2536773681640625, 0.26220703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 13.0, 20.0, 51.0, 84.0, 185.0, 265.0, 198.0, 113.0, 45.0, 14.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.251853942871094, -17.866985321044922, -17.48211669921875, -17.097248077392578, -16.712379455566406, -16.3275089263916, -15.94264030456543, -15.557771682739258, -15.172903060913086, -14.788034439086914, -14.403165817260742, -14.018296241760254, -13.633427619934082, -13.24855899810791, -12.863689422607422, -12.47882080078125, -12.093952178955078, -11.709083557128906, -11.324214935302734, -10.939345359802246, -10.554476737976074, -10.169608116149902, -9.784738540649414, -9.399869918823242, -9.01500129699707, -8.630132675170898, -8.245264053344727, -7.860394477844238, -7.475525856018066, -7.0906572341918945, -6.7057881355285645, -6.320919036865234, -5.936049461364746, -5.551180839538574, -5.166311740875244, -4.781442642211914, -4.396574020385742, -4.01170539855957, -3.6268362998962402, -3.2419674396514893, -2.8570985794067383, -2.4722297191619873, -2.0873608589172363, -1.7024919986724854, -1.3176231384277344, -0.9327542781829834, -0.5478854179382324, -0.16301655769348145, 0.22185230255126953, 0.6067211627960205, 0.9915900230407715, 1.3764588832855225, 1.7613277435302734, 2.1461966037750244, 2.5310654640197754, 2.9159343242645264, 3.3008031845092773, 3.6856720447540283, 4.070540904998779, 4.455410003662109, 4.840278625488281, 5.225147247314453, 5.610016345977783, 5.994885444641113, 6.379754066467285]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 11.0, 11.0, 6.0, 12.0, 13.0, 13.0, 16.0, 29.0, 20.0, 30.0, 38.0, 34.0, 40.0, 56.0, 39.0, 48.0, 50.0, 59.0, 50.0, 54.0, 51.0, 42.0, 43.0, 30.0, 37.0, 23.0, 22.0, 26.0, 23.0, 18.0, 12.0, 11.0, 7.0, 10.0, 3.0, 3.0, 6.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.566643714904785, -6.343291282653809, -6.11993932723999, -5.896586894989014, -5.673234462738037, -5.449882507324219, -5.226530075073242, -5.003177642822266, -4.779825687408447, -4.556473255157471, -4.333121299743652, -4.109768867492676, -3.8864166736602783, -3.663064479827881, -3.4397120475769043, -3.216359853744507, -2.9930074214935303, -2.769655227661133, -2.5463027954101562, -2.322950601577759, -2.0995984077453613, -1.8762460947036743, -1.6528937816619873, -1.4295415878295898, -1.2061892747879028, -0.9828370213508606, -0.7594847679138184, -0.5361324548721313, -0.3127802014350891, -0.08942794799804688, 0.13392436504364014, 0.3572765588760376, 0.5806288719177246, 0.8039811253547668, 1.027333378791809, 1.250685691833496, 1.4740378856658936, 1.6973901987075806, 1.9207425117492676, 2.144094705581665, 2.3674468994140625, 2.59079909324646, 2.8141515254974365, 3.037503719329834, 3.2608559131622314, 3.484208106994629, 3.7075605392456055, 3.930912733078003, 4.154265403747559, 4.377617835998535, 4.6009697914123535, 4.82432222366333, 5.047674655914307, 5.271026611328125, 5.494379043579102, 5.717731475830078, 5.9410834312438965, 6.164435863494873, 6.387787818908691, 6.611140251159668, 6.8344926834106445, 7.057844638824463, 7.2811970710754395, 7.504549026489258, 7.727901458740234]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 8.0, 21.0, 14.0, 23.0, 24.0, 51.0, 81.0, 119.0, 192.0, 416.0, 737.0, 1692.0, 4983.0, 28416.0, 3716503.0, 418818.0, 16257.0, 3589.0, 1155.0, 547.0, 259.0, 142.0, 81.0, 45.0, 22.0, 19.0, 16.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.97265625, -1.9107513427734375, -1.848846435546875, -1.7869415283203125, -1.72503662109375, -1.6631317138671875, -1.601226806640625, -1.5393218994140625, -1.4774169921875, -1.4155120849609375, -1.353607177734375, -1.2917022705078125, -1.22979736328125, -1.1678924560546875, -1.105987548828125, -1.0440826416015625, -0.982177734375, -0.9202728271484375, -0.858367919921875, -0.7964630126953125, -0.73455810546875, -0.6726531982421875, -0.610748291015625, -0.5488433837890625, -0.4869384765625, -0.4250335693359375, -0.363128662109375, -0.3012237548828125, -0.23931884765625, -0.1774139404296875, -0.115509033203125, -0.0536041259765625, 0.00830078125, 0.0702056884765625, 0.132110595703125, 0.1940155029296875, 0.25592041015625, 0.3178253173828125, 0.379730224609375, 0.4416351318359375, 0.5035400390625, 0.5654449462890625, 0.627349853515625, 0.6892547607421875, 0.75115966796875, 0.8130645751953125, 0.874969482421875, 0.9368743896484375, 0.998779296875, 1.0606842041015625, 1.122589111328125, 1.1844940185546875, 1.24639892578125, 1.3083038330078125, 1.370208740234375, 1.4321136474609375, 1.4940185546875, 1.5559234619140625, 1.617828369140625, 1.6797332763671875, 1.74163818359375, 1.8035430908203125, 1.865447998046875, 1.9273529052734375, 1.9892578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 13.0, 37.0, 47.0, 63.0, 91.0, 113.0, 119.0, 125.0, 122.0, 99.0, 57.0, 43.0, 21.0, 15.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72802734375, -0.7097702026367188, -0.6915130615234375, -0.6732559204101562, -0.654998779296875, -0.6367416381835938, -0.6184844970703125, -0.6002273559570312, -0.58197021484375, -0.5637130737304688, -0.5454559326171875, -0.5271987915039062, -0.508941650390625, -0.49068450927734375, -0.4724273681640625, -0.45417022705078125, -0.4359130859375, -0.41765594482421875, -0.3993988037109375, -0.38114166259765625, -0.362884521484375, -0.34462738037109375, -0.3263702392578125, -0.30811309814453125, -0.28985595703125, -0.27159881591796875, -0.2533416748046875, -0.23508453369140625, -0.216827392578125, -0.19857025146484375, -0.1803131103515625, -0.16205596923828125, -0.143798828125, -0.12554168701171875, -0.1072845458984375, -0.08902740478515625, -0.070770263671875, -0.05251312255859375, -0.0342559814453125, -0.01599884033203125, 0.00225830078125, 0.02051544189453125, 0.0387725830078125, 0.05702972412109375, 0.075286865234375, 0.09354400634765625, 0.1118011474609375, 0.13005828857421875, 0.1483154296875, 0.16657257080078125, 0.1848297119140625, 0.20308685302734375, 0.221343994140625, 0.23960113525390625, 0.2578582763671875, 0.27611541748046875, 0.29437255859375, 0.31262969970703125, 0.3308868408203125, 0.34914398193359375, 0.367401123046875, 0.38565826416015625, 0.4039154052734375, 0.42217254638671875, 0.4404296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 12.0, 12.0, 24.0, 32.0, 57.0, 114.0, 216.0, 399.0, 792.0, 1663.0, 4429.0, 21256.0, 440252.0, 3662016.0, 50992.0, 7590.0, 2339.0, 1007.0, 480.0, 260.0, 153.0, 91.0, 40.0, 25.0, 12.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7158203125, -1.6641387939453125, -1.612457275390625, -1.5607757568359375, -1.50909423828125, -1.4574127197265625, -1.405731201171875, -1.3540496826171875, -1.3023681640625, -1.2506866455078125, -1.199005126953125, -1.1473236083984375, -1.09564208984375, -1.0439605712890625, -0.992279052734375, -0.9405975341796875, -0.888916015625, -0.8372344970703125, -0.785552978515625, -0.7338714599609375, -0.68218994140625, -0.6305084228515625, -0.578826904296875, -0.5271453857421875, -0.4754638671875, -0.4237823486328125, -0.372100830078125, -0.3204193115234375, -0.26873779296875, -0.2170562744140625, -0.165374755859375, -0.1136932373046875, -0.06201171875, -0.0103302001953125, 0.041351318359375, 0.0930328369140625, 0.14471435546875, 0.1963958740234375, 0.248077392578125, 0.2997589111328125, 0.3514404296875, 0.4031219482421875, 0.454803466796875, 0.5064849853515625, 0.55816650390625, 0.6098480224609375, 0.661529541015625, 0.7132110595703125, 0.764892578125, 0.8165740966796875, 0.868255615234375, 0.9199371337890625, 0.97161865234375, 1.0233001708984375, 1.074981689453125, 1.1266632080078125, 1.1783447265625, 1.2300262451171875, 1.281707763671875, 1.3333892822265625, 1.38507080078125, 1.4367523193359375, 1.488433837890625, 1.5401153564453125, 1.591796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 10.0, 10.0, 19.0, 35.0, 61.0, 157.0, 420.0, 2141.0, 826.0, 208.0, 83.0, 29.0, 21.0, 14.0, 13.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85205078125, -0.827484130859375, -0.80291748046875, -0.778350830078125, -0.7537841796875, -0.729217529296875, -0.70465087890625, -0.680084228515625, -0.655517578125, -0.630950927734375, -0.60638427734375, -0.581817626953125, -0.5572509765625, -0.532684326171875, -0.50811767578125, -0.483551025390625, -0.458984375, -0.434417724609375, -0.40985107421875, -0.385284423828125, -0.3607177734375, -0.336151123046875, -0.31158447265625, -0.287017822265625, -0.262451171875, -0.237884521484375, -0.21331787109375, -0.188751220703125, -0.1641845703125, -0.139617919921875, -0.11505126953125, -0.090484619140625, -0.06591796875, -0.041351318359375, -0.01678466796875, 0.007781982421875, 0.0323486328125, 0.056915283203125, 0.08148193359375, 0.106048583984375, 0.130615234375, 0.155181884765625, 0.17974853515625, 0.204315185546875, 0.2288818359375, 0.253448486328125, 0.27801513671875, 0.302581787109375, 0.3271484375, 0.351715087890625, 0.37628173828125, 0.400848388671875, 0.4254150390625, 0.449981689453125, 0.47454833984375, 0.499114990234375, 0.523681640625, 0.548248291015625, 0.57281494140625, 0.597381591796875, 0.6219482421875, 0.646514892578125, 0.67108154296875, 0.695648193359375, 0.72021484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 40.0, 80.0, 173.0, 252.0, 242.0, 121.0, 41.0, 27.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.880246162414551, -6.733365058898926, -6.586483478546143, -6.439601898193359, -6.292720794677734, -6.145839691162109, -5.998958110809326, -5.852076530456543, -5.705195426940918, -5.558314323425293, -5.41143274307251, -5.264551162719727, -5.117670059204102, -4.970788955688477, -4.823907375335693, -4.67702579498291, -4.530144691467285, -4.38326358795166, -4.236382007598877, -4.089500427246094, -3.9426193237304688, -3.7957379817962646, -3.6488566398620605, -3.5019752979278564, -3.3550939559936523, -3.2082126140594482, -3.061331272125244, -2.91444993019104, -2.767568588256836, -2.620687246322632, -2.4738059043884277, -2.3269245624542236, -2.1800436973571777, -2.0331623554229736, -1.8862810134887695, -1.7393996715545654, -1.5925183296203613, -1.4456369876861572, -1.2987556457519531, -1.151874303817749, -1.004992961883545, -0.8581116199493408, -0.7112302780151367, -0.5643489360809326, -0.4174675941467285, -0.2705862522125244, -0.12370491027832031, 0.02317643165588379, 0.1700577735900879, 0.316939115524292, 0.4638204574584961, 0.6107017993927002, 0.7575831413269043, 0.9044644832611084, 1.0513458251953125, 1.1982271671295166, 1.3451085090637207, 1.4919898509979248, 1.638871192932129, 1.785752534866333, 1.932633876800537, 2.079515218734741, 2.2263965606689453, 2.3732779026031494, 2.5201592445373535]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 8.0, 8.0, 6.0, 22.0, 20.0, 18.0, 22.0, 27.0, 26.0, 37.0, 23.0, 23.0, 39.0, 36.0, 32.0, 38.0, 52.0, 37.0, 34.0, 38.0, 39.0, 41.0, 39.0, 35.0, 26.0, 40.0, 31.0, 26.0, 23.0, 19.0, 23.0, 16.0, 13.0, 8.0, 13.0, 9.0, 6.0, 6.0, 9.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.476900577545166, -1.4313163757324219, -1.3857322931289673, -1.3401480913162231, -1.2945640087127686, -1.2489798069000244, -1.2033957242965698, -1.1578115224838257, -1.112227439880371, -1.066643238067627, -1.0210591554641724, -0.975475013256073, -0.9298908710479736, -0.8843067288398743, -0.8387225866317749, -0.7931383848190308, -0.7475542426109314, -0.701970100402832, -0.6563859581947327, -0.6108018159866333, -0.5652176737785339, -0.5196335315704346, -0.4740493595600128, -0.42846521735191345, -0.3828810751438141, -0.3372969329357147, -0.29171279072761536, -0.2461286336183548, -0.20054449141025543, -0.15496034920215607, -0.10937619209289551, -0.06379204988479614, -0.018207907676696777, 0.027376238256692886, 0.07296038419008255, 0.11854453384876251, 0.16412867605686188, 0.20971281826496124, 0.2552969753742218, 0.30088111758232117, 0.34646525979042053, 0.3920494019985199, 0.43763354420661926, 0.483217716217041, 0.5288018584251404, 0.5743860006332397, 0.6199701428413391, 0.6655542850494385, 0.7111384272575378, 0.7567225694656372, 0.8023067116737366, 0.8478908538818359, 0.8934749960899353, 0.9390591382980347, 0.9846433401107788, 1.0302274227142334, 1.0758116245269775, 1.1213958263397217, 1.1669799089431763, 1.2125641107559204, 1.258148193359375, 1.3037323951721191, 1.3493164777755737, 1.3949006795883179, 1.4404847621917725]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 6.0, 5.0, 7.0, 13.0, 18.0, 16.0, 20.0, 35.0, 46.0, 60.0, 85.0, 105.0, 150.0, 250.0, 344.0, 627.0, 985.0, 2102.0, 4824.0, 13253.0, 48432.0, 286135.0, 573839.0, 84055.0, 20088.0, 6728.0, 2818.0, 1346.0, 733.0, 431.0, 293.0, 213.0, 136.0, 59.0, 68.0, 42.0, 38.0, 22.0, 27.0, 20.0, 17.0, 10.0, 6.0, 15.0, 3.0, 7.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.259765625, -1.2193603515625, -1.178955078125, -1.1385498046875, -1.09814453125, -1.0577392578125, -1.017333984375, -0.9769287109375, -0.9365234375, -0.8961181640625, -0.855712890625, -0.8153076171875, -0.77490234375, -0.7344970703125, -0.694091796875, -0.6536865234375, -0.61328125, -0.5728759765625, -0.532470703125, -0.4920654296875, -0.45166015625, -0.4112548828125, -0.370849609375, -0.3304443359375, -0.2900390625, -0.2496337890625, -0.209228515625, -0.1688232421875, -0.12841796875, -0.0880126953125, -0.047607421875, -0.0072021484375, 0.033203125, 0.0736083984375, 0.114013671875, 0.1544189453125, 0.19482421875, 0.2352294921875, 0.275634765625, 0.3160400390625, 0.3564453125, 0.3968505859375, 0.437255859375, 0.4776611328125, 0.51806640625, 0.5584716796875, 0.598876953125, 0.6392822265625, 0.6796875, 0.7200927734375, 0.760498046875, 0.8009033203125, 0.84130859375, 0.8817138671875, 0.922119140625, 0.9625244140625, 1.0029296875, 1.0433349609375, 1.083740234375, 1.1241455078125, 1.16455078125, 1.2049560546875, 1.245361328125, 1.2857666015625, 1.326171875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 7.0, 30.0, 35.0, 54.0, 77.0, 102.0, 137.0, 122.0, 122.0, 120.0, 70.0, 38.0, 33.0, 21.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73095703125, -0.7123603820800781, -0.6937637329101562, -0.6751670837402344, -0.6565704345703125, -0.6379737854003906, -0.6193771362304688, -0.6007804870605469, -0.582183837890625, -0.5635871887207031, -0.5449905395507812, -0.5263938903808594, -0.5077972412109375, -0.4892005920410156, -0.47060394287109375, -0.4520072937011719, -0.43341064453125, -0.4148139953613281, -0.39621734619140625, -0.3776206970214844, -0.3590240478515625, -0.3404273986816406, -0.32183074951171875, -0.3032341003417969, -0.284637451171875, -0.2660408020019531, -0.24744415283203125, -0.22884750366210938, -0.2102508544921875, -0.19165420532226562, -0.17305755615234375, -0.15446090698242188, -0.1358642578125, -0.11726760864257812, -0.09867095947265625, -0.08007431030273438, -0.0614776611328125, -0.042881011962890625, -0.02428436279296875, -0.005687713623046875, 0.012908935546875, 0.031505584716796875, 0.05010223388671875, 0.06869888305664062, 0.0872955322265625, 0.10589218139648438, 0.12448883056640625, 0.14308547973632812, 0.16168212890625, 0.18027877807617188, 0.19887542724609375, 0.21747207641601562, 0.2360687255859375, 0.2546653747558594, 0.27326202392578125, 0.2918586730957031, 0.310455322265625, 0.3290519714355469, 0.34764862060546875, 0.3662452697753906, 0.3848419189453125, 0.4034385681152344, 0.42203521728515625, 0.4406318664550781, 0.459228515625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 6.0, 15.0, 22.0, 26.0, 30.0, 38.0, 57.0, 87.0, 113.0, 208.0, 316.0, 554.0, 978.0, 2134.0, 5101.0, 16664.0, 73566.0, 539938.0, 337210.0, 51015.0, 12465.0, 4057.0, 1753.0, 870.0, 468.0, 257.0, 177.0, 105.0, 85.0, 50.0, 49.0, 31.0, 23.0, 14.0, 14.0, 5.0, 5.0, 5.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.306640625, -1.2680816650390625, -1.229522705078125, -1.1909637451171875, -1.15240478515625, -1.1138458251953125, -1.075286865234375, -1.0367279052734375, -0.9981689453125, -0.9596099853515625, -0.921051025390625, -0.8824920654296875, -0.84393310546875, -0.8053741455078125, -0.766815185546875, -0.7282562255859375, -0.689697265625, -0.6511383056640625, -0.612579345703125, -0.5740203857421875, -0.53546142578125, -0.4969024658203125, -0.458343505859375, -0.4197845458984375, -0.3812255859375, -0.3426666259765625, -0.304107666015625, -0.2655487060546875, -0.22698974609375, -0.1884307861328125, -0.149871826171875, -0.1113128662109375, -0.07275390625, -0.0341949462890625, 0.004364013671875, 0.0429229736328125, 0.08148193359375, 0.1200408935546875, 0.158599853515625, 0.1971588134765625, 0.2357177734375, 0.2742767333984375, 0.312835693359375, 0.3513946533203125, 0.38995361328125, 0.4285125732421875, 0.467071533203125, 0.5056304931640625, 0.544189453125, 0.5827484130859375, 0.621307373046875, 0.6598663330078125, 0.69842529296875, 0.7369842529296875, 0.775543212890625, 0.8141021728515625, 0.8526611328125, 0.8912200927734375, 0.929779052734375, 0.9683380126953125, 1.00689697265625, 1.0454559326171875, 1.084014892578125, 1.1225738525390625, 1.1611328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 14.0, 12.0, 11.0, 15.0, 19.0, 35.0, 36.0, 26.0, 39.0, 42.0, 48.0, 44.0, 66.0, 49.0, 57.0, 52.0, 52.0, 49.0, 48.0, 43.0, 31.0, 39.0, 33.0, 24.0, 13.0, 18.0, 18.0, 4.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1435546875, -1.1057281494140625, -1.067901611328125, -1.0300750732421875, -0.99224853515625, -0.9544219970703125, -0.916595458984375, -0.8787689208984375, -0.8409423828125, -0.8031158447265625, -0.765289306640625, -0.7274627685546875, -0.68963623046875, -0.6518096923828125, -0.613983154296875, -0.5761566162109375, -0.538330078125, -0.5005035400390625, -0.462677001953125, -0.4248504638671875, -0.38702392578125, -0.3491973876953125, -0.311370849609375, -0.2735443115234375, -0.2357177734375, -0.1978912353515625, -0.160064697265625, -0.1222381591796875, -0.08441162109375, -0.0465850830078125, -0.008758544921875, 0.0290679931640625, 0.06689453125, 0.1047210693359375, 0.142547607421875, 0.1803741455078125, 0.21820068359375, 0.2560272216796875, 0.293853759765625, 0.3316802978515625, 0.3695068359375, 0.4073333740234375, 0.445159912109375, 0.4829864501953125, 0.52081298828125, 0.5586395263671875, 0.596466064453125, 0.6342926025390625, 0.672119140625, 0.7099456787109375, 0.747772216796875, 0.7855987548828125, 0.82342529296875, 0.8612518310546875, 0.899078369140625, 0.9369049072265625, 0.9747314453125, 1.0125579833984375, 1.050384521484375, 1.0882110595703125, 1.12603759765625, 1.1638641357421875, 1.201690673828125, 1.2395172119140625, 1.27734375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 6.0, 11.0, 7.0, 13.0, 18.0, 17.0, 35.0, 62.0, 91.0, 139.0, 204.0, 371.0, 648.0, 1412.0, 3755.0, 13162.0, 61029.0, 454690.0, 434486.0, 59021.0, 12691.0, 3700.0, 1372.0, 683.0, 350.0, 192.0, 132.0, 69.0, 56.0, 39.0, 23.0, 19.0, 11.0, 14.0, 10.0, 4.0, 3.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.322265625, -0.3115196228027344, -0.30077362060546875, -0.2900276184082031, -0.2792816162109375, -0.2685356140136719, -0.25778961181640625, -0.24704360961914062, -0.236297607421875, -0.22555160522460938, -0.21480560302734375, -0.20405960083007812, -0.1933135986328125, -0.18256759643554688, -0.17182159423828125, -0.16107559204101562, -0.15032958984375, -0.13958358764648438, -0.12883758544921875, -0.11809158325195312, -0.1073455810546875, -0.09659957885742188, -0.08585357666015625, -0.07510757446289062, -0.064361572265625, -0.053615570068359375, -0.04286956787109375, -0.032123565673828125, -0.0213775634765625, -0.010631561279296875, 0.00011444091796875, 0.010860443115234375, 0.0216064453125, 0.032352447509765625, 0.04309844970703125, 0.053844451904296875, 0.0645904541015625, 0.07533645629882812, 0.08608245849609375, 0.09682846069335938, 0.107574462890625, 0.11832046508789062, 0.12906646728515625, 0.13981246948242188, 0.1505584716796875, 0.16130447387695312, 0.17205047607421875, 0.18279647827148438, 0.19354248046875, 0.20428848266601562, 0.21503448486328125, 0.22578048706054688, 0.2365264892578125, 0.24727249145507812, 0.25801849365234375, 0.2687644958496094, 0.279510498046875, 0.2902565002441406, 0.30100250244140625, 0.3117485046386719, 0.3224945068359375, 0.3332405090332031, 0.34398651123046875, 0.3547325134277344, 0.365478515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 5.0, 6.0, 15.0, 25.0, 33.0, 39.0, 64.0, 65.0, 148.0, 186.0, 128.0, 86.0, 69.0, 29.0, 22.0, 17.0, 18.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410743713378906e-05, -4.214141517877579e-05, -4.017539322376251e-05, -3.820937126874924e-05, -3.624334931373596e-05, -3.427732735872269e-05, -3.231130540370941e-05, -3.0345283448696136e-05, -2.837926149368286e-05, -2.6413239538669586e-05, -2.444721758365631e-05, -2.2481195628643036e-05, -2.051517367362976e-05, -1.8549151718616486e-05, -1.658312976360321e-05, -1.4617107808589935e-05, -1.265108585357666e-05, -1.0685063898563385e-05, -8.71904194355011e-06, -6.753019988536835e-06, -4.7869980335235596e-06, -2.8209760785102844e-06, -8.549541234970093e-07, 1.1110678315162659e-06, 3.077089786529541e-06, 5.043111741542816e-06, 7.009133696556091e-06, 8.975155651569366e-06, 1.0941177606582642e-05, 1.2907199561595917e-05, 1.4873221516609192e-05, 1.6839243471622467e-05, 1.8805265426635742e-05, 2.0771287381649017e-05, 2.2737309336662292e-05, 2.4703331291675568e-05, 2.6669353246688843e-05, 2.8635375201702118e-05, 3.060139715671539e-05, 3.256741911172867e-05, 3.453344106674194e-05, 3.649946302175522e-05, 3.8465484976768494e-05, 4.043150693178177e-05, 4.2397528886795044e-05, 4.436355084180832e-05, 4.6329572796821594e-05, 4.829559475183487e-05, 5.0261616706848145e-05, 5.222763866186142e-05, 5.4193660616874695e-05, 5.615968257188797e-05, 5.8125704526901245e-05, 6.009172648191452e-05, 6.20577484369278e-05, 6.402377039194107e-05, 6.598979234695435e-05, 6.795581430196762e-05, 6.99218362569809e-05, 7.188785821199417e-05, 7.385388016700745e-05, 7.581990212202072e-05, 7.7785924077034e-05, 7.975194603204727e-05, 8.171796798706055e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 3.0, 9.0, 9.0, 21.0, 18.0, 41.0, 57.0, 77.0, 131.0, 229.0, 373.0, 786.0, 1927.0, 6363.0, 31564.0, 222504.0, 681364.0, 83462.0, 13804.0, 3357.0, 1122.0, 553.0, 298.0, 161.0, 117.0, 58.0, 45.0, 41.0, 19.0, 11.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3349609375, -0.3226737976074219, -0.31038665771484375, -0.2980995178222656, -0.2858123779296875, -0.2735252380371094, -0.26123809814453125, -0.24895095825195312, -0.236663818359375, -0.22437667846679688, -0.21208953857421875, -0.19980239868164062, -0.1875152587890625, -0.17522811889648438, -0.16294097900390625, -0.15065383911132812, -0.13836669921875, -0.12607955932617188, -0.11379241943359375, -0.10150527954101562, -0.0892181396484375, -0.07693099975585938, -0.06464385986328125, -0.052356719970703125, -0.040069580078125, -0.027782440185546875, -0.01549530029296875, -0.003208160400390625, 0.0090789794921875, 0.021366119384765625, 0.03365325927734375, 0.045940399169921875, 0.0582275390625, 0.07051467895507812, 0.08280181884765625, 0.09508895874023438, 0.1073760986328125, 0.11966323852539062, 0.13195037841796875, 0.14423751831054688, 0.156524658203125, 0.16881179809570312, 0.18109893798828125, 0.19338607788085938, 0.2056732177734375, 0.21796035766601562, 0.23024749755859375, 0.24253463745117188, 0.25482177734375, 0.2671089172363281, 0.27939605712890625, 0.2916831970214844, 0.3039703369140625, 0.3162574768066406, 0.32854461669921875, 0.3408317565917969, 0.353118896484375, 0.3654060363769531, 0.37769317626953125, 0.3899803161621094, 0.4022674560546875, 0.4145545959472656, 0.42684173583984375, 0.4391288757324219, 0.451416015625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 4.0, 14.0, 10.0, 14.0, 19.0, 19.0, 24.0, 27.0, 39.0, 25.0, 57.0, 74.0, 70.0, 104.0, 92.0, 72.0, 66.0, 45.0, 25.0, 28.0, 19.0, 20.0, 10.0, 11.0, 21.0, 6.0, 11.0, 13.0, 3.0, 9.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.2467041015625, -0.2401103973388672, -0.23351669311523438, -0.22692298889160156, -0.22032928466796875, -0.21373558044433594, -0.20714187622070312, -0.2005481719970703, -0.1939544677734375, -0.1873607635498047, -0.18076705932617188, -0.17417335510253906, -0.16757965087890625, -0.16098594665527344, -0.15439224243164062, -0.1477985382080078, -0.141204833984375, -0.1346111297607422, -0.12801742553710938, -0.12142372131347656, -0.11483001708984375, -0.10823631286621094, -0.10164260864257812, -0.09504890441894531, -0.0884552001953125, -0.08186149597167969, -0.07526779174804688, -0.06867408752441406, -0.06208038330078125, -0.05548667907714844, -0.048892974853515625, -0.04229927062988281, -0.03570556640625, -0.029111862182617188, -0.022518157958984375, -0.015924453735351562, -0.00933074951171875, -0.0027370452880859375, 0.003856658935546875, 0.010450363159179688, 0.0170440673828125, 0.023637771606445312, 0.030231475830078125, 0.03682518005371094, 0.04341888427734375, 0.05001258850097656, 0.056606292724609375, 0.06319999694824219, 0.069793701171875, 0.07638740539550781, 0.08298110961914062, 0.08957481384277344, 0.09616851806640625, 0.10276222229003906, 0.10935592651367188, 0.11594963073730469, 0.1225433349609375, 0.1291370391845703, 0.13573074340820312, 0.14232444763183594, 0.14891815185546875, 0.15551185607910156, 0.16210556030273438, 0.1686992645263672, 0.17529296875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 6.0, 14.0, 22.0, 42.0, 86.0, 144.0, 181.0, 184.0, 144.0, 92.0, 42.0, 14.0, 11.0, 7.0, 2.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.291058540344238, -11.034364700317383, -10.777670860290527, -10.520977020263672, -10.264284133911133, -10.007590293884277, -9.750896453857422, -9.494202613830566, -9.237508773803711, -8.980814933776855, -8.72412109375, -8.467427253723145, -8.210733413696289, -7.954040050506592, -7.6973466873168945, -7.440652847290039, -7.183959007263184, -6.927265167236328, -6.670571327209473, -6.413877964019775, -6.15718412399292, -5.9004902839660645, -5.643796920776367, -5.387103080749512, -5.130409240722656, -4.873715400695801, -4.617021560668945, -4.360328197479248, -4.103634357452393, -3.846940517425537, -3.5902469158172607, -3.3335533142089844, -3.076859951019287, -2.8201661109924316, -2.5634725093841553, -2.306778907775879, -2.0500850677490234, -1.7933913469314575, -1.5366976261138916, -1.2800039052963257, -1.0233101844787598, -0.7666164636611938, -0.5099227428436279, -0.253229022026062, 0.0034646987915039062, 0.2601584196090698, 0.5168521404266357, 0.7735458612442017, 1.0302395820617676, 1.2869333028793335, 1.5436270236968994, 1.8003207445144653, 2.0570144653320312, 2.3137083053588867, 2.570401906967163, 2.8270955085754395, 3.083789348602295, 3.3404831886291504, 3.5971767902374268, 3.853870391845703, 4.110564231872559, 4.367258071899414, 4.6239519119262695, 4.880645275115967, 5.137339115142822]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 3.0, 6.0, 8.0, 24.0, 20.0, 22.0, 26.0, 28.0, 32.0, 37.0, 30.0, 33.0, 42.0, 43.0, 50.0, 64.0, 48.0, 42.0, 49.0, 39.0, 55.0, 37.0, 38.0, 36.0, 27.0, 26.0, 20.0, 25.0, 17.0, 15.0, 8.0, 9.0, 8.0, 0.0, 5.0, 5.0, 6.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.1715803146362305, -5.996542453765869, -5.821504592895508, -5.6464667320251465, -5.471428871154785, -5.296391010284424, -5.1213531494140625, -4.946315288543701, -4.77127742767334, -4.5962395668029785, -4.421201705932617, -4.246163845062256, -4.0711259841918945, -3.896088123321533, -3.721050262451172, -3.5460124015808105, -3.370974540710449, -3.195936679840088, -3.0208988189697266, -2.8458609580993652, -2.670823097229004, -2.4957852363586426, -2.3207473754882812, -2.14570951461792, -1.9706716537475586, -1.7956337928771973, -1.620595932006836, -1.4455580711364746, -1.2705202102661133, -1.095482349395752, -0.9204444885253906, -0.7454066276550293, -0.5703682899475098, -0.39533042907714844, -0.2202925682067871, -0.04525470733642578, 0.12978315353393555, 0.3048210144042969, 0.4798588752746582, 0.6548967361450195, 0.8299345970153809, 1.0049724578857422, 1.1800103187561035, 1.3550481796264648, 1.5300860404968262, 1.7051239013671875, 1.8801617622375488, 2.05519962310791, 2.2302374839782715, 2.405275344848633, 2.580313205718994, 2.7553510665893555, 2.930388927459717, 3.105426788330078, 3.2804646492004395, 3.455502510070801, 3.630540370941162, 3.8055782318115234, 3.9806160926818848, 4.155653953552246, 4.330691814422607, 4.505729675292969, 4.68076753616333, 4.855805397033691, 5.030843257904053]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 9.0, 13.0, 18.0, 23.0, 30.0, 42.0, 73.0, 82.0, 137.0, 190.0, 314.0, 575.0, 1200.0, 3053.0, 9936.0, 53805.0, 3835900.0, 258787.0, 21382.0, 5236.0, 1813.0, 736.0, 332.0, 182.0, 140.0, 81.0, 47.0, 36.0, 24.0, 19.0, 12.0, 9.0, 10.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6875, -1.638946533203125, -1.59039306640625, -1.541839599609375, -1.4932861328125, -1.444732666015625, -1.39617919921875, -1.347625732421875, -1.299072265625, -1.250518798828125, -1.20196533203125, -1.153411865234375, -1.1048583984375, -1.056304931640625, -1.00775146484375, -0.959197998046875, -0.91064453125, -0.862091064453125, -0.81353759765625, -0.764984130859375, -0.7164306640625, -0.667877197265625, -0.61932373046875, -0.570770263671875, -0.522216796875, -0.473663330078125, -0.42510986328125, -0.376556396484375, -0.3280029296875, -0.279449462890625, -0.23089599609375, -0.182342529296875, -0.1337890625, -0.085235595703125, -0.03668212890625, 0.011871337890625, 0.0604248046875, 0.108978271484375, 0.15753173828125, 0.206085205078125, 0.254638671875, 0.303192138671875, 0.35174560546875, 0.400299072265625, 0.4488525390625, 0.497406005859375, 0.54595947265625, 0.594512939453125, 0.64306640625, 0.691619873046875, 0.74017333984375, 0.788726806640625, 0.8372802734375, 0.885833740234375, 0.93438720703125, 0.982940673828125, 1.031494140625, 1.080047607421875, 1.12860107421875, 1.177154541015625, 1.2257080078125, 1.274261474609375, 1.32281494140625, 1.371368408203125, 1.419921875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 8.0, 5.0, 19.0, 25.0, 52.0, 72.0, 79.0, 117.0, 124.0, 111.0, 117.0, 100.0, 65.0, 37.0, 33.0, 19.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.740234375, -0.7212409973144531, -0.7022476196289062, -0.6832542419433594, -0.6642608642578125, -0.6452674865722656, -0.6262741088867188, -0.6072807312011719, -0.588287353515625, -0.5692939758300781, -0.5503005981445312, -0.5313072204589844, -0.5123138427734375, -0.4933204650878906, -0.47432708740234375, -0.4553337097167969, -0.43634033203125, -0.4173469543457031, -0.39835357666015625, -0.3793601989746094, -0.3603668212890625, -0.3413734436035156, -0.32238006591796875, -0.3033866882324219, -0.284393310546875, -0.2653999328613281, -0.24640655517578125, -0.22741317749023438, -0.2084197998046875, -0.18942642211914062, -0.17043304443359375, -0.15143966674804688, -0.1324462890625, -0.11345291137695312, -0.09445953369140625, -0.07546615600585938, -0.0564727783203125, -0.037479400634765625, -0.01848602294921875, 0.000507354736328125, 0.019500732421875, 0.038494110107421875, 0.05748748779296875, 0.07648086547851562, 0.0954742431640625, 0.11446762084960938, 0.13346099853515625, 0.15245437622070312, 0.17144775390625, 0.19044113159179688, 0.20943450927734375, 0.22842788696289062, 0.2474212646484375, 0.2664146423339844, 0.28540802001953125, 0.3044013977050781, 0.323394775390625, 0.3423881530761719, 0.36138153076171875, 0.3803749084472656, 0.3993682861328125, 0.4183616638183594, 0.43735504150390625, 0.4563484191894531, 0.475341796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 15.0, 22.0, 49.0, 54.0, 111.0, 137.0, 244.0, 347.0, 651.0, 1177.0, 2311.0, 5463.0, 17491.0, 110196.0, 3784559.0, 233320.0, 25342.0, 6928.0, 2728.0, 1299.0, 707.0, 436.0, 283.0, 162.0, 83.0, 51.0, 45.0, 25.0, 12.0, 11.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4677734375, -1.427703857421875, -1.38763427734375, -1.347564697265625, -1.3074951171875, -1.267425537109375, -1.22735595703125, -1.187286376953125, -1.147216796875, -1.107147216796875, -1.06707763671875, -1.027008056640625, -0.9869384765625, -0.946868896484375, -0.90679931640625, -0.866729736328125, -0.82666015625, -0.786590576171875, -0.74652099609375, -0.706451416015625, -0.6663818359375, -0.626312255859375, -0.58624267578125, -0.546173095703125, -0.506103515625, -0.466033935546875, -0.42596435546875, -0.385894775390625, -0.3458251953125, -0.305755615234375, -0.26568603515625, -0.225616455078125, -0.185546875, -0.145477294921875, -0.10540771484375, -0.065338134765625, -0.0252685546875, 0.014801025390625, 0.05487060546875, 0.094940185546875, 0.135009765625, 0.175079345703125, 0.21514892578125, 0.255218505859375, 0.2952880859375, 0.335357666015625, 0.37542724609375, 0.415496826171875, 0.45556640625, 0.495635986328125, 0.53570556640625, 0.575775146484375, 0.6158447265625, 0.655914306640625, 0.69598388671875, 0.736053466796875, 0.776123046875, 0.816192626953125, 0.85626220703125, 0.896331787109375, 0.9364013671875, 0.976470947265625, 1.01654052734375, 1.056610107421875, 1.0966796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 6.0, 11.0, 14.0, 17.0, 25.0, 38.0, 60.0, 93.0, 257.0, 1374.0, 1651.0, 275.0, 103.0, 45.0, 37.0, 18.0, 13.0, 4.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.63623046875, -0.6185684204101562, -0.6009063720703125, -0.5832443237304688, -0.565582275390625, -0.5479202270507812, -0.5302581787109375, -0.5125961303710938, -0.49493408203125, -0.47727203369140625, -0.4596099853515625, -0.44194793701171875, -0.424285888671875, -0.40662384033203125, -0.3889617919921875, -0.37129974365234375, -0.3536376953125, -0.33597564697265625, -0.3183135986328125, -0.30065155029296875, -0.282989501953125, -0.26532745361328125, -0.2476654052734375, -0.23000335693359375, -0.21234130859375, -0.19467926025390625, -0.1770172119140625, -0.15935516357421875, -0.141693115234375, -0.12403106689453125, -0.1063690185546875, -0.08870697021484375, -0.071044921875, -0.05338287353515625, -0.0357208251953125, -0.01805877685546875, -0.000396728515625, 0.01726531982421875, 0.0349273681640625, 0.05258941650390625, 0.07025146484375, 0.08791351318359375, 0.1055755615234375, 0.12323760986328125, 0.140899658203125, 0.15856170654296875, 0.1762237548828125, 0.19388580322265625, 0.2115478515625, 0.22920989990234375, 0.2468719482421875, 0.26453399658203125, 0.282196044921875, 0.29985809326171875, 0.3175201416015625, 0.33518218994140625, 0.35284423828125, 0.37050628662109375, 0.3881683349609375, 0.40583038330078125, 0.423492431640625, 0.44115447998046875, 0.4588165283203125, 0.47647857666015625, 0.494140625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 12.0, 23.0, 40.0, 108.0, 276.0, 288.0, 149.0, 72.0, 23.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.058573246002197, -6.915614604949951, -6.772655487060547, -6.629696846008301, -6.486738204956055, -6.34377908706665, -6.200820446014404, -6.057861328125, -5.914902687072754, -5.771944046020508, -5.6289849281311035, -5.486026287078857, -5.343067169189453, -5.200108528137207, -5.057149887084961, -4.914191246032715, -4.7712321281433105, -4.6282734870910645, -4.48531436920166, -4.342355728149414, -4.199397087097168, -4.056437969207764, -3.9134793281555176, -3.7705204486846924, -3.627561569213867, -3.484602689743042, -3.341643810272217, -3.1986851692199707, -3.0557262897491455, -2.9127674102783203, -2.769808769226074, -2.626849889755249, -2.483891248703003, -2.3409323692321777, -2.1979737281799316, -2.0550148487091064, -1.9120559692382812, -1.769097089767456, -1.6261383295059204, -1.4831795692443848, -1.3402206897735596, -1.1972618103027344, -1.0543030500411987, -0.9113442301750183, -0.7683854103088379, -0.6254265904426575, -0.48246777057647705, -0.3395090103149414, -0.1965501308441162, -0.05359131097793579, 0.08936750888824463, 0.23232632875442505, 0.37528514862060547, 0.5182439684867859, 0.6612027883529663, 0.804161548614502, 0.9471204280853271, 1.0900793075561523, 1.233038067817688, 1.3759968280792236, 1.5189557075500488, 1.661914587020874, 1.8048733472824097, 1.9478321075439453, 2.0907909870147705]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 6.0, 14.0, 8.0, 14.0, 14.0, 23.0, 16.0, 26.0, 25.0, 34.0, 34.0, 36.0, 43.0, 36.0, 41.0, 68.0, 52.0, 41.0, 49.0, 56.0, 56.0, 58.0, 39.0, 33.0, 28.0, 23.0, 19.0, 22.0, 16.0, 17.0, 16.0, 8.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3982491493225098, -1.3483798503875732, -1.2985105514526367, -1.2486412525177002, -1.1987719535827637, -1.1489026546478271, -1.0990333557128906, -1.0491641759872437, -0.9992948770523071, -0.9494255781173706, -0.8995562791824341, -0.8496869802474976, -0.7998177409172058, -0.7499484419822693, -0.7000791430473328, -0.650209903717041, -0.6003405451774597, -0.5504712462425232, -0.5006019473075867, -0.45073267817497253, -0.4008634090423584, -0.3509941101074219, -0.30112481117248535, -0.2512555420398712, -0.2013862431049347, -0.15151695907115936, -0.10164766758680344, -0.05177837610244751, -0.0019090920686721802, 0.04796019196510315, 0.09782949090003967, 0.1476987600326538, 0.19756805896759033, 0.24743734300136566, 0.297306627035141, 0.3471759259700775, 0.39704519510269165, 0.4469144940376282, 0.4967837929725647, 0.5466530323028564, 0.596522331237793, 0.6463916301727295, 0.696260929107666, 0.7461302280426025, 0.7959994673728943, 0.8458687663078308, 0.8957380652427673, 0.9456073045730591, 0.9954766631126404, 1.0453459024429321, 1.0952152013778687, 1.1450845003128052, 1.1949537992477417, 1.2448230981826782, 1.2946923971176147, 1.3445616960525513, 1.3944309949874878, 1.4443002939224243, 1.4941695928573608, 1.5440388917922974, 1.5939081907272339, 1.6437773704528809, 1.6936466693878174, 1.743515968322754, 1.7933852672576904]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 11.0, 15.0, 20.0, 45.0, 75.0, 117.0, 240.0, 507.0, 1144.0, 3872.0, 27657.0, 600783.0, 388863.0, 20176.0, 3101.0, 989.0, 427.0, 236.0, 119.0, 55.0, 45.0, 23.0, 11.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5546875, -2.479400634765625, -2.40411376953125, -2.328826904296875, -2.2535400390625, -2.178253173828125, -2.10296630859375, -2.027679443359375, -1.952392578125, -1.877105712890625, -1.80181884765625, -1.726531982421875, -1.6512451171875, -1.575958251953125, -1.50067138671875, -1.425384521484375, -1.35009765625, -1.274810791015625, -1.19952392578125, -1.124237060546875, -1.0489501953125, -0.973663330078125, -0.89837646484375, -0.823089599609375, -0.747802734375, -0.672515869140625, -0.59722900390625, -0.521942138671875, -0.4466552734375, -0.371368408203125, -0.29608154296875, -0.220794677734375, -0.1455078125, -0.070220947265625, 0.00506591796875, 0.080352783203125, 0.1556396484375, 0.230926513671875, 0.30621337890625, 0.381500244140625, 0.456787109375, 0.532073974609375, 0.60736083984375, 0.682647705078125, 0.7579345703125, 0.833221435546875, 0.90850830078125, 0.983795166015625, 1.05908203125, 1.134368896484375, 1.20965576171875, 1.284942626953125, 1.3602294921875, 1.435516357421875, 1.51080322265625, 1.586090087890625, 1.661376953125, 1.736663818359375, 1.81195068359375, 1.887237548828125, 1.9625244140625, 2.037811279296875, 2.11309814453125, 2.188385009765625, 2.263671875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 15.0, 29.0, 38.0, 65.0, 83.0, 117.0, 133.0, 115.0, 115.0, 114.0, 66.0, 32.0, 31.0, 25.0, 12.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.763671875, -0.7436447143554688, -0.7236175537109375, -0.7035903930664062, -0.683563232421875, -0.6635360717773438, -0.6435089111328125, -0.6234817504882812, -0.60345458984375, -0.5834274291992188, -0.5634002685546875, -0.5433731079101562, -0.523345947265625, -0.5033187866210938, -0.4832916259765625, -0.46326446533203125, -0.4432373046875, -0.42321014404296875, -0.4031829833984375, -0.38315582275390625, -0.363128662109375, -0.34310150146484375, -0.3230743408203125, -0.30304718017578125, -0.28302001953125, -0.26299285888671875, -0.2429656982421875, -0.22293853759765625, -0.202911376953125, -0.18288421630859375, -0.1628570556640625, -0.14282989501953125, -0.122802734375, -0.10277557373046875, -0.0827484130859375, -0.06272125244140625, -0.042694091796875, -0.02266693115234375, -0.0026397705078125, 0.01738739013671875, 0.03741455078125, 0.05744171142578125, 0.0774688720703125, 0.09749603271484375, 0.117523193359375, 0.13755035400390625, 0.1575775146484375, 0.17760467529296875, 0.1976318359375, 0.21765899658203125, 0.2376861572265625, 0.25771331787109375, 0.277740478515625, 0.29776763916015625, 0.3177947998046875, 0.33782196044921875, 0.35784912109375, 0.37787628173828125, 0.3979034423828125, 0.41793060302734375, 0.437957763671875, 0.45798492431640625, 0.4780120849609375, 0.49803924560546875, 0.51806640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 5.0, 12.0, 12.0, 13.0, 17.0, 21.0, 32.0, 41.0, 59.0, 99.0, 120.0, 243.0, 397.0, 708.0, 1458.0, 3166.0, 7711.0, 20628.0, 63370.0, 243724.0, 508932.0, 134925.0, 39370.0, 13555.0, 5229.0, 2214.0, 1039.0, 545.0, 311.0, 208.0, 118.0, 74.0, 52.0, 41.0, 29.0, 23.0, 19.0, 11.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85498046875, -0.8276596069335938, -0.8003387451171875, -0.7730178833007812, -0.745697021484375, -0.7183761596679688, -0.6910552978515625, -0.6637344360351562, -0.63641357421875, -0.6090927124023438, -0.5817718505859375, -0.5544509887695312, -0.527130126953125, -0.49980926513671875, -0.4724884033203125, -0.44516754150390625, -0.4178466796875, -0.39052581787109375, -0.3632049560546875, -0.33588409423828125, -0.308563232421875, -0.28124237060546875, -0.2539215087890625, -0.22660064697265625, -0.19927978515625, -0.17195892333984375, -0.1446380615234375, -0.11731719970703125, -0.089996337890625, -0.06267547607421875, -0.0353546142578125, -0.00803375244140625, 0.019287109375, 0.04660797119140625, 0.0739288330078125, 0.10124969482421875, 0.128570556640625, 0.15589141845703125, 0.1832122802734375, 0.21053314208984375, 0.23785400390625, 0.26517486572265625, 0.2924957275390625, 0.31981658935546875, 0.347137451171875, 0.37445831298828125, 0.4017791748046875, 0.42910003662109375, 0.4564208984375, 0.48374176025390625, 0.5110626220703125, 0.5383834838867188, 0.565704345703125, 0.5930252075195312, 0.6203460693359375, 0.6476669311523438, 0.67498779296875, 0.7023086547851562, 0.7296295166015625, 0.7569503784179688, 0.784271240234375, 0.8115921020507812, 0.8389129638671875, 0.8662338256835938, 0.8935546875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 14.0, 16.0, 19.0, 23.0, 20.0, 24.0, 34.0, 23.0, 26.0, 33.0, 39.0, 43.0, 39.0, 46.0, 44.0, 47.0, 41.0, 38.0, 48.0, 31.0, 39.0, 40.0, 31.0, 38.0, 31.0, 33.0, 19.0, 18.0, 20.0, 15.0, 15.0, 6.0, 10.0, 6.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0400390625, -1.006988525390625, -0.97393798828125, -0.940887451171875, -0.9078369140625, -0.874786376953125, -0.84173583984375, -0.808685302734375, -0.775634765625, -0.742584228515625, -0.70953369140625, -0.676483154296875, -0.6434326171875, -0.610382080078125, -0.57733154296875, -0.544281005859375, -0.51123046875, -0.478179931640625, -0.44512939453125, -0.412078857421875, -0.3790283203125, -0.345977783203125, -0.31292724609375, -0.279876708984375, -0.246826171875, -0.213775634765625, -0.18072509765625, -0.147674560546875, -0.1146240234375, -0.081573486328125, -0.04852294921875, -0.015472412109375, 0.017578125, 0.050628662109375, 0.08367919921875, 0.116729736328125, 0.1497802734375, 0.182830810546875, 0.21588134765625, 0.248931884765625, 0.281982421875, 0.315032958984375, 0.34808349609375, 0.381134033203125, 0.4141845703125, 0.447235107421875, 0.48028564453125, 0.513336181640625, 0.54638671875, 0.579437255859375, 0.61248779296875, 0.645538330078125, 0.6785888671875, 0.711639404296875, 0.74468994140625, 0.777740478515625, 0.810791015625, 0.843841552734375, 0.87689208984375, 0.909942626953125, 0.9429931640625, 0.976043701171875, 1.00909423828125, 1.042144775390625, 1.0751953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 9.0, 4.0, 16.0, 19.0, 29.0, 35.0, 47.0, 68.0, 131.0, 226.0, 338.0, 668.0, 1465.0, 3702.0, 11862.0, 57420.0, 338286.0, 514963.0, 92457.0, 18276.0, 4823.0, 1778.0, 813.0, 421.0, 234.0, 159.0, 97.0, 62.0, 39.0, 22.0, 20.0, 10.0, 18.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.308837890625, -0.2992286682128906, -0.28961944580078125, -0.2800102233886719, -0.2704010009765625, -0.2607917785644531, -0.25118255615234375, -0.24157333374023438, -0.231964111328125, -0.22235488891601562, -0.21274566650390625, -0.20313644409179688, -0.1935272216796875, -0.18391799926757812, -0.17430877685546875, -0.16469955444335938, -0.15509033203125, -0.14548110961914062, -0.13587188720703125, -0.12626266479492188, -0.1166534423828125, -0.10704421997070312, -0.09743499755859375, -0.08782577514648438, -0.078216552734375, -0.06860733032226562, -0.05899810791015625, -0.049388885498046875, -0.0397796630859375, -0.030170440673828125, -0.02056121826171875, -0.010951995849609375, -0.0013427734375, 0.008266448974609375, 0.01787567138671875, 0.027484893798828125, 0.0370941162109375, 0.046703338623046875, 0.05631256103515625, 0.06592178344726562, 0.075531005859375, 0.08514022827148438, 0.09474945068359375, 0.10435867309570312, 0.1139678955078125, 0.12357711791992188, 0.13318634033203125, 0.14279556274414062, 0.15240478515625, 0.16201400756835938, 0.17162322998046875, 0.18123245239257812, 0.1908416748046875, 0.20045089721679688, 0.21006011962890625, 0.21966934204101562, 0.229278564453125, 0.23888778686523438, 0.24849700927734375, 0.2581062316894531, 0.2677154541015625, 0.2773246765136719, 0.28693389892578125, 0.2965431213378906, 0.30615234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 3.0, 1.0, 3.0, 5.0, 11.0, 12.0, 25.0, 27.0, 42.0, 68.0, 108.0, 145.0, 173.0, 133.0, 82.0, 55.0, 31.0, 29.0, 13.0, 6.0, 9.0, 9.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40614128112793e-05, -5.201064050197601e-05, -4.995986819267273e-05, -4.7909095883369446e-05, -4.585832357406616e-05, -4.380755126476288e-05, -4.1756778955459595e-05, -3.970600664615631e-05, -3.765523433685303e-05, -3.5604462027549744e-05, -3.355368971824646e-05, -3.1502917408943176e-05, -2.9452145099639893e-05, -2.740137279033661e-05, -2.5350600481033325e-05, -2.329982817173004e-05, -2.1249055862426758e-05, -1.9198283553123474e-05, -1.714751124382019e-05, -1.5096738934516907e-05, -1.3045966625213623e-05, -1.099519431591034e-05, -8.944422006607056e-06, -6.893649697303772e-06, -4.842877388000488e-06, -2.7921050786972046e-06, -7.413327693939209e-07, 1.3094395399093628e-06, 3.3602118492126465e-06, 5.41098415851593e-06, 7.461756467819214e-06, 9.512528777122498e-06, 1.1563301086425781e-05, 1.3614073395729065e-05, 1.566484570503235e-05, 1.7715618014335632e-05, 1.9766390323638916e-05, 2.18171626329422e-05, 2.3867934942245483e-05, 2.5918707251548767e-05, 2.796947956085205e-05, 3.0020251870155334e-05, 3.207102417945862e-05, 3.41217964887619e-05, 3.6172568798065186e-05, 3.822334110736847e-05, 4.027411341667175e-05, 4.232488572597504e-05, 4.437565803527832e-05, 4.6426430344581604e-05, 4.847720265388489e-05, 5.052797496318817e-05, 5.2578747272491455e-05, 5.462951958179474e-05, 5.668029189109802e-05, 5.8731064200401306e-05, 6.078183650970459e-05, 6.283260881900787e-05, 6.488338112831116e-05, 6.693415343761444e-05, 6.898492574691772e-05, 7.103569805622101e-05, 7.308647036552429e-05, 7.513724267482758e-05, 7.718801498413086e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 15.0, 10.0, 29.0, 46.0, 73.0, 136.0, 242.0, 451.0, 925.0, 2320.0, 7588.0, 40839.0, 414989.0, 518022.0, 49594.0, 8636.0, 2502.0, 1050.0, 546.0, 217.0, 119.0, 52.0, 60.0, 27.0, 14.0, 18.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.388916015625, -0.3759727478027344, -0.36302947998046875, -0.3500862121582031, -0.3371429443359375, -0.3241996765136719, -0.31125640869140625, -0.2983131408691406, -0.285369873046875, -0.2724266052246094, -0.25948333740234375, -0.24654006958007812, -0.2335968017578125, -0.22065353393554688, -0.20771026611328125, -0.19476699829101562, -0.18182373046875, -0.16888046264648438, -0.15593719482421875, -0.14299392700195312, -0.1300506591796875, -0.11710739135742188, -0.10416412353515625, -0.09122085571289062, -0.078277587890625, -0.06533432006835938, -0.05239105224609375, -0.039447784423828125, -0.0265045166015625, -0.013561248779296875, -0.00061798095703125, 0.012325286865234375, 0.0252685546875, 0.038211822509765625, 0.05115509033203125, 0.06409835815429688, 0.0770416259765625, 0.08998489379882812, 0.10292816162109375, 0.11587142944335938, 0.128814697265625, 0.14175796508789062, 0.15470123291015625, 0.16764450073242188, 0.1805877685546875, 0.19353103637695312, 0.20647430419921875, 0.21941757202148438, 0.23236083984375, 0.24530410766601562, 0.25824737548828125, 0.2711906433105469, 0.2841339111328125, 0.2970771789550781, 0.31002044677734375, 0.3229637145996094, 0.335906982421875, 0.3488502502441406, 0.36179351806640625, 0.3747367858886719, 0.3876800537109375, 0.4006233215332031, 0.41356658935546875, 0.4265098571777344, 0.439453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 16.0, 17.0, 25.0, 47.0, 46.0, 67.0, 93.0, 117.0, 145.0, 136.0, 74.0, 54.0, 43.0, 19.0, 25.0, 12.0, 12.0, 5.0, 12.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3330078125, -0.3211402893066406, -0.30927276611328125, -0.2974052429199219, -0.2855377197265625, -0.2736701965332031, -0.26180267333984375, -0.24993515014648438, -0.238067626953125, -0.22620010375976562, -0.21433258056640625, -0.20246505737304688, -0.1905975341796875, -0.17873001098632812, -0.16686248779296875, -0.15499496459960938, -0.14312744140625, -0.13125991821289062, -0.11939239501953125, -0.10752487182617188, -0.0956573486328125, -0.08378982543945312, -0.07192230224609375, -0.060054779052734375, -0.048187255859375, -0.036319732666015625, -0.02445220947265625, -0.012584686279296875, -0.0007171630859375, 0.011150360107421875, 0.02301788330078125, 0.034885406494140625, 0.0467529296875, 0.058620452880859375, 0.07048797607421875, 0.08235549926757812, 0.0942230224609375, 0.10609054565429688, 0.11795806884765625, 0.12982559204101562, 0.141693115234375, 0.15356063842773438, 0.16542816162109375, 0.17729568481445312, 0.1891632080078125, 0.20103073120117188, 0.21289825439453125, 0.22476577758789062, 0.23663330078125, 0.24850082397460938, 0.26036834716796875, 0.2722358703613281, 0.2841033935546875, 0.2959709167480469, 0.30783843994140625, 0.3197059631347656, 0.331573486328125, 0.3434410095214844, 0.35530853271484375, 0.3671760559082031, 0.3790435791015625, 0.3909111022949219, 0.40277862548828125, 0.4146461486816406, 0.426513671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 11.0, 31.0, 99.0, 370.0, 365.0, 111.0, 18.0, 8.0, 1.0], "bins": [-33.244346618652344, -32.679893493652344, -32.11543655395508, -31.550983428955078, -30.986528396606445, -30.422075271606445, -29.857620239257812, -29.29316520690918, -28.72871208190918, -28.164257049560547, -27.599803924560547, -27.035348892211914, -26.47089385986328, -25.90644073486328, -25.34198570251465, -24.777530670166016, -24.213077545166016, -23.648622512817383, -23.084169387817383, -22.51971435546875, -21.955259323120117, -21.390806198120117, -20.826351165771484, -20.26189613342285, -19.69744110107422, -19.132986068725586, -18.568532943725586, -18.004077911376953, -17.43962287902832, -16.87516975402832, -16.310714721679688, -15.746260643005371, -15.181805610656738, -14.617351531982422, -14.052896499633789, -13.488442420959473, -12.923988342285156, -12.359533309936523, -11.795079231262207, -11.23062515258789, -10.666170120239258, -10.101716041564941, -9.537261009216309, -8.972806930541992, -8.408352851867676, -7.843898296356201, -7.279443740844727, -6.71498966217041, -6.150535583496094, -5.586081027984619, -5.021626949310303, -4.457172393798828, -3.8927180767059326, -3.328263759613037, -2.7638092041015625, -2.199354887008667, -1.6349005699157715, -1.070446252822876, -0.5059918165206909, 0.05846261978149414, 0.6229169368743896, 1.1873712539672852, 1.7518258094787598, 2.3162801265716553, 2.880734443664551]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 9.0, 9.0, 16.0, 10.0, 14.0, 21.0, 16.0, 20.0, 18.0, 26.0, 17.0, 19.0, 31.0, 31.0, 29.0, 36.0, 30.0, 30.0, 37.0, 32.0, 48.0, 41.0, 34.0, 40.0, 30.0, 27.0, 23.0, 31.0, 25.0, 20.0, 25.0, 14.0, 31.0, 25.0, 21.0, 10.0, 16.0, 9.0, 13.0, 11.0, 9.0, 13.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.128796577453613, -4.004122734069824, -3.879448890686035, -3.754775285720825, -3.630101442337036, -3.505427598953247, -3.380753993988037, -3.256080150604248, -3.131406307220459, -3.00673246383667, -2.882058620452881, -2.757385015487671, -2.632711172103882, -2.5080373287200928, -2.383363723754883, -2.2586898803710938, -2.1340160369873047, -2.0093421936035156, -1.8846684694290161, -1.7599947452545166, -1.6353209018707275, -1.5106470584869385, -1.385973334312439, -1.2612996101379395, -1.1366257667541504, -1.0119519233703613, -0.8872781991958618, -0.7626044154167175, -0.6379306316375732, -0.513256847858429, -0.38858306407928467, -0.2639092803001404, -0.1392354965209961, -0.014561712741851807, 0.11011207103729248, 0.23478585481643677, 0.35945963859558105, 0.48413342237472534, 0.6088072061538696, 0.7334809899330139, 0.8581547737121582, 0.9828285574913025, 1.1075023412704468, 1.2321760654449463, 1.3568499088287354, 1.4815237522125244, 1.606197476387024, 1.7308712005615234, 1.8555450439453125, 1.9802188873291016, 2.1048927307128906, 2.2295663356781006, 2.3542401790618896, 2.4789140224456787, 2.6035876274108887, 2.7282614707946777, 2.852935314178467, 2.977609157562256, 3.102283000946045, 3.226956605911255, 3.351630449295044, 3.476304292678833, 3.600977897644043, 3.725651741027832, 3.850325584411621]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 3.0, 4.0, 9.0, 15.0, 26.0, 25.0, 36.0, 37.0, 73.0, 148.0, 193.0, 380.0, 653.0, 1481.0, 4150.0, 22786.0, 3771276.0, 371749.0, 15526.0, 3331.0, 1143.0, 498.0, 274.0, 174.0, 116.0, 52.0, 38.0, 21.0, 16.0, 10.0, 13.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.587890625, -3.49322509765625, -3.3985595703125, -3.30389404296875, -3.209228515625, -3.11456298828125, -3.0198974609375, -2.92523193359375, -2.83056640625, -2.73590087890625, -2.6412353515625, -2.54656982421875, -2.451904296875, -2.35723876953125, -2.2625732421875, -2.16790771484375, -2.0732421875, -1.97857666015625, -1.8839111328125, -1.78924560546875, -1.694580078125, -1.59991455078125, -1.5052490234375, -1.41058349609375, -1.31591796875, -1.22125244140625, -1.1265869140625, -1.03192138671875, -0.937255859375, -0.84259033203125, -0.7479248046875, -0.65325927734375, -0.55859375, -0.46392822265625, -0.3692626953125, -0.27459716796875, -0.179931640625, -0.08526611328125, 0.0093994140625, 0.10406494140625, 0.19873046875, 0.29339599609375, 0.3880615234375, 0.48272705078125, 0.577392578125, 0.67205810546875, 0.7667236328125, 0.86138916015625, 0.9560546875, 1.05072021484375, 1.1453857421875, 1.24005126953125, 1.334716796875, 1.42938232421875, 1.5240478515625, 1.61871337890625, 1.71337890625, 1.80804443359375, 1.9027099609375, 1.99737548828125, 2.092041015625, 2.18670654296875, 2.2813720703125, 2.37603759765625, 2.470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 11.0, 18.0, 34.0, 47.0, 63.0, 83.0, 115.0, 115.0, 118.0, 119.0, 85.0, 71.0, 44.0, 26.0, 29.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.74853515625, -0.7288436889648438, -0.7091522216796875, -0.6894607543945312, -0.669769287109375, -0.6500778198242188, -0.6303863525390625, -0.6106948852539062, -0.59100341796875, -0.5713119506835938, -0.5516204833984375, -0.5319290161132812, -0.512237548828125, -0.49254608154296875, -0.4728546142578125, -0.45316314697265625, -0.4334716796875, -0.41378021240234375, -0.3940887451171875, -0.37439727783203125, -0.354705810546875, -0.33501434326171875, -0.3153228759765625, -0.29563140869140625, -0.27593994140625, -0.25624847412109375, -0.2365570068359375, -0.21686553955078125, -0.197174072265625, -0.17748260498046875, -0.1577911376953125, -0.13809967041015625, -0.118408203125, -0.09871673583984375, -0.0790252685546875, -0.05933380126953125, -0.039642333984375, -0.01995086669921875, -0.0002593994140625, 0.01943206787109375, 0.03912353515625, 0.05881500244140625, 0.0785064697265625, 0.09819793701171875, 0.117889404296875, 0.13758087158203125, 0.1572723388671875, 0.17696380615234375, 0.1966552734375, 0.21634674072265625, 0.2360382080078125, 0.25572967529296875, 0.275421142578125, 0.29511260986328125, 0.3148040771484375, 0.33449554443359375, 0.35418701171875, 0.37387847900390625, 0.3935699462890625, 0.41326141357421875, 0.432952880859375, 0.45264434814453125, 0.4723358154296875, 0.49202728271484375, 0.51171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 2.0, 11.0, 9.0, 8.0, 25.0, 32.0, 63.0, 74.0, 132.0, 159.0, 287.0, 432.0, 667.0, 1213.0, 2277.0, 4877.0, 13961.0, 75425.0, 3820144.0, 236454.0, 24160.0, 6879.0, 2969.0, 1524.0, 941.0, 556.0, 352.0, 220.0, 147.0, 100.0, 70.0, 48.0, 20.0, 17.0, 10.0, 7.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.494140625, -1.436004638671875, -1.37786865234375, -1.319732666015625, -1.2615966796875, -1.203460693359375, -1.14532470703125, -1.087188720703125, -1.029052734375, -0.970916748046875, -0.91278076171875, -0.854644775390625, -0.7965087890625, -0.738372802734375, -0.68023681640625, -0.622100830078125, -0.56396484375, -0.505828857421875, -0.44769287109375, -0.389556884765625, -0.3314208984375, -0.273284912109375, -0.21514892578125, -0.157012939453125, -0.098876953125, -0.040740966796875, 0.01739501953125, 0.075531005859375, 0.1336669921875, 0.191802978515625, 0.24993896484375, 0.308074951171875, 0.3662109375, 0.424346923828125, 0.48248291015625, 0.540618896484375, 0.5987548828125, 0.656890869140625, 0.71502685546875, 0.773162841796875, 0.831298828125, 0.889434814453125, 0.94757080078125, 1.005706787109375, 1.0638427734375, 1.121978759765625, 1.18011474609375, 1.238250732421875, 1.29638671875, 1.354522705078125, 1.41265869140625, 1.470794677734375, 1.5289306640625, 1.587066650390625, 1.64520263671875, 1.703338623046875, 1.761474609375, 1.819610595703125, 1.87774658203125, 1.935882568359375, 1.9940185546875, 2.052154541015625, 2.11029052734375, 2.168426513671875, 2.2265625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 10.0, 21.0, 35.0, 65.0, 154.0, 856.0, 2527.0, 208.0, 80.0, 33.0, 16.0, 13.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7859573364257812, -0.7569732666015625, -0.7279891967773438, -0.699005126953125, -0.6700210571289062, -0.6410369873046875, -0.6120529174804688, -0.58306884765625, -0.5540847778320312, -0.5251007080078125, -0.49611663818359375, -0.467132568359375, -0.43814849853515625, -0.4091644287109375, -0.38018035888671875, -0.3511962890625, -0.32221221923828125, -0.2932281494140625, -0.26424407958984375, -0.235260009765625, -0.20627593994140625, -0.1772918701171875, -0.14830780029296875, -0.11932373046875, -0.09033966064453125, -0.0613555908203125, -0.03237152099609375, -0.003387451171875, 0.02559661865234375, 0.0545806884765625, 0.08356475830078125, 0.112548828125, 0.14153289794921875, 0.1705169677734375, 0.19950103759765625, 0.228485107421875, 0.25746917724609375, 0.2864532470703125, 0.31543731689453125, 0.34442138671875, 0.37340545654296875, 0.4023895263671875, 0.43137359619140625, 0.460357666015625, 0.48934173583984375, 0.5183258056640625, 0.5473098754882812, 0.5762939453125, 0.6052780151367188, 0.6342620849609375, 0.6632461547851562, 0.692230224609375, 0.7212142944335938, 0.7501983642578125, 0.7791824340820312, 0.80816650390625, 0.8371505737304688, 0.8661346435546875, 0.8951187133789062, 0.924102783203125, 0.9530868530273438, 0.9820709228515625, 1.0110549926757812, 1.0400390625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 12.0, 28.0, 153.0, 418.0, 266.0, 88.0, 25.0, 12.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.157349109649658, -6.897524356842041, -6.637700080871582, -6.377875328063965, -6.118050575256348, -5.858226299285889, -5.5984015464782715, -5.3385772705078125, -5.078752517700195, -4.818927764892578, -4.559103488922119, -4.299278736114502, -4.039454460144043, -3.779629707336426, -3.5198049545288086, -3.2599804401397705, -3.0001559257507324, -2.7403314113616943, -2.4805068969726562, -2.220682144165039, -1.960857629776001, -1.701033115386963, -1.4412084817886353, -1.1813838481903076, -0.9215593338012695, -0.6617347598075867, -0.4019101858139038, -0.14208561182022095, 0.11773896217346191, 0.3775634765625, 0.6373881101608276, 0.8972127437591553, 1.1570377349853516, 1.4168622493743896, 1.6766868829727173, 1.936511516571045, 2.196336030960083, 2.456160545349121, 2.7159852981567383, 2.9758098125457764, 3.2356343269348145, 3.4954588413238525, 3.7552833557128906, 4.015108108520508, 4.274932861328125, 4.534757137298584, 4.794581890106201, 5.05440616607666, 5.314230918884277, 5.5740556716918945, 5.8338799476623535, 6.093704700469971, 6.35352897644043, 6.613353729248047, 6.873178482055664, 7.133003234863281, 7.39282751083374, 7.652652263641357, 7.912476539611816, 8.172301292419434, 8.43212604522705, 8.691949844360352, 8.951774597167969, 9.211599349975586, 9.471424102783203]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 11.0, 9.0, 22.0, 19.0, 26.0, 20.0, 41.0, 41.0, 42.0, 46.0, 61.0, 59.0, 68.0, 63.0, 61.0, 63.0, 65.0, 44.0, 38.0, 44.0, 31.0, 19.0, 24.0, 21.0, 18.0, 12.0, 11.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2765440940856934, -2.196164608001709, -2.1157851219177246, -2.0354056358337402, -1.9550261497497559, -1.8746466636657715, -1.7942670583724976, -1.7138875722885132, -1.6335080862045288, -1.5531286001205444, -1.47274911403656, -1.3923696279525757, -1.3119900226593018, -1.2316105365753174, -1.151231050491333, -1.0708515644073486, -0.9904720783233643, -0.9100925922393799, -0.8297131061553955, -0.7493335604667664, -0.668954074382782, -0.5885745882987976, -0.5081950426101685, -0.4278155565261841, -0.3474360704421997, -0.26705658435821533, -0.18667706847190857, -0.106297567486763, -0.02591806650161743, 0.05446141958236694, 0.1348409354686737, 0.21522045135498047, 0.29559993743896484, 0.3759794235229492, 0.456358939409256, 0.5367384552955627, 0.6171179413795471, 0.6974974274635315, 0.7778769731521606, 0.858256459236145, 0.9386359453201294, 1.0190154314041138, 1.0993949174880981, 1.1797744035720825, 1.2601540088653564, 1.3405334949493408, 1.4209129810333252, 1.5012924671173096, 1.581671953201294, 1.6620514392852783, 1.7424309253692627, 1.822810411453247, 1.9031898975372314, 1.9835693836212158, 2.0639488697052, 2.1443285942077637, 2.224708080291748, 2.3050875663757324, 2.385467052459717, 2.465846538543701, 2.5462260246276855, 2.62660551071167, 2.7069849967956543, 2.7873644828796387, 2.867743968963623]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 5.0, 12.0, 16.0, 22.0, 24.0, 37.0, 51.0, 111.0, 163.0, 260.0, 496.0, 942.0, 2138.0, 6803.0, 34765.0, 358066.0, 573790.0, 56062.0, 9530.0, 2710.0, 1129.0, 596.0, 338.0, 182.0, 95.0, 72.0, 47.0, 23.0, 22.0, 12.0, 9.0, 6.0, 0.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.175628662109375, -2.09539794921875, -2.015167236328125, -1.9349365234375, -1.854705810546875, -1.77447509765625, -1.694244384765625, -1.614013671875, -1.533782958984375, -1.45355224609375, -1.373321533203125, -1.2930908203125, -1.212860107421875, -1.13262939453125, -1.052398681640625, -0.97216796875, -0.891937255859375, -0.81170654296875, -0.731475830078125, -0.6512451171875, -0.571014404296875, -0.49078369140625, -0.410552978515625, -0.330322265625, -0.250091552734375, -0.16986083984375, -0.089630126953125, -0.0093994140625, 0.070831298828125, 0.15106201171875, 0.231292724609375, 0.3115234375, 0.391754150390625, 0.47198486328125, 0.552215576171875, 0.6324462890625, 0.712677001953125, 0.79290771484375, 0.873138427734375, 0.953369140625, 1.033599853515625, 1.11383056640625, 1.194061279296875, 1.2742919921875, 1.354522705078125, 1.43475341796875, 1.514984130859375, 1.59521484375, 1.675445556640625, 1.75567626953125, 1.835906982421875, 1.9161376953125, 1.996368408203125, 2.07659912109375, 2.156829833984375, 2.237060546875, 2.317291259765625, 2.39752197265625, 2.477752685546875, 2.5579833984375, 2.638214111328125, 2.71844482421875, 2.798675537109375, 2.87890625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 11.0, 22.0, 33.0, 44.0, 62.0, 91.0, 109.0, 135.0, 131.0, 119.0, 95.0, 58.0, 27.0, 33.0, 15.0, 10.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.77099609375, -0.75006103515625, -0.7291259765625, -0.70819091796875, -0.687255859375, -0.66632080078125, -0.6453857421875, -0.62445068359375, -0.603515625, -0.58258056640625, -0.5616455078125, -0.54071044921875, -0.519775390625, -0.49884033203125, -0.4779052734375, -0.45697021484375, -0.43603515625, -0.41510009765625, -0.3941650390625, -0.37322998046875, -0.352294921875, -0.33135986328125, -0.3104248046875, -0.28948974609375, -0.2685546875, -0.24761962890625, -0.2266845703125, -0.20574951171875, -0.184814453125, -0.16387939453125, -0.1429443359375, -0.12200927734375, -0.10107421875, -0.08013916015625, -0.0592041015625, -0.03826904296875, -0.017333984375, 0.00360107421875, 0.0245361328125, 0.04547119140625, 0.06640625, 0.08734130859375, 0.1082763671875, 0.12921142578125, 0.150146484375, 0.17108154296875, 0.1920166015625, 0.21295166015625, 0.23388671875, 0.25482177734375, 0.2757568359375, 0.29669189453125, 0.317626953125, 0.33856201171875, 0.3594970703125, 0.38043212890625, 0.4013671875, 0.42230224609375, 0.4432373046875, 0.46417236328125, 0.485107421875, 0.50604248046875, 0.5269775390625, 0.54791259765625, 0.56884765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 3.0, 8.0, 4.0, 3.0, 2.0, 8.0, 15.0, 24.0, 38.0, 57.0, 106.0, 181.0, 357.0, 749.0, 2049.0, 8359.0, 73439.0, 804405.0, 141816.0, 12246.0, 2795.0, 996.0, 390.0, 203.0, 125.0, 58.0, 39.0, 30.0, 12.0, 13.0, 3.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.005859375, -2.91900634765625, -2.8321533203125, -2.74530029296875, -2.658447265625, -2.57159423828125, -2.4847412109375, -2.39788818359375, -2.31103515625, -2.22418212890625, -2.1373291015625, -2.05047607421875, -1.963623046875, -1.87677001953125, -1.7899169921875, -1.70306396484375, -1.6162109375, -1.52935791015625, -1.4425048828125, -1.35565185546875, -1.268798828125, -1.18194580078125, -1.0950927734375, -1.00823974609375, -0.92138671875, -0.83453369140625, -0.7476806640625, -0.66082763671875, -0.573974609375, -0.48712158203125, -0.4002685546875, -0.31341552734375, -0.2265625, -0.13970947265625, -0.0528564453125, 0.03399658203125, 0.120849609375, 0.20770263671875, 0.2945556640625, 0.38140869140625, 0.46826171875, 0.55511474609375, 0.6419677734375, 0.72882080078125, 0.815673828125, 0.90252685546875, 0.9893798828125, 1.07623291015625, 1.1630859375, 1.24993896484375, 1.3367919921875, 1.42364501953125, 1.510498046875, 1.59735107421875, 1.6842041015625, 1.77105712890625, 1.85791015625, 1.94476318359375, 2.0316162109375, 2.11846923828125, 2.205322265625, 2.29217529296875, 2.3790283203125, 2.46588134765625, 2.552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 12.0, 10.0, 15.0, 15.0, 24.0, 33.0, 47.0, 77.0, 83.0, 103.0, 89.0, 89.0, 78.0, 79.0, 68.0, 54.0, 36.0, 28.0, 20.0, 14.0, 9.0, 8.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.623626708984375, -2.54803466796875, -2.472442626953125, -2.3968505859375, -2.321258544921875, -2.24566650390625, -2.170074462890625, -2.094482421875, -2.018890380859375, -1.94329833984375, -1.867706298828125, -1.7921142578125, -1.716522216796875, -1.64093017578125, -1.565338134765625, -1.48974609375, -1.414154052734375, -1.33856201171875, -1.262969970703125, -1.1873779296875, -1.111785888671875, -1.03619384765625, -0.960601806640625, -0.885009765625, -0.809417724609375, -0.73382568359375, -0.658233642578125, -0.5826416015625, -0.507049560546875, -0.43145751953125, -0.355865478515625, -0.2802734375, -0.204681396484375, -0.12908935546875, -0.053497314453125, 0.0220947265625, 0.097686767578125, 0.17327880859375, 0.248870849609375, 0.324462890625, 0.400054931640625, 0.47564697265625, 0.551239013671875, 0.6268310546875, 0.702423095703125, 0.77801513671875, 0.853607177734375, 0.92919921875, 1.004791259765625, 1.08038330078125, 1.155975341796875, 1.2315673828125, 1.307159423828125, 1.38275146484375, 1.458343505859375, 1.533935546875, 1.609527587890625, 1.68511962890625, 1.760711669921875, 1.8363037109375, 1.911895751953125, 1.98748779296875, 2.063079833984375, 2.138671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 8.0, 5.0, 5.0, 12.0, 14.0, 15.0, 18.0, 27.0, 33.0, 46.0, 51.0, 72.0, 91.0, 125.0, 189.0, 266.0, 412.0, 679.0, 1304.0, 2881.0, 8186.0, 121741.0, 884617.0, 19060.0, 4280.0, 1861.0, 941.0, 487.0, 339.0, 191.0, 153.0, 110.0, 87.0, 46.0, 51.0, 37.0, 28.0, 27.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.794921875, -1.7374420166015625, -1.679962158203125, -1.6224822998046875, -1.56500244140625, -1.5075225830078125, -1.450042724609375, -1.3925628662109375, -1.3350830078125, -1.2776031494140625, -1.220123291015625, -1.1626434326171875, -1.10516357421875, -1.0476837158203125, -0.990203857421875, -0.9327239990234375, -0.875244140625, -0.8177642822265625, -0.760284423828125, -0.7028045654296875, -0.64532470703125, -0.5878448486328125, -0.530364990234375, -0.4728851318359375, -0.4154052734375, -0.3579254150390625, -0.300445556640625, -0.2429656982421875, -0.18548583984375, -0.1280059814453125, -0.070526123046875, -0.0130462646484375, 0.04443359375, 0.1019134521484375, 0.159393310546875, 0.2168731689453125, 0.27435302734375, 0.3318328857421875, 0.389312744140625, 0.4467926025390625, 0.5042724609375, 0.5617523193359375, 0.619232177734375, 0.6767120361328125, 0.73419189453125, 0.7916717529296875, 0.849151611328125, 0.9066314697265625, 0.964111328125, 1.0215911865234375, 1.079071044921875, 1.1365509033203125, 1.19403076171875, 1.2515106201171875, 1.308990478515625, 1.3664703369140625, 1.4239501953125, 1.4814300537109375, 1.538909912109375, 1.5963897705078125, 1.65386962890625, 1.7113494873046875, 1.768829345703125, 1.8263092041015625, 1.8837890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 11.0, 26.0, 137.0, 418.0, 308.0, 61.0, 20.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005035400390625, -0.0004930105060338974, -0.0004824809730052948, -0.0004719514399766922, -0.0004614219069480896, -0.000450892373919487, -0.0004403628408908844, -0.0004298333078622818, -0.0004193037748336792, -0.0004087742418050766, -0.000398244708776474, -0.0003877151757478714, -0.0003771856427192688, -0.0003666561096906662, -0.0003561265766620636, -0.000345597043633461, -0.0003350675106048584, -0.0003245379775762558, -0.0003140084445476532, -0.0003034789115190506, -0.000292949378490448, -0.0002824198454618454, -0.0002718903124332428, -0.0002613607794046402, -0.0002508312463760376, -0.000240301713347435, -0.0002297721803188324, -0.0002192426472902298, -0.0002087131142616272, -0.0001981835812330246, -0.000187654048204422, -0.0001771245151758194, -0.0001665949821472168, -0.0001560654491186142, -0.0001455359160900116, -0.000135006383061409, -0.0001244768500328064, -0.0001139473170042038, -0.0001034177839756012, -9.28882509469986e-05, -8.2358717918396e-05, -7.18291848897934e-05, -6.12996518611908e-05, -5.0770118832588196e-05, -4.0240585803985596e-05, -2.9711052775382996e-05, -1.9181519746780396e-05, -8.651986718177795e-06, 1.8775463104248047e-06, 1.2407079339027405e-05, 2.2936612367630005e-05, 3.3466145396232605e-05, 4.3995678424835205e-05, 5.4525211453437805e-05, 6.50547444820404e-05, 7.5584277510643e-05, 8.61138105392456e-05, 9.66433435678482e-05, 0.0001071728765964508, 0.0001177024096250534, 0.000128231942653656, 0.0001387614756822586, 0.0001492910087108612, 0.0001598205417394638, 0.0001703500747680664]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 8.0, 13.0, 18.0, 29.0, 50.0, 62.0, 139.0, 349.0, 1106.0, 13618.0, 1021613.0, 9906.0, 971.0, 329.0, 154.0, 61.0, 42.0, 28.0, 20.0, 12.0, 12.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.783416748046875, -3.67034912109375, -3.557281494140625, -3.4442138671875, -3.331146240234375, -3.21807861328125, -3.105010986328125, -2.991943359375, -2.878875732421875, -2.76580810546875, -2.652740478515625, -2.5396728515625, -2.426605224609375, -2.31353759765625, -2.200469970703125, -2.08740234375, -1.974334716796875, -1.86126708984375, -1.748199462890625, -1.6351318359375, -1.522064208984375, -1.40899658203125, -1.295928955078125, -1.182861328125, -1.069793701171875, -0.95672607421875, -0.843658447265625, -0.7305908203125, -0.617523193359375, -0.50445556640625, -0.391387939453125, -0.2783203125, -0.165252685546875, -0.05218505859375, 0.060882568359375, 0.1739501953125, 0.287017822265625, 0.40008544921875, 0.513153076171875, 0.626220703125, 0.739288330078125, 0.85235595703125, 0.965423583984375, 1.0784912109375, 1.191558837890625, 1.30462646484375, 1.417694091796875, 1.53076171875, 1.643829345703125, 1.75689697265625, 1.869964599609375, 1.9830322265625, 2.096099853515625, 2.20916748046875, 2.322235107421875, 2.435302734375, 2.548370361328125, 2.66143798828125, 2.774505615234375, 2.8875732421875, 3.000640869140625, 3.11370849609375, 3.226776123046875, 3.33984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 9.0, 36.0, 168.0, 554.0, 182.0, 31.0, 6.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.06048583984375, -1.9490966796875, -1.83770751953125, -1.726318359375, -1.61492919921875, -1.5035400390625, -1.39215087890625, -1.28076171875, -1.16937255859375, -1.0579833984375, -0.94659423828125, -0.835205078125, -0.72381591796875, -0.6124267578125, -0.50103759765625, -0.3896484375, -0.27825927734375, -0.1668701171875, -0.05548095703125, 0.055908203125, 0.16729736328125, 0.2786865234375, 0.39007568359375, 0.50146484375, 0.61285400390625, 0.7242431640625, 0.83563232421875, 0.947021484375, 1.05841064453125, 1.1697998046875, 1.28118896484375, 1.392578125, 1.50396728515625, 1.6153564453125, 1.72674560546875, 1.838134765625, 1.94952392578125, 2.0609130859375, 2.17230224609375, 2.28369140625, 2.39508056640625, 2.5064697265625, 2.61785888671875, 2.729248046875, 2.84063720703125, 2.9520263671875, 3.06341552734375, 3.1748046875, 3.28619384765625, 3.3975830078125, 3.50897216796875, 3.620361328125, 3.73175048828125, 3.8431396484375, 3.95452880859375, 4.06591796875, 4.17730712890625, 4.2886962890625, 4.40008544921875, 4.511474609375, 4.62286376953125, 4.7342529296875, 4.84564208984375, 4.95703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 14.0, 10.0, 19.0, 15.0, 16.0, 41.0, 62.0, 78.0, 100.0, 113.0, 127.0, 127.0, 94.0, 63.0, 35.0, 35.0, 15.0, 12.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.71515464782715, -17.3337345123291, -16.952316284179688, -16.57089614868164, -16.189476013183594, -15.80805778503418, -15.426637649536133, -15.045218467712402, -14.663799285888672, -14.282380104064941, -13.900960922241211, -13.519540786743164, -13.138121604919434, -12.756702423095703, -12.375282287597656, -11.993863105773926, -11.612443923950195, -11.231024742126465, -10.849605560302734, -10.468185424804688, -10.086766242980957, -9.705347061157227, -9.32392692565918, -8.94250774383545, -8.561088562011719, -8.179669380187988, -7.7982497215271, -7.416830062866211, -7.0354108810424805, -6.65399169921875, -6.272572040557861, -5.891152381896973, -5.509732246398926, -5.128313064575195, -4.746893405914307, -4.365473747253418, -3.9840545654296875, -3.602635145187378, -3.2212157249450684, -2.839796304702759, -2.458376884460449, -2.0769574642181396, -1.69553804397583, -1.3141186237335205, -0.9326992034912109, -0.5512797832489014, -0.1698603630065918, 0.21155905723571777, 0.5929784774780273, 0.9743978977203369, 1.3558173179626465, 1.737236738204956, 2.1186561584472656, 2.500075578689575, 2.8814949989318848, 3.2629144191741943, 3.644333839416504, 4.025753021240234, 4.407172679901123, 4.788592338562012, 5.170011520385742, 5.551430702209473, 5.932850360870361, 6.31427001953125, 6.6956892013549805]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 7.0, 11.0, 5.0, 9.0, 10.0, 16.0, 15.0, 18.0, 19.0, 24.0, 29.0, 21.0, 28.0, 34.0, 45.0, 46.0, 39.0, 52.0, 47.0, 37.0, 41.0, 46.0, 44.0, 34.0, 26.0, 33.0, 29.0, 31.0, 28.0, 26.0, 29.0, 13.0, 15.0, 14.0, 10.0, 11.0, 9.0, 7.0, 7.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.989354133605957, -7.746500492095947, -7.503647327423096, -7.260793685913086, -7.017940521240234, -6.775086879730225, -6.532233238220215, -6.289380073547363, -6.0465264320373535, -5.803672790527344, -5.560819625854492, -5.317965984344482, -5.075112342834473, -4.832259178161621, -4.589405536651611, -4.346551895141602, -4.10369873046875, -3.8608453273773193, -3.6179919242858887, -3.375138282775879, -3.1322848796844482, -2.8894314765930176, -2.646577835083008, -2.403724431991577, -2.1608710289001465, -1.9180176258087158, -1.6751641035079956, -1.4323105812072754, -1.1894571781158447, -0.9466037750244141, -0.7037502527236938, -0.46089673042297363, -0.21804332733154297, 0.02481013536453247, 0.2676635980606079, 0.5105170607566833, 0.7533705234527588, 0.9962239265441895, 1.2390774488449097, 1.4819309711456299, 1.7247843742370605, 1.9676377773284912, 2.210491180419922, 2.4533448219299316, 2.6961982250213623, 2.939051628112793, 3.1819052696228027, 3.4247586727142334, 3.667612075805664, 3.9104654788970947, 4.153318881988525, 4.396172523498535, 4.639025688171387, 4.8818793296813965, 5.124732971191406, 5.367586135864258, 5.610439777374268, 5.853293418884277, 6.096146583557129, 6.339000225067139, 6.581853866577148, 6.82470703125, 7.06756067276001, 7.3104143142700195, 7.553267478942871]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 18.0, 10.0, 17.0, 31.0, 38.0, 88.0, 133.0, 220.0, 429.0, 815.0, 1950.0, 5641.0, 23045.0, 221576.0, 3853098.0, 69572.0, 11873.0, 3288.0, 1210.0, 572.0, 295.0, 159.0, 82.0, 39.0, 21.0, 19.0, 14.0, 3.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.66796875, -3.574615478515625, -3.48126220703125, -3.387908935546875, -3.2945556640625, -3.201202392578125, -3.10784912109375, -3.014495849609375, -2.921142578125, -2.827789306640625, -2.73443603515625, -2.641082763671875, -2.5477294921875, -2.454376220703125, -2.36102294921875, -2.267669677734375, -2.17431640625, -2.080963134765625, -1.98760986328125, -1.894256591796875, -1.8009033203125, -1.707550048828125, -1.61419677734375, -1.520843505859375, -1.427490234375, -1.334136962890625, -1.24078369140625, -1.147430419921875, -1.0540771484375, -0.960723876953125, -0.86737060546875, -0.774017333984375, -0.6806640625, -0.587310791015625, -0.49395751953125, -0.400604248046875, -0.3072509765625, -0.213897705078125, -0.12054443359375, -0.027191162109375, 0.066162109375, 0.159515380859375, 0.25286865234375, 0.346221923828125, 0.4395751953125, 0.532928466796875, 0.62628173828125, 0.719635009765625, 0.81298828125, 0.906341552734375, 0.99969482421875, 1.093048095703125, 1.1864013671875, 1.279754638671875, 1.37310791015625, 1.466461181640625, 1.559814453125, 1.653167724609375, 1.74652099609375, 1.839874267578125, 1.9332275390625, 2.026580810546875, 2.11993408203125, 2.213287353515625, 2.306640625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 10.0, 16.0, 24.0, 32.0, 35.0, 63.0, 77.0, 90.0, 97.0, 123.0, 98.0, 89.0, 71.0, 54.0, 46.0, 30.0, 17.0, 10.0, 5.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.796875, -0.77490234375, -0.7529296875, -0.73095703125, -0.708984375, -0.68701171875, -0.6650390625, -0.64306640625, -0.62109375, -0.59912109375, -0.5771484375, -0.55517578125, -0.533203125, -0.51123046875, -0.4892578125, -0.46728515625, -0.4453125, -0.42333984375, -0.4013671875, -0.37939453125, -0.357421875, -0.33544921875, -0.3134765625, -0.29150390625, -0.26953125, -0.24755859375, -0.2255859375, -0.20361328125, -0.181640625, -0.15966796875, -0.1376953125, -0.11572265625, -0.09375, -0.07177734375, -0.0498046875, -0.02783203125, -0.005859375, 0.01611328125, 0.0380859375, 0.06005859375, 0.08203125, 0.10400390625, 0.1259765625, 0.14794921875, 0.169921875, 0.19189453125, 0.2138671875, 0.23583984375, 0.2578125, 0.27978515625, 0.3017578125, 0.32373046875, 0.345703125, 0.36767578125, 0.3896484375, 0.41162109375, 0.43359375, 0.45556640625, 0.4775390625, 0.49951171875, 0.521484375, 0.54345703125, 0.5654296875, 0.58740234375, 0.609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 5.0, 10.0, 8.0, 12.0, 27.0, 29.0, 30.0, 62.0, 86.0, 100.0, 195.0, 238.0, 438.0, 803.0, 1596.0, 3700.0, 11665.0, 60388.0, 3450875.0, 613733.0, 36085.0, 8202.0, 2899.0, 1258.0, 675.0, 389.0, 229.0, 178.0, 99.0, 72.0, 51.0, 39.0, 28.0, 19.0, 19.0, 14.0, 9.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.61328125, -2.525787353515625, -2.43829345703125, -2.350799560546875, -2.2633056640625, -2.175811767578125, -2.08831787109375, -2.000823974609375, -1.913330078125, -1.825836181640625, -1.73834228515625, -1.650848388671875, -1.5633544921875, -1.475860595703125, -1.38836669921875, -1.300872802734375, -1.21337890625, -1.125885009765625, -1.03839111328125, -0.950897216796875, -0.8634033203125, -0.775909423828125, -0.68841552734375, -0.600921630859375, -0.513427734375, -0.425933837890625, -0.33843994140625, -0.250946044921875, -0.1634521484375, -0.075958251953125, 0.01153564453125, 0.099029541015625, 0.1865234375, 0.274017333984375, 0.36151123046875, 0.449005126953125, 0.5364990234375, 0.623992919921875, 0.71148681640625, 0.798980712890625, 0.886474609375, 0.973968505859375, 1.06146240234375, 1.148956298828125, 1.2364501953125, 1.323944091796875, 1.41143798828125, 1.498931884765625, 1.58642578125, 1.673919677734375, 1.76141357421875, 1.848907470703125, 1.9364013671875, 2.023895263671875, 2.11138916015625, 2.198883056640625, 2.286376953125, 2.373870849609375, 2.46136474609375, 2.548858642578125, 2.6363525390625, 2.723846435546875, 2.81134033203125, 2.898834228515625, 2.986328125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 7.0, 8.0, 13.0, 17.0, 29.0, 53.0, 102.0, 247.0, 2030.0, 1163.0, 198.0, 86.0, 50.0, 19.0, 16.0, 12.0, 8.0, 10.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9931640625, -1.94195556640625, -1.8907470703125, -1.83953857421875, -1.788330078125, -1.73712158203125, -1.6859130859375, -1.63470458984375, -1.58349609375, -1.53228759765625, -1.4810791015625, -1.42987060546875, -1.378662109375, -1.32745361328125, -1.2762451171875, -1.22503662109375, -1.173828125, -1.12261962890625, -1.0714111328125, -1.02020263671875, -0.968994140625, -0.91778564453125, -0.8665771484375, -0.81536865234375, -0.76416015625, -0.71295166015625, -0.6617431640625, -0.61053466796875, -0.559326171875, -0.50811767578125, -0.4569091796875, -0.40570068359375, -0.3544921875, -0.30328369140625, -0.2520751953125, -0.20086669921875, -0.149658203125, -0.09844970703125, -0.0472412109375, 0.00396728515625, 0.05517578125, 0.10638427734375, 0.1575927734375, 0.20880126953125, 0.260009765625, 0.31121826171875, 0.3624267578125, 0.41363525390625, 0.46484375, 0.51605224609375, 0.5672607421875, 0.61846923828125, 0.669677734375, 0.72088623046875, 0.7720947265625, 0.82330322265625, 0.87451171875, 0.92572021484375, 0.9769287109375, 1.02813720703125, 1.079345703125, 1.13055419921875, 1.1817626953125, 1.23297119140625, 1.2841796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 25.0, 25.0, 56.0, 85.0, 118.0, 161.0, 187.0, 137.0, 86.0, 48.0, 28.0, 19.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12812614440918, -6.90464448928833, -6.6811628341674805, -6.457681179046631, -6.234199523925781, -6.010717868804932, -5.787236213684082, -5.563754558563232, -5.340272903442383, -5.116791248321533, -4.893309593200684, -4.669827938079834, -4.446346282958984, -4.222864627838135, -3.999382972717285, -3.7759013175964355, -3.552419662475586, -3.3289380073547363, -3.1054563522338867, -2.881974697113037, -2.6584930419921875, -2.435011386871338, -2.2115297317504883, -1.9880480766296387, -1.764566421508789, -1.5410847663879395, -1.3176031112670898, -1.0941214561462402, -0.8706398010253906, -0.647158145904541, -0.4236764907836914, -0.2001948356628418, 0.02328634262084961, 0.24676799774169922, 0.47024965286254883, 0.6937313079833984, 0.917212963104248, 1.1406946182250977, 1.3641762733459473, 1.5876579284667969, 1.8111395835876465, 2.034621238708496, 2.2581028938293457, 2.4815845489501953, 2.705066204071045, 2.9285478591918945, 3.152029514312744, 3.3755111694335938, 3.5989928245544434, 3.822474479675293, 4.045956134796143, 4.269437789916992, 4.492919445037842, 4.716401100158691, 4.939882755279541, 5.163364410400391, 5.38684606552124, 5.61032772064209, 5.8338093757629395, 6.057291030883789, 6.280772686004639, 6.504254341125488, 6.727735996246338, 6.9512176513671875, 7.174699306488037]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 6.0, 4.0, 5.0, 3.0, 4.0, 13.0, 19.0, 18.0, 12.0, 14.0, 20.0, 16.0, 27.0, 47.0, 36.0, 39.0, 46.0, 45.0, 37.0, 37.0, 49.0, 43.0, 38.0, 47.0, 25.0, 50.0, 33.0, 35.0, 30.0, 19.0, 24.0, 23.0, 17.0, 16.0, 11.0, 18.0, 11.0, 16.0, 9.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.22287654876709, -3.1301522254943848, -3.0374279022216797, -2.9447035789489746, -2.8519790172576904, -2.7592546939849854, -2.6665303707122803, -2.573806047439575, -2.481081485748291, -2.388357162475586, -2.295632839202881, -2.202908515930176, -2.1101839542388916, -2.0174596309661865, -1.9247353076934814, -1.8320109844207764, -1.7392866611480713, -1.6465623378753662, -1.5538378953933716, -1.4611135721206665, -1.3683891296386719, -1.2756648063659668, -1.1829404830932617, -1.0902161598205566, -0.997491717338562, -0.9047673344612122, -0.8120429515838623, -0.7193186283111572, -0.6265942454338074, -0.5338698625564575, -0.44114553928375244, -0.3484211564064026, -0.25569701194763184, -0.16297264397144318, -0.07024827599525452, 0.02247607707977295, 0.1152004599571228, 0.20792484283447266, 0.30064916610717773, 0.3933735489845276, 0.48609793186187744, 0.5788223147392273, 0.6715466976165771, 0.7642710208892822, 0.8569954037666321, 0.9497197866439819, 1.042444109916687, 1.1351685523986816, 1.2278928756713867, 1.3206171989440918, 1.4133416414260864, 1.5060659646987915, 1.5987904071807861, 1.6915147304534912, 1.7842390537261963, 1.8769633769989014, 1.969687819480896, 2.0624122619628906, 2.1551365852355957, 2.247860908508301, 2.340585231781006, 2.433309555053711, 2.526033878326416, 2.6187584400177, 2.7114827632904053]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 10.0, 10.0, 20.0, 28.0, 27.0, 38.0, 57.0, 72.0, 103.0, 149.0, 204.0, 324.0, 470.0, 813.0, 1456.0, 2821.0, 6091.0, 13989.0, 34894.0, 95126.0, 251138.0, 356130.0, 176463.0, 64179.0, 24043.0, 10044.0, 4438.0, 2248.0, 1201.0, 666.0, 408.0, 246.0, 181.0, 102.0, 94.0, 72.0, 57.0, 40.0, 29.0, 22.0, 13.0, 11.0, 2.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5419921875, -1.4942626953125, -1.446533203125, -1.3988037109375, -1.35107421875, -1.3033447265625, -1.255615234375, -1.2078857421875, -1.16015625, -1.1124267578125, -1.064697265625, -1.0169677734375, -0.96923828125, -0.9215087890625, -0.873779296875, -0.8260498046875, -0.7783203125, -0.7305908203125, -0.682861328125, -0.6351318359375, -0.58740234375, -0.5396728515625, -0.491943359375, -0.4442138671875, -0.396484375, -0.3487548828125, -0.301025390625, -0.2532958984375, -0.20556640625, -0.1578369140625, -0.110107421875, -0.0623779296875, -0.0146484375, 0.0330810546875, 0.080810546875, 0.1285400390625, 0.17626953125, 0.2239990234375, 0.271728515625, 0.3194580078125, 0.3671875, 0.4149169921875, 0.462646484375, 0.5103759765625, 0.55810546875, 0.6058349609375, 0.653564453125, 0.7012939453125, 0.7490234375, 0.7967529296875, 0.844482421875, 0.8922119140625, 0.93994140625, 0.9876708984375, 1.035400390625, 1.0831298828125, 1.130859375, 1.1785888671875, 1.226318359375, 1.2740478515625, 1.32177734375, 1.3695068359375, 1.417236328125, 1.4649658203125, 1.5126953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 16.0, 13.0, 19.0, 37.0, 59.0, 57.0, 86.0, 92.0, 92.0, 107.0, 78.0, 90.0, 75.0, 47.0, 36.0, 26.0, 22.0, 14.0, 11.0, 1.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8134765625, -0.7908859252929688, -0.7682952880859375, -0.7457046508789062, -0.723114013671875, -0.7005233764648438, -0.6779327392578125, -0.6553421020507812, -0.63275146484375, -0.6101608276367188, -0.5875701904296875, -0.5649795532226562, -0.542388916015625, -0.5197982788085938, -0.4972076416015625, -0.47461700439453125, -0.4520263671875, -0.42943572998046875, -0.4068450927734375, -0.38425445556640625, -0.361663818359375, -0.33907318115234375, -0.3164825439453125, -0.29389190673828125, -0.27130126953125, -0.24871063232421875, -0.2261199951171875, -0.20352935791015625, -0.180938720703125, -0.15834808349609375, -0.1357574462890625, -0.11316680908203125, -0.090576171875, -0.06798553466796875, -0.0453948974609375, -0.02280426025390625, -0.000213623046875, 0.02237701416015625, 0.0449676513671875, 0.06755828857421875, 0.09014892578125, 0.11273956298828125, 0.1353302001953125, 0.15792083740234375, 0.180511474609375, 0.20310211181640625, 0.2256927490234375, 0.24828338623046875, 0.2708740234375, 0.29346466064453125, 0.3160552978515625, 0.33864593505859375, 0.361236572265625, 0.38382720947265625, 0.4064178466796875, 0.42900848388671875, 0.45159912109375, 0.47418975830078125, 0.4967803955078125, 0.5193710327148438, 0.541961669921875, 0.5645523071289062, 0.5871429443359375, 0.6097335815429688, 0.63232421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 7.0, 5.0, 6.0, 8.0, 14.0, 18.0, 22.0, 16.0, 31.0, 34.0, 70.0, 96.0, 147.0, 206.0, 349.0, 577.0, 971.0, 1798.0, 3769.0, 9451.0, 27662.0, 104562.0, 413803.0, 358449.0, 87277.0, 23759.0, 8024.0, 3393.0, 1645.0, 878.0, 509.0, 335.0, 221.0, 116.0, 78.0, 68.0, 43.0, 41.0, 21.0, 20.0, 12.0, 6.0, 10.0, 6.0, 9.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.13946533203125, -2.0679931640625, -1.99652099609375, -1.925048828125, -1.85357666015625, -1.7821044921875, -1.71063232421875, -1.63916015625, -1.56768798828125, -1.4962158203125, -1.42474365234375, -1.353271484375, -1.28179931640625, -1.2103271484375, -1.13885498046875, -1.0673828125, -0.99591064453125, -0.9244384765625, -0.85296630859375, -0.781494140625, -0.71002197265625, -0.6385498046875, -0.56707763671875, -0.49560546875, -0.42413330078125, -0.3526611328125, -0.28118896484375, -0.209716796875, -0.13824462890625, -0.0667724609375, 0.00469970703125, 0.076171875, 0.14764404296875, 0.2191162109375, 0.29058837890625, 0.362060546875, 0.43353271484375, 0.5050048828125, 0.57647705078125, 0.64794921875, 0.71942138671875, 0.7908935546875, 0.86236572265625, 0.933837890625, 1.00531005859375, 1.0767822265625, 1.14825439453125, 1.2197265625, 1.29119873046875, 1.3626708984375, 1.43414306640625, 1.505615234375, 1.57708740234375, 1.6485595703125, 1.72003173828125, 1.79150390625, 1.86297607421875, 1.9344482421875, 2.00592041015625, 2.077392578125, 2.14886474609375, 2.2203369140625, 2.29180908203125, 2.36328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 13.0, 14.0, 18.0, 17.0, 21.0, 25.0, 34.0, 36.0, 56.0, 59.0, 59.0, 58.0, 43.0, 57.0, 58.0, 75.0, 54.0, 47.0, 45.0, 41.0, 31.0, 17.0, 27.0, 17.0, 11.0, 8.0, 14.0, 5.0, 3.0, 5.0, 2.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.72265625, -2.63739013671875, -2.5521240234375, -2.46685791015625, -2.381591796875, -2.29632568359375, -2.2110595703125, -2.12579345703125, -2.04052734375, -1.95526123046875, -1.8699951171875, -1.78472900390625, -1.699462890625, -1.61419677734375, -1.5289306640625, -1.44366455078125, -1.3583984375, -1.27313232421875, -1.1878662109375, -1.10260009765625, -1.017333984375, -0.93206787109375, -0.8468017578125, -0.76153564453125, -0.67626953125, -0.59100341796875, -0.5057373046875, -0.42047119140625, -0.335205078125, -0.24993896484375, -0.1646728515625, -0.07940673828125, 0.005859375, 0.09112548828125, 0.1763916015625, 0.26165771484375, 0.346923828125, 0.43218994140625, 0.5174560546875, 0.60272216796875, 0.68798828125, 0.77325439453125, 0.8585205078125, 0.94378662109375, 1.029052734375, 1.11431884765625, 1.1995849609375, 1.28485107421875, 1.3701171875, 1.45538330078125, 1.5406494140625, 1.62591552734375, 1.711181640625, 1.79644775390625, 1.8817138671875, 1.96697998046875, 2.05224609375, 2.13751220703125, 2.2227783203125, 2.30804443359375, 2.393310546875, 2.47857666015625, 2.5638427734375, 2.64910888671875, 2.734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 12.0, 10.0, 19.0, 35.0, 44.0, 86.0, 144.0, 264.0, 466.0, 1255.0, 3861.0, 20510.0, 315868.0, 661213.0, 36144.0, 5735.0, 1568.0, 624.0, 292.0, 154.0, 95.0, 49.0, 30.0, 22.0, 19.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8310546875, -1.775787353515625, -1.72052001953125, -1.665252685546875, -1.6099853515625, -1.554718017578125, -1.49945068359375, -1.444183349609375, -1.388916015625, -1.333648681640625, -1.27838134765625, -1.223114013671875, -1.1678466796875, -1.112579345703125, -1.05731201171875, -1.002044677734375, -0.94677734375, -0.891510009765625, -0.83624267578125, -0.780975341796875, -0.7257080078125, -0.670440673828125, -0.61517333984375, -0.559906005859375, -0.504638671875, -0.449371337890625, -0.39410400390625, -0.338836669921875, -0.2835693359375, -0.228302001953125, -0.17303466796875, -0.117767333984375, -0.0625, -0.007232666015625, 0.04803466796875, 0.103302001953125, 0.1585693359375, 0.213836669921875, 0.26910400390625, 0.324371337890625, 0.379638671875, 0.434906005859375, 0.49017333984375, 0.545440673828125, 0.6007080078125, 0.655975341796875, 0.71124267578125, 0.766510009765625, 0.82177734375, 0.877044677734375, 0.93231201171875, 0.987579345703125, 1.0428466796875, 1.098114013671875, 1.15338134765625, 1.208648681640625, 1.263916015625, 1.319183349609375, 1.37445068359375, 1.429718017578125, 1.4849853515625, 1.540252685546875, 1.59552001953125, 1.650787353515625, 1.7060546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 14.0, 32.0, 32.0, 72.0, 118.0, 188.0, 198.0, 147.0, 81.0, 44.0, 27.0, 15.0, 13.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0003609657287597656, -0.0003527700901031494, -0.0003445744514465332, -0.000336378812789917, -0.0003281831741333008, -0.00031998753547668457, -0.00031179189682006836, -0.00030359625816345215, -0.00029540061950683594, -0.0002872049808502197, -0.0002790093421936035, -0.0002708137035369873, -0.0002626180648803711, -0.0002544224262237549, -0.00024622678756713867, -0.00023803114891052246, -0.00022983551025390625, -0.00022163987159729004, -0.00021344423294067383, -0.00020524859428405762, -0.0001970529556274414, -0.0001888573169708252, -0.00018066167831420898, -0.00017246603965759277, -0.00016427040100097656, -0.00015607476234436035, -0.00014787912368774414, -0.00013968348503112793, -0.00013148784637451172, -0.0001232922077178955, -0.0001150965690612793, -0.00010690093040466309, -9.870529174804688e-05, -9.050965309143066e-05, -8.231401443481445e-05, -7.411837577819824e-05, -6.592273712158203e-05, -5.772709846496582e-05, -4.953145980834961e-05, -4.13358211517334e-05, -3.314018249511719e-05, -2.4944543838500977e-05, -1.6748905181884766e-05, -8.553266525268555e-06, -3.5762786865234375e-07, 7.838010787963867e-06, 1.6033649444580078e-05, 2.422928810119629e-05, 3.24249267578125e-05, 4.062056541442871e-05, 4.881620407104492e-05, 5.701184272766113e-05, 6.520748138427734e-05, 7.340312004089355e-05, 8.159875869750977e-05, 8.979439735412598e-05, 9.799003601074219e-05, 0.0001061856746673584, 0.00011438131332397461, 0.00012257695198059082, 0.00013077259063720703, 0.00013896822929382324, 0.00014716386795043945, 0.00015535950660705566, 0.00016355514526367188]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 10.0, 23.0, 31.0, 39.0, 83.0, 157.0, 377.0, 901.0, 2944.0, 16954.0, 353301.0, 640335.0, 27450.0, 3976.0, 1101.0, 405.0, 191.0, 117.0, 60.0, 46.0, 15.0, 14.0, 9.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.220703125, -2.16241455078125, -2.1041259765625, -2.04583740234375, -1.987548828125, -1.92926025390625, -1.8709716796875, -1.81268310546875, -1.75439453125, -1.69610595703125, -1.6378173828125, -1.57952880859375, -1.521240234375, -1.46295166015625, -1.4046630859375, -1.34637451171875, -1.2880859375, -1.22979736328125, -1.1715087890625, -1.11322021484375, -1.054931640625, -0.99664306640625, -0.9383544921875, -0.88006591796875, -0.82177734375, -0.76348876953125, -0.7052001953125, -0.64691162109375, -0.588623046875, -0.53033447265625, -0.4720458984375, -0.41375732421875, -0.35546875, -0.29718017578125, -0.2388916015625, -0.18060302734375, -0.122314453125, -0.06402587890625, -0.0057373046875, 0.05255126953125, 0.11083984375, 0.16912841796875, 0.2274169921875, 0.28570556640625, 0.343994140625, 0.40228271484375, 0.4605712890625, 0.51885986328125, 0.5771484375, 0.63543701171875, 0.6937255859375, 0.75201416015625, 0.810302734375, 0.86859130859375, 0.9268798828125, 0.98516845703125, 1.04345703125, 1.10174560546875, 1.1600341796875, 1.21832275390625, 1.276611328125, 1.33489990234375, 1.3931884765625, 1.45147705078125, 1.509765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 9.0, 21.0, 30.0, 44.0, 92.0, 143.0, 189.0, 163.0, 106.0, 69.0, 51.0, 35.0, 18.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.1693267822265625, -1.113067626953125, -1.0568084716796875, -1.00054931640625, -0.9442901611328125, -0.888031005859375, -0.8317718505859375, -0.7755126953125, -0.7192535400390625, -0.662994384765625, -0.6067352294921875, -0.55047607421875, -0.4942169189453125, -0.437957763671875, -0.3816986083984375, -0.325439453125, -0.2691802978515625, -0.212921142578125, -0.1566619873046875, -0.10040283203125, -0.0441436767578125, 0.012115478515625, 0.0683746337890625, 0.1246337890625, 0.1808929443359375, 0.237152099609375, 0.2934112548828125, 0.34967041015625, 0.4059295654296875, 0.462188720703125, 0.5184478759765625, 0.57470703125, 0.6309661865234375, 0.687225341796875, 0.7434844970703125, 0.79974365234375, 0.8560028076171875, 0.912261962890625, 0.9685211181640625, 1.0247802734375, 1.0810394287109375, 1.137298583984375, 1.1935577392578125, 1.24981689453125, 1.3060760498046875, 1.362335205078125, 1.4185943603515625, 1.474853515625, 1.5311126708984375, 1.587371826171875, 1.6436309814453125, 1.69989013671875, 1.7561492919921875, 1.812408447265625, 1.8686676025390625, 1.9249267578125, 1.9811859130859375, 2.037445068359375, 2.0937042236328125, 2.14996337890625, 2.2062225341796875, 2.262481689453125, 2.3187408447265625, 2.375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 7.0, 18.0, 17.0, 22.0, 24.0, 29.0, 49.0, 67.0, 67.0, 102.0, 99.0, 103.0, 78.0, 75.0, 45.0, 49.0, 27.0, 24.0, 23.0, 19.0, 11.0, 9.0, 5.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.437044143676758, -14.044700622558594, -13.652356147766113, -13.26001262664795, -12.867668151855469, -12.475324630737305, -12.082980155944824, -11.69063663482666, -11.29829216003418, -10.905948638916016, -10.513604164123535, -10.121260643005371, -9.72891616821289, -9.336572647094727, -8.944228172302246, -8.551884651184082, -8.159540176391602, -7.767196178436279, -7.374852180480957, -6.982508182525635, -6.5901641845703125, -6.19782018661499, -5.805476188659668, -5.413132667541504, -5.02078914642334, -4.628445148468018, -4.236101150512695, -3.843757152557373, -3.451413154602051, -3.0590691566467285, -2.6667253971099854, -2.274381399154663, -1.8820371627807617, -1.4896931648254395, -1.0973491668701172, -0.7050052881240845, -0.3126612901687622, 0.07968270778656006, 0.4720265865325928, 0.864370584487915, 1.2567145824432373, 1.6490585803985596, 2.041402578353882, 2.433746337890625, 2.8260903358459473, 3.2184343338012695, 3.610778331756592, 4.003122329711914, 4.395466327667236, 4.787810325622559, 5.180154323577881, 5.572498321533203, 5.964842319488525, 6.357186317443848, 6.749529838562012, 7.141874313354492, 7.534217834472656, 7.9265618324279785, 8.3189058303833, 8.711249351501465, 9.103593826293945, 9.49593734741211, 9.88828182220459, 10.280625343322754, 10.672969818115234]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 8.0, 12.0, 10.0, 19.0, 15.0, 17.0, 22.0, 23.0, 27.0, 34.0, 33.0, 40.0, 40.0, 52.0, 31.0, 50.0, 60.0, 40.0, 62.0, 59.0, 43.0, 50.0, 36.0, 32.0, 32.0, 17.0, 27.0, 21.0, 15.0, 10.0, 12.0, 9.0, 5.0, 7.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.222931861877441, -13.821723937988281, -13.420516014099121, -13.019308090209961, -12.6181001663208, -12.21689224243164, -11.815683364868164, -11.41447639465332, -11.013267517089844, -10.612059593200684, -10.210851669311523, -9.809643745422363, -9.408435821533203, -9.007227897644043, -8.606019973754883, -8.204811096191406, -7.8036041259765625, -7.402396202087402, -7.001188278198242, -6.599980354309082, -6.198772430419922, -5.797564506530762, -5.396356105804443, -4.995148181915283, -4.593940258026123, -4.192732334136963, -3.7915244102478027, -3.3903162479400635, -2.9891083240509033, -2.587900400161743, -2.186692237854004, -1.7854843139648438, -1.38427734375, -0.9830693602561951, -0.5818613767623901, -0.18065333366394043, 0.22055459022521973, 0.6217625141143799, 1.0229706764221191, 1.4241786003112793, 1.8253865242004395, 2.2265944480895996, 2.6278023719787598, 3.029010534286499, 3.430218458175659, 3.8314263820648193, 4.232634544372559, 4.633842468261719, 5.035050392150879, 5.436258316040039, 5.837466239929199, 6.238674163818359, 6.6398820877075195, 7.04109001159668, 7.442298412322998, 7.843506336212158, 8.244714736938477, 8.645922660827637, 9.047130584716797, 9.448338508605957, 9.849546432495117, 10.250754356384277, 10.651962280273438, 11.053171157836914, 11.454378128051758]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 14.0, 15.0, 27.0, 39.0, 48.0, 104.0, 146.0, 222.0, 363.0, 696.0, 1344.0, 2780.0, 7178.0, 31153.0, 4061374.0, 70801.0, 10760.0, 3699.0, 1577.0, 841.0, 443.0, 256.0, 142.0, 92.0, 54.0, 37.0, 15.0, 8.0, 16.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.58203125, -3.481597900390625, -3.38116455078125, -3.280731201171875, -3.1802978515625, -3.079864501953125, -2.97943115234375, -2.878997802734375, -2.778564453125, -2.678131103515625, -2.57769775390625, -2.477264404296875, -2.3768310546875, -2.276397705078125, -2.17596435546875, -2.075531005859375, -1.97509765625, -1.874664306640625, -1.77423095703125, -1.673797607421875, -1.5733642578125, -1.472930908203125, -1.37249755859375, -1.272064208984375, -1.171630859375, -1.071197509765625, -0.97076416015625, -0.870330810546875, -0.7698974609375, -0.669464111328125, -0.56903076171875, -0.468597412109375, -0.3681640625, -0.267730712890625, -0.16729736328125, -0.066864013671875, 0.0335693359375, 0.134002685546875, 0.23443603515625, 0.334869384765625, 0.435302734375, 0.535736083984375, 0.63616943359375, 0.736602783203125, 0.8370361328125, 0.937469482421875, 1.03790283203125, 1.138336181640625, 1.23876953125, 1.339202880859375, 1.43963623046875, 1.540069580078125, 1.6405029296875, 1.740936279296875, 1.84136962890625, 1.941802978515625, 2.042236328125, 2.142669677734375, 2.24310302734375, 2.343536376953125, 2.4439697265625, 2.544403076171875, 2.64483642578125, 2.745269775390625, 2.845703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 7.0, 4.0, 13.0, 16.0, 25.0, 37.0, 43.0, 46.0, 47.0, 65.0, 64.0, 70.0, 72.0, 79.0, 93.0, 51.0, 53.0, 64.0, 43.0, 34.0, 19.0, 19.0, 9.0, 6.0, 8.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.806640625, -0.7826080322265625, -0.758575439453125, -0.7345428466796875, -0.71051025390625, -0.6864776611328125, -0.662445068359375, -0.6384124755859375, -0.6143798828125, -0.5903472900390625, -0.566314697265625, -0.5422821044921875, -0.51824951171875, -0.4942169189453125, -0.470184326171875, -0.4461517333984375, -0.422119140625, -0.3980865478515625, -0.374053955078125, -0.3500213623046875, -0.32598876953125, -0.3019561767578125, -0.277923583984375, -0.2538909912109375, -0.2298583984375, -0.2058258056640625, -0.181793212890625, -0.1577606201171875, -0.13372802734375, -0.1096954345703125, -0.085662841796875, -0.0616302490234375, -0.03759765625, -0.0135650634765625, 0.010467529296875, 0.0345001220703125, 0.05853271484375, 0.0825653076171875, 0.106597900390625, 0.1306304931640625, 0.1546630859375, 0.1786956787109375, 0.202728271484375, 0.2267608642578125, 0.25079345703125, 0.2748260498046875, 0.298858642578125, 0.3228912353515625, 0.346923828125, 0.3709564208984375, 0.394989013671875, 0.4190216064453125, 0.44305419921875, 0.4670867919921875, 0.491119384765625, 0.5151519775390625, 0.5391845703125, 0.5632171630859375, 0.587249755859375, 0.6112823486328125, 0.63531494140625, 0.6593475341796875, 0.683380126953125, 0.7074127197265625, 0.7314453125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 5.0, 10.0, 5.0, 17.0, 7.0, 11.0, 19.0, 33.0, 33.0, 57.0, 69.0, 65.0, 106.0, 140.0, 203.0, 336.0, 473.0, 868.0, 1938.0, 6195.0, 51302.0, 4097593.0, 26581.0, 4565.0, 1500.0, 750.0, 421.0, 269.0, 183.0, 117.0, 90.0, 80.0, 64.0, 45.0, 32.0, 27.0, 19.0, 16.0, 11.0, 10.0, 10.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.26605224609375, -5.0867919921875, -4.90753173828125, -4.728271484375, -4.54901123046875, -4.3697509765625, -4.19049072265625, -4.01123046875, -3.83197021484375, -3.6527099609375, -3.47344970703125, -3.294189453125, -3.11492919921875, -2.9356689453125, -2.75640869140625, -2.5771484375, -2.39788818359375, -2.2186279296875, -2.03936767578125, -1.860107421875, -1.68084716796875, -1.5015869140625, -1.32232666015625, -1.14306640625, -0.96380615234375, -0.7845458984375, -0.60528564453125, -0.426025390625, -0.24676513671875, -0.0675048828125, 0.11175537109375, 0.291015625, 0.47027587890625, 0.6495361328125, 0.82879638671875, 1.008056640625, 1.18731689453125, 1.3665771484375, 1.54583740234375, 1.72509765625, 1.90435791015625, 2.0836181640625, 2.26287841796875, 2.442138671875, 2.62139892578125, 2.8006591796875, 2.97991943359375, 3.1591796875, 3.33843994140625, 3.5177001953125, 3.69696044921875, 3.876220703125, 4.05548095703125, 4.2347412109375, 4.41400146484375, 4.59326171875, 4.77252197265625, 4.9517822265625, 5.13104248046875, 5.310302734375, 5.48956298828125, 5.6688232421875, 5.84808349609375, 6.02734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 7.0, 7.0, 15.0, 19.0, 88.0, 3691.0, 150.0, 58.0, 24.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.3387908935546875, -1.297698974609375, -1.2566070556640625, -1.21551513671875, -1.1744232177734375, -1.133331298828125, -1.0922393798828125, -1.0511474609375, -1.0100555419921875, -0.968963623046875, -0.9278717041015625, -0.88677978515625, -0.8456878662109375, -0.804595947265625, -0.7635040283203125, -0.722412109375, -0.6813201904296875, -0.640228271484375, -0.5991363525390625, -0.55804443359375, -0.5169525146484375, -0.475860595703125, -0.4347686767578125, -0.3936767578125, -0.3525848388671875, -0.311492919921875, -0.2704010009765625, -0.22930908203125, -0.1882171630859375, -0.147125244140625, -0.1060333251953125, -0.06494140625, -0.0238494873046875, 0.017242431640625, 0.0583343505859375, 0.09942626953125, 0.1405181884765625, 0.181610107421875, 0.2227020263671875, 0.2637939453125, 0.3048858642578125, 0.345977783203125, 0.3870697021484375, 0.42816162109375, 0.4692535400390625, 0.510345458984375, 0.5514373779296875, 0.592529296875, 0.6336212158203125, 0.674713134765625, 0.7158050537109375, 0.75689697265625, 0.7979888916015625, 0.839080810546875, 0.8801727294921875, 0.9212646484375, 0.9623565673828125, 1.003448486328125, 1.0445404052734375, 1.08563232421875, 1.1267242431640625, 1.167816162109375, 1.2089080810546875, 1.25]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 12.0, 19.0, 29.0, 52.0, 102.0, 146.0, 183.0, 143.0, 106.0, 78.0, 46.0, 23.0, 11.0, 10.0, 9.0, 3.0, 7.0, 4.0, 9.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0666720867156982, -2.963979959487915, -2.8612875938415527, -2.7585954666137695, -2.6559031009674072, -2.553210973739624, -2.4505186080932617, -2.3478264808654785, -2.245134115219116, -2.142441987991333, -2.0397496223449707, -1.937057375907898, -1.8343651294708252, -1.731673002243042, -1.6289806365966797, -1.5262885093688965, -1.4235962629318237, -1.320904016494751, -1.2182117700576782, -1.1155195236206055, -1.0128272771835327, -0.9101350903511047, -0.807442843914032, -0.7047505974769592, -0.6020583510398865, -0.4993661046028137, -0.39667385816574097, -0.2939816415309906, -0.19128939509391785, -0.08859717845916748, 0.014095067977905273, 0.11678731441497803, 0.21947956085205078, 0.32217180728912354, 0.4248640537261963, 0.527556300163269, 0.6302485466003418, 0.7329407334327698, 0.8356329798698425, 0.9383252263069153, 1.0410175323486328, 1.1437097787857056, 1.2464020252227783, 1.349094271659851, 1.4517865180969238, 1.554478645324707, 1.6571710109710693, 1.7598631381988525, 1.8625553846359253, 1.965247631072998, 2.0679397583007812, 2.1706321239471436, 2.2733242511749268, 2.376016616821289, 2.4787087440490723, 2.5814011096954346, 2.6840932369232178, 2.786785364151001, 2.8894777297973633, 2.9921698570251465, 3.094862222671509, 3.197554349899292, 3.3002467155456543, 3.4029388427734375, 3.5056312084198]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 11.0, 11.0, 17.0, 9.0, 20.0, 17.0, 20.0, 23.0, 26.0, 32.0, 27.0, 43.0, 35.0, 42.0, 31.0, 44.0, 45.0, 34.0, 31.0, 45.0, 34.0, 34.0, 38.0, 40.0, 28.0, 36.0, 29.0, 21.0, 19.0, 24.0, 16.0, 15.0, 12.0, 17.0, 11.0, 12.0, 9.0, 6.0, 13.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5509384870529175, -1.4998595714569092, -1.4487806558609009, -1.3977017402648926, -1.3466229438781738, -1.295543909072876, -1.2444651126861572, -1.193386197090149, -1.1423072814941406, -1.0912283658981323, -1.040149450302124, -0.9890705943107605, -0.9379916787147522, -0.8869127631187439, -0.8358339071273804, -0.7847549915313721, -0.7336760759353638, -0.6825971603393555, -0.6315182447433472, -0.5804393887519836, -0.5293604731559753, -0.47828155755996704, -0.42720267176628113, -0.3761237859725952, -0.3250448703765869, -0.2739659547805786, -0.2228870689868927, -0.1718081682920456, -0.12072926759719849, -0.06965035200119019, -0.018571466207504272, 0.03250741958618164, 0.08358645439147949, 0.1346653550863266, 0.1857442557811737, 0.2368231564760208, 0.2879020571708679, 0.3389809727668762, 0.39005985856056213, 0.44113874435424805, 0.49221765995025635, 0.5432965755462646, 0.594375491142273, 0.6454543471336365, 0.6965332627296448, 0.7476121783256531, 0.7986910343170166, 0.8497699499130249, 0.9008488655090332, 0.9519277811050415, 1.0030066967010498, 1.054085612297058, 1.1051645278930664, 1.1562433242797852, 1.2073222398757935, 1.2584011554718018, 1.30948007106781, 1.3605589866638184, 1.4116379022598267, 1.462716817855835, 1.5137956142425537, 1.5648746490478516, 1.6159534454345703, 1.6670323610305786, 1.718111276626587]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 8.0, 13.0, 8.0, 16.0, 27.0, 23.0, 52.0, 64.0, 129.0, 186.0, 295.0, 477.0, 820.0, 1346.0, 2348.0, 4230.0, 8324.0, 16221.0, 33541.0, 73628.0, 161718.0, 283325.0, 239198.0, 118542.0, 53336.0, 24442.0, 12016.0, 6195.0, 3385.0, 1914.0, 968.0, 619.0, 396.0, 274.0, 165.0, 107.0, 64.0, 48.0, 39.0, 21.0, 9.0, 11.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.82421875, -1.77178955078125, -1.7193603515625, -1.66693115234375, -1.614501953125, -1.56207275390625, -1.5096435546875, -1.45721435546875, -1.40478515625, -1.35235595703125, -1.2999267578125, -1.24749755859375, -1.195068359375, -1.14263916015625, -1.0902099609375, -1.03778076171875, -0.9853515625, -0.93292236328125, -0.8804931640625, -0.82806396484375, -0.775634765625, -0.72320556640625, -0.6707763671875, -0.61834716796875, -0.56591796875, -0.51348876953125, -0.4610595703125, -0.40863037109375, -0.356201171875, -0.30377197265625, -0.2513427734375, -0.19891357421875, -0.146484375, -0.09405517578125, -0.0416259765625, 0.01080322265625, 0.063232421875, 0.11566162109375, 0.1680908203125, 0.22052001953125, 0.27294921875, 0.32537841796875, 0.3778076171875, 0.43023681640625, 0.482666015625, 0.53509521484375, 0.5875244140625, 0.63995361328125, 0.6923828125, 0.74481201171875, 0.7972412109375, 0.84967041015625, 0.902099609375, 0.95452880859375, 1.0069580078125, 1.05938720703125, 1.11181640625, 1.16424560546875, 1.2166748046875, 1.26910400390625, 1.321533203125, 1.37396240234375, 1.4263916015625, 1.47882080078125, 1.53125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 12.0, 20.0, 13.0, 27.0, 33.0, 24.0, 37.0, 43.0, 65.0, 59.0, 76.0, 52.0, 60.0, 76.0, 77.0, 63.0, 48.0, 51.0, 31.0, 26.0, 26.0, 19.0, 7.0, 11.0, 6.0, 6.0, 12.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7949447631835938, -0.7710418701171875, -0.7471389770507812, -0.723236083984375, -0.6993331909179688, -0.6754302978515625, -0.6515274047851562, -0.62762451171875, -0.6037216186523438, -0.5798187255859375, -0.5559158325195312, -0.532012939453125, -0.5081100463867188, -0.4842071533203125, -0.46030426025390625, -0.4364013671875, -0.41249847412109375, -0.3885955810546875, -0.36469268798828125, -0.340789794921875, -0.31688690185546875, -0.2929840087890625, -0.26908111572265625, -0.24517822265625, -0.22127532958984375, -0.1973724365234375, -0.17346954345703125, -0.149566650390625, -0.12566375732421875, -0.1017608642578125, -0.07785797119140625, -0.053955078125, -0.03005218505859375, -0.0061492919921875, 0.01775360107421875, 0.041656494140625, 0.06555938720703125, 0.0894622802734375, 0.11336517333984375, 0.13726806640625, 0.16117095947265625, 0.1850738525390625, 0.20897674560546875, 0.232879638671875, 0.25678253173828125, 0.2806854248046875, 0.30458831787109375, 0.3284912109375, 0.35239410400390625, 0.3762969970703125, 0.40019989013671875, 0.424102783203125, 0.44800567626953125, 0.4719085693359375, 0.49581146240234375, 0.51971435546875, 0.5436172485351562, 0.5675201416015625, 0.5914230346679688, 0.615325927734375, 0.6392288208007812, 0.6631317138671875, 0.6870346069335938, 0.7109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 10.0, 9.0, 17.0, 28.0, 33.0, 72.0, 105.0, 119.0, 212.0, 385.0, 720.0, 1661.0, 4523.0, 16497.0, 77163.0, 464267.0, 395669.0, 65150.0, 14518.0, 4234.0, 1530.0, 644.0, 343.0, 206.0, 140.0, 79.0, 82.0, 50.0, 20.0, 21.0, 14.0, 5.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.693359375, -2.585418701171875, -2.47747802734375, -2.369537353515625, -2.2615966796875, -2.153656005859375, -2.04571533203125, -1.937774658203125, -1.829833984375, -1.721893310546875, -1.61395263671875, -1.506011962890625, -1.3980712890625, -1.290130615234375, -1.18218994140625, -1.074249267578125, -0.96630859375, -0.858367919921875, -0.75042724609375, -0.642486572265625, -0.5345458984375, -0.426605224609375, -0.31866455078125, -0.210723876953125, -0.102783203125, 0.005157470703125, 0.11309814453125, 0.221038818359375, 0.3289794921875, 0.436920166015625, 0.54486083984375, 0.652801513671875, 0.7607421875, 0.868682861328125, 0.97662353515625, 1.084564208984375, 1.1925048828125, 1.300445556640625, 1.40838623046875, 1.516326904296875, 1.624267578125, 1.732208251953125, 1.84014892578125, 1.948089599609375, 2.0560302734375, 2.163970947265625, 2.27191162109375, 2.379852294921875, 2.48779296875, 2.595733642578125, 2.70367431640625, 2.811614990234375, 2.9195556640625, 3.027496337890625, 3.13543701171875, 3.243377685546875, 3.351318359375, 3.459259033203125, 3.56719970703125, 3.675140380859375, 3.7830810546875, 3.891021728515625, 3.99896240234375, 4.106903076171875, 4.21484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 10.0, 9.0, 14.0, 22.0, 40.0, 30.0, 41.0, 44.0, 45.0, 69.0, 69.0, 83.0, 81.0, 65.0, 60.0, 56.0, 52.0, 39.0, 24.0, 26.0, 26.0, 28.0, 15.0, 15.0, 10.0, 5.0, 7.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.63671875, -2.50433349609375, -2.3719482421875, -2.23956298828125, -2.107177734375, -1.97479248046875, -1.8424072265625, -1.71002197265625, -1.57763671875, -1.44525146484375, -1.3128662109375, -1.18048095703125, -1.048095703125, -0.91571044921875, -0.7833251953125, -0.65093994140625, -0.5185546875, -0.38616943359375, -0.2537841796875, -0.12139892578125, 0.010986328125, 0.14337158203125, 0.2757568359375, 0.40814208984375, 0.54052734375, 0.67291259765625, 0.8052978515625, 0.93768310546875, 1.070068359375, 1.20245361328125, 1.3348388671875, 1.46722412109375, 1.599609375, 1.73199462890625, 1.8643798828125, 1.99676513671875, 2.129150390625, 2.26153564453125, 2.3939208984375, 2.52630615234375, 2.65869140625, 2.79107666015625, 2.9234619140625, 3.05584716796875, 3.188232421875, 3.32061767578125, 3.4530029296875, 3.58538818359375, 3.7177734375, 3.85015869140625, 3.9825439453125, 4.11492919921875, 4.247314453125, 4.37969970703125, 4.5120849609375, 4.64447021484375, 4.77685546875, 4.90924072265625, 5.0416259765625, 5.17401123046875, 5.306396484375, 5.43878173828125, 5.5711669921875, 5.70355224609375, 5.8359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 8.0, 5.0, 12.0, 19.0, 32.0, 47.0, 72.0, 153.0, 303.0, 687.0, 2305.0, 20766.0, 996911.0, 23335.0, 2489.0, 728.0, 311.0, 157.0, 87.0, 47.0, 23.0, 20.0, 18.0, 6.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6328125, -5.435302734375, -5.23779296875, -5.040283203125, -4.8427734375, -4.645263671875, -4.44775390625, -4.250244140625, -4.052734375, -3.855224609375, -3.65771484375, -3.460205078125, -3.2626953125, -3.065185546875, -2.86767578125, -2.670166015625, -2.47265625, -2.275146484375, -2.07763671875, -1.880126953125, -1.6826171875, -1.485107421875, -1.28759765625, -1.090087890625, -0.892578125, -0.695068359375, -0.49755859375, -0.300048828125, -0.1025390625, 0.094970703125, 0.29248046875, 0.489990234375, 0.6875, 0.885009765625, 1.08251953125, 1.280029296875, 1.4775390625, 1.675048828125, 1.87255859375, 2.070068359375, 2.267578125, 2.465087890625, 2.66259765625, 2.860107421875, 3.0576171875, 3.255126953125, 3.45263671875, 3.650146484375, 3.84765625, 4.045166015625, 4.24267578125, 4.440185546875, 4.6376953125, 4.835205078125, 5.03271484375, 5.230224609375, 5.427734375, 5.625244140625, 5.82275390625, 6.020263671875, 6.2177734375, 6.415283203125, 6.61279296875, 6.810302734375, 7.0078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 13.0, 9.0, 19.0, 67.0, 133.0, 271.0, 258.0, 133.0, 50.0, 20.0, 8.0, 8.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002892017364501953, -0.0002739168703556061, -0.00025863200426101685, -0.0002433471381664276, -0.00022806227207183838, -0.00021277740597724915, -0.0001974925398826599, -0.00018220767378807068, -0.00016692280769348145, -0.0001516379415988922, -0.00013635307550430298, -0.00012106820940971375, -0.00010578334331512451, -9.049847722053528e-05, -7.521361112594604e-05, -5.992874503135681e-05, -4.464387893676758e-05, -2.9359012842178345e-05, -1.4074146747589111e-05, 1.210719347000122e-06, 1.6495585441589355e-05, 3.178045153617859e-05, 4.706531763076782e-05, 6.235018372535706e-05, 7.763504981994629e-05, 9.291991591453552e-05, 0.00010820478200912476, 0.000123489648103714, 0.00013877451419830322, 0.00015405938029289246, 0.0001693442463874817, 0.00018462911248207092, 0.00019991397857666016, 0.0002151988446712494, 0.00023048371076583862, 0.00024576857686042786, 0.0002610534429550171, 0.0002763383090496063, 0.00029162317514419556, 0.0003069080412387848, 0.000322192907333374, 0.00033747777342796326, 0.0003527626395225525, 0.0003680475056171417, 0.00038333237171173096, 0.0003986172378063202, 0.0004139021039009094, 0.00042918696999549866, 0.0004444718360900879, 0.0004597567021846771, 0.00047504156827926636, 0.0004903264343738556, 0.0005056113004684448, 0.0005208961665630341, 0.0005361810326576233, 0.0005514658987522125, 0.0005667507648468018, 0.000582035630941391, 0.0005973204970359802, 0.0006126053631305695, 0.0006278902292251587, 0.0006431750953197479, 0.0006584599614143372, 0.0006737448275089264, 0.0006890296936035156]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 6.0, 3.0, 3.0, 2.0, 8.0, 13.0, 24.0, 29.0, 42.0, 65.0, 140.0, 341.0, 821.0, 2526.0, 14289.0, 870568.0, 150477.0, 6549.0, 1554.0, 538.0, 261.0, 112.0, 68.0, 37.0, 32.0, 14.0, 19.0, 7.0, 1.0, 2.0, 5.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.382080078125, -4.24853515625, -4.114990234375, -3.9814453125, -3.847900390625, -3.71435546875, -3.580810546875, -3.447265625, -3.313720703125, -3.18017578125, -3.046630859375, -2.9130859375, -2.779541015625, -2.64599609375, -2.512451171875, -2.37890625, -2.245361328125, -2.11181640625, -1.978271484375, -1.8447265625, -1.711181640625, -1.57763671875, -1.444091796875, -1.310546875, -1.177001953125, -1.04345703125, -0.909912109375, -0.7763671875, -0.642822265625, -0.50927734375, -0.375732421875, -0.2421875, -0.108642578125, 0.02490234375, 0.158447265625, 0.2919921875, 0.425537109375, 0.55908203125, 0.692626953125, 0.826171875, 0.959716796875, 1.09326171875, 1.226806640625, 1.3603515625, 1.493896484375, 1.62744140625, 1.760986328125, 1.89453125, 2.028076171875, 2.16162109375, 2.295166015625, 2.4287109375, 2.562255859375, 2.69580078125, 2.829345703125, 2.962890625, 3.096435546875, 3.22998046875, 3.363525390625, 3.4970703125, 3.630615234375, 3.76416015625, 3.897705078125, 4.03125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 2.0, 6.0, 6.0, 17.0, 28.0, 50.0, 116.0, 190.0, 225.0, 142.0, 90.0, 41.0, 30.0, 25.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.05078125, -2.95330810546875, -2.8558349609375, -2.75836181640625, -2.660888671875, -2.56341552734375, -2.4659423828125, -2.36846923828125, -2.27099609375, -2.17352294921875, -2.0760498046875, -1.97857666015625, -1.881103515625, -1.78363037109375, -1.6861572265625, -1.58868408203125, -1.4912109375, -1.39373779296875, -1.2962646484375, -1.19879150390625, -1.101318359375, -1.00384521484375, -0.9063720703125, -0.80889892578125, -0.71142578125, -0.61395263671875, -0.5164794921875, -0.41900634765625, -0.321533203125, -0.22406005859375, -0.1265869140625, -0.02911376953125, 0.068359375, 0.16583251953125, 0.2633056640625, 0.36077880859375, 0.458251953125, 0.55572509765625, 0.6531982421875, 0.75067138671875, 0.84814453125, 0.94561767578125, 1.0430908203125, 1.14056396484375, 1.238037109375, 1.33551025390625, 1.4329833984375, 1.53045654296875, 1.6279296875, 1.72540283203125, 1.8228759765625, 1.92034912109375, 2.017822265625, 2.11529541015625, 2.2127685546875, 2.31024169921875, 2.40771484375, 2.50518798828125, 2.6026611328125, 2.70013427734375, 2.797607421875, 2.89508056640625, 2.9925537109375, 3.09002685546875, 3.1875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 11.0, 15.0, 22.0, 48.0, 55.0, 87.0, 108.0, 120.0, 141.0, 137.0, 73.0, 60.0, 35.0, 41.0, 21.0, 12.0, 3.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.72735023498535, -24.90595817565918, -24.084566116333008, -23.263174057006836, -22.441781997680664, -21.620389938354492, -20.798995971679688, -19.977603912353516, -19.156211853027344, -18.334819793701172, -17.513427734375, -16.692035675048828, -15.870643615722656, -15.049251556396484, -14.227858543395996, -13.406466484069824, -12.585075378417969, -11.763683319091797, -10.942291259765625, -10.120899200439453, -9.299507141113281, -8.47811508178711, -7.656722068786621, -6.835330009460449, -6.013937950134277, -5.1925458908081055, -4.371153831481934, -3.5497612953186035, -2.7283692359924316, -1.9069771766662598, -1.0855846405029297, -0.2641925811767578, 0.5571994781494141, 1.3785916566848755, 2.199983835220337, 3.021376132965088, 3.8427681922912598, 4.664160251617432, 5.485552787780762, 6.306944847106934, 7.1283369064331055, 7.949728965759277, 8.77112102508545, 9.592514038085938, 10.41390609741211, 11.235298156738281, 12.056690216064453, 12.878082275390625, 13.699474334716797, 14.520866394042969, 15.34225845336914, 16.163650512695312, 16.985042572021484, 17.806434631347656, 18.627826690673828, 19.44921875, 20.270610809326172, 21.092002868652344, 21.913394927978516, 22.734786987304688, 23.55617904663086, 24.37757110595703, 25.198963165283203, 26.020355224609375, 26.84174919128418]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 6.0, 13.0, 9.0, 10.0, 12.0, 17.0, 17.0, 26.0, 25.0, 30.0, 33.0, 33.0, 33.0, 26.0, 45.0, 48.0, 34.0, 51.0, 46.0, 50.0, 39.0, 38.0, 36.0, 41.0, 44.0, 41.0, 34.0, 26.0, 30.0, 17.0, 21.0, 13.0, 9.0, 10.0, 13.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.515485763549805, -15.02234935760498, -14.529212951660156, -14.036076545715332, -13.542940139770508, -13.0498046875, -12.55666732788086, -12.063531875610352, -11.570395469665527, -11.077259063720703, -10.584122657775879, -10.090986251831055, -9.59784984588623, -9.104713439941406, -8.611577987670898, -8.118441581726074, -7.625304698944092, -7.132168292999268, -6.639031887054443, -6.145895957946777, -5.652759552001953, -5.159623146057129, -4.666486740112305, -4.1733503341674805, -3.6802141666412354, -3.187077760696411, -2.693941593170166, -2.200805187225342, -1.7076689004898071, -1.2145326137542725, -0.7213962078094482, -0.22826004028320312, 0.2648763656616211, 0.7580126523971558, 1.2511489391326904, 1.7442853450775146, 2.2374215126037598, 2.730557918548584, 3.223694324493408, 3.7168304920196533, 4.209966659545898, 4.703103065490723, 5.196239471435547, 5.689375877380371, 6.182511806488037, 6.675648212432861, 7.1687846183776855, 7.661920547485352, 8.155057907104492, 8.648194313049316, 9.14133071899414, 9.634467124938965, 10.127603530883789, 10.620738983154297, 11.113876342773438, 11.607011795043945, 12.10014820098877, 12.593284606933594, 13.086421012878418, 13.579557418823242, 14.072693824768066, 14.56583023071289, 15.058965682983398, 15.552102088928223, 16.045238494873047]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 8.0, 2.0, 15.0, 10.0, 10.0, 12.0, 20.0, 28.0, 54.0, 65.0, 109.0, 174.0, 317.0, 553.0, 1057.0, 2434.0, 7485.0, 42485.0, 4057913.0, 66931.0, 9099.0, 2827.0, 1223.0, 587.0, 312.0, 215.0, 113.0, 85.0, 43.0, 24.0, 23.0, 15.0, 6.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.96484375, -4.829132080078125, -4.69342041015625, -4.557708740234375, -4.4219970703125, -4.286285400390625, -4.15057373046875, -4.014862060546875, -3.879150390625, -3.743438720703125, -3.60772705078125, -3.472015380859375, -3.3363037109375, -3.200592041015625, -3.06488037109375, -2.929168701171875, -2.79345703125, -2.657745361328125, -2.52203369140625, -2.386322021484375, -2.2506103515625, -2.114898681640625, -1.97918701171875, -1.843475341796875, -1.707763671875, -1.572052001953125, -1.43634033203125, -1.300628662109375, -1.1649169921875, -1.029205322265625, -0.89349365234375, -0.757781982421875, -0.6220703125, -0.486358642578125, -0.35064697265625, -0.214935302734375, -0.0792236328125, 0.056488037109375, 0.19219970703125, 0.327911376953125, 0.463623046875, 0.599334716796875, 0.73504638671875, 0.870758056640625, 1.0064697265625, 1.142181396484375, 1.27789306640625, 1.413604736328125, 1.54931640625, 1.685028076171875, 1.82073974609375, 1.956451416015625, 2.0921630859375, 2.227874755859375, 2.36358642578125, 2.499298095703125, 2.635009765625, 2.770721435546875, 2.90643310546875, 3.042144775390625, 3.1778564453125, 3.313568115234375, 3.44927978515625, 3.584991455078125, 3.720703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 10.0, 15.0, 14.0, 24.0, 28.0, 33.0, 39.0, 38.0, 46.0, 55.0, 64.0, 70.0, 73.0, 60.0, 66.0, 52.0, 63.0, 50.0, 39.0, 23.0, 29.0, 22.0, 17.0, 8.0, 7.0, 6.0, 12.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8130264282226562, -0.7886505126953125, -0.7642745971679688, -0.739898681640625, -0.7155227661132812, -0.6911468505859375, -0.6667709350585938, -0.64239501953125, -0.6180191040039062, -0.5936431884765625, -0.5692672729492188, -0.544891357421875, -0.5205154418945312, -0.4961395263671875, -0.47176361083984375, -0.4473876953125, -0.42301177978515625, -0.3986358642578125, -0.37425994873046875, -0.349884033203125, -0.32550811767578125, -0.3011322021484375, -0.27675628662109375, -0.25238037109375, -0.22800445556640625, -0.2036285400390625, -0.17925262451171875, -0.154876708984375, -0.13050079345703125, -0.1061248779296875, -0.08174896240234375, -0.057373046875, -0.03299713134765625, -0.0086212158203125, 0.01575469970703125, 0.040130615234375, 0.06450653076171875, 0.0888824462890625, 0.11325836181640625, 0.13763427734375, 0.16201019287109375, 0.1863861083984375, 0.21076202392578125, 0.235137939453125, 0.25951385498046875, 0.2838897705078125, 0.30826568603515625, 0.3326416015625, 0.35701751708984375, 0.3813934326171875, 0.40576934814453125, 0.430145263671875, 0.45452117919921875, 0.4788970947265625, 0.5032730102539062, 0.52764892578125, 0.5520248413085938, 0.5764007568359375, 0.6007766723632812, 0.625152587890625, 0.6495285034179688, 0.6739044189453125, 0.6982803344726562, 0.72265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 6.0, 4.0, 3.0, 6.0, 7.0, 10.0, 10.0, 22.0, 22.0, 14.0, 34.0, 53.0, 57.0, 104.0, 199.0, 346.0, 606.0, 1119.0, 2418.0, 5557.0, 14563.0, 58419.0, 3904195.0, 166907.0, 24615.0, 8129.0, 3435.0, 1540.0, 784.0, 428.0, 234.0, 125.0, 68.0, 67.0, 37.0, 24.0, 19.0, 16.0, 13.0, 6.0, 9.0, 9.0, 9.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.48828125, -4.3421630859375, -4.196044921875, -4.0499267578125, -3.90380859375, -3.7576904296875, -3.611572265625, -3.4654541015625, -3.3193359375, -3.1732177734375, -3.027099609375, -2.8809814453125, -2.73486328125, -2.5887451171875, -2.442626953125, -2.2965087890625, -2.150390625, -2.0042724609375, -1.858154296875, -1.7120361328125, -1.56591796875, -1.4197998046875, -1.273681640625, -1.1275634765625, -0.9814453125, -0.8353271484375, -0.689208984375, -0.5430908203125, -0.39697265625, -0.2508544921875, -0.104736328125, 0.0413818359375, 0.1875, 0.3336181640625, 0.479736328125, 0.6258544921875, 0.77197265625, 0.9180908203125, 1.064208984375, 1.2103271484375, 1.3564453125, 1.5025634765625, 1.648681640625, 1.7947998046875, 1.94091796875, 2.0870361328125, 2.233154296875, 2.3792724609375, 2.525390625, 2.6715087890625, 2.817626953125, 2.9637451171875, 3.10986328125, 3.2559814453125, 3.402099609375, 3.5482177734375, 3.6943359375, 3.8404541015625, 3.986572265625, 4.1326904296875, 4.27880859375, 4.4249267578125, 4.571044921875, 4.7171630859375, 4.86328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 7.0, 5.0, 6.0, 8.0, 12.0, 33.0, 32.0, 76.0, 238.0, 3226.0, 254.0, 62.0, 52.0, 10.0, 18.0, 12.0, 4.0, 8.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.0078125, -1.9654998779296875, -1.923187255859375, -1.8808746337890625, -1.83856201171875, -1.7962493896484375, -1.753936767578125, -1.7116241455078125, -1.6693115234375, -1.6269989013671875, -1.584686279296875, -1.5423736572265625, -1.50006103515625, -1.4577484130859375, -1.415435791015625, -1.3731231689453125, -1.330810546875, -1.2884979248046875, -1.246185302734375, -1.2038726806640625, -1.16156005859375, -1.1192474365234375, -1.076934814453125, -1.0346221923828125, -0.9923095703125, -0.9499969482421875, -0.907684326171875, -0.8653717041015625, -0.82305908203125, -0.7807464599609375, -0.738433837890625, -0.6961212158203125, -0.65380859375, -0.6114959716796875, -0.569183349609375, -0.5268707275390625, -0.48455810546875, -0.4422454833984375, -0.399932861328125, -0.3576202392578125, -0.3153076171875, -0.2729949951171875, -0.230682373046875, -0.1883697509765625, -0.14605712890625, -0.1037445068359375, -0.061431884765625, -0.0191192626953125, 0.023193359375, 0.0655059814453125, 0.107818603515625, 0.1501312255859375, 0.19244384765625, 0.2347564697265625, 0.277069091796875, 0.3193817138671875, 0.3616943359375, 0.4040069580078125, 0.446319580078125, 0.4886322021484375, 0.53094482421875, 0.5732574462890625, 0.615570068359375, 0.6578826904296875, 0.7001953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 20.0, 36.0, 85.0, 148.0, 231.0, 197.0, 150.0, 67.0, 42.0, 16.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.93954849243164, -10.662216186523438, -10.384883880615234, -10.107551574707031, -9.830219268798828, -9.552886962890625, -9.275554656982422, -8.998222351074219, -8.720890045166016, -8.443557739257812, -8.16622543334961, -7.888893127441406, -7.611560821533203, -7.334228515625, -7.056896209716797, -6.779563903808594, -6.502231597900391, -6.2248992919921875, -5.947566986083984, -5.670234680175781, -5.392902374267578, -5.115570068359375, -4.838237762451172, -4.560905456542969, -4.283573150634766, -4.0062408447265625, -3.7289085388183594, -3.4515762329101562, -3.174243927001953, -2.89691162109375, -2.619579315185547, -2.3422470092773438, -2.0649147033691406, -1.7875823974609375, -1.5102500915527344, -1.2329177856445312, -0.9555854797363281, -0.678253173828125, -0.4009208679199219, -0.12358856201171875, 0.15374374389648438, 0.4310760498046875, 0.7084083557128906, 0.9857406616210938, 1.2630729675292969, 1.5404052734375, 1.8177375793457031, 2.0950698852539062, 2.3724021911621094, 2.6497344970703125, 2.9270668029785156, 3.2043991088867188, 3.481731414794922, 3.759063720703125, 4.036396026611328, 4.313728332519531, 4.591060638427734, 4.8683929443359375, 5.145725250244141, 5.423057556152344, 5.700389862060547, 5.97772216796875, 6.255054473876953, 6.532386779785156, 6.809719085693359]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 10.0, 3.0, 7.0, 16.0, 9.0, 13.0, 21.0, 24.0, 19.0, 28.0, 36.0, 46.0, 37.0, 55.0, 47.0, 49.0, 58.0, 54.0, 51.0, 57.0, 51.0, 52.0, 39.0, 38.0, 34.0, 33.0, 31.0, 26.0, 18.0, 22.0, 9.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5569868087768555, -3.4534077644348145, -3.3498284816741943, -3.2462494373321533, -3.142670154571533, -3.039091110229492, -2.935512065887451, -2.83193302154541, -2.72835373878479, -2.624774694442749, -2.521195411682129, -2.417616367340088, -2.314037322998047, -2.2104580402374268, -2.1068789958953857, -2.0032997131347656, -1.8997206687927246, -1.796141505241394, -1.6925623416900635, -1.5889832973480225, -1.485404133796692, -1.3818249702453613, -1.2782459259033203, -1.1746667623519897, -1.0710875988006592, -0.9675084352493286, -0.8639293313026428, -0.760350227355957, -0.6567710638046265, -0.5531919002532959, -0.4496127963066101, -0.3460336923599243, -0.24245452880859375, -0.13887539505958557, -0.03529626131057739, 0.06828287243843079, 0.17186200618743896, 0.27544116973876953, 0.3790202736854553, 0.4825993776321411, 0.5861785411834717, 0.6897577047348022, 0.793336808681488, 0.8969159126281738, 1.0004950761795044, 1.104074239730835, 1.207653284072876, 1.3112324476242065, 1.414811611175537, 1.5183907747268677, 1.6219699382781982, 1.7255489826202393, 1.8291281461715698, 1.9327073097229004, 2.0362863540649414, 2.1398653984069824, 2.2434446811676025, 2.3470237255096436, 2.4506030082702637, 2.5541820526123047, 2.6577610969543457, 2.761340379714966, 2.864919424057007, 2.968498706817627, 3.072077751159668]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 7.0, 15.0, 17.0, 12.0, 16.0, 36.0, 50.0, 56.0, 103.0, 156.0, 281.0, 462.0, 818.0, 1414.0, 2703.0, 5522.0, 12155.0, 30400.0, 85345.0, 267228.0, 402224.0, 153263.0, 50650.0, 18996.0, 8231.0, 3865.0, 1955.0, 1028.0, 560.0, 372.0, 219.0, 142.0, 86.0, 57.0, 30.0, 25.0, 13.0, 14.0, 7.0, 7.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.338714599609375, -2.26141357421875, -2.184112548828125, -2.1068115234375, -2.029510498046875, -1.95220947265625, -1.874908447265625, -1.797607421875, -1.720306396484375, -1.64300537109375, -1.565704345703125, -1.4884033203125, -1.411102294921875, -1.33380126953125, -1.256500244140625, -1.17919921875, -1.101898193359375, -1.02459716796875, -0.947296142578125, -0.8699951171875, -0.792694091796875, -0.71539306640625, -0.638092041015625, -0.560791015625, -0.483489990234375, -0.40618896484375, -0.328887939453125, -0.2515869140625, -0.174285888671875, -0.09698486328125, -0.019683837890625, 0.0576171875, 0.134918212890625, 0.21221923828125, 0.289520263671875, 0.3668212890625, 0.444122314453125, 0.52142333984375, 0.598724365234375, 0.676025390625, 0.753326416015625, 0.83062744140625, 0.907928466796875, 0.9852294921875, 1.062530517578125, 1.13983154296875, 1.217132568359375, 1.29443359375, 1.371734619140625, 1.44903564453125, 1.526336669921875, 1.6036376953125, 1.680938720703125, 1.75823974609375, 1.835540771484375, 1.912841796875, 1.990142822265625, 2.06744384765625, 2.144744873046875, 2.2220458984375, 2.299346923828125, 2.37664794921875, 2.453948974609375, 2.53125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 7.0, 4.0, 6.0, 10.0, 9.0, 10.0, 14.0, 13.0, 12.0, 23.0, 15.0, 23.0, 20.0, 44.0, 39.0, 38.0, 43.0, 39.0, 66.0, 45.0, 47.0, 57.0, 43.0, 47.0, 51.0, 47.0, 43.0, 28.0, 26.0, 22.0, 22.0, 21.0, 12.0, 16.0, 8.0, 7.0, 7.0, 8.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.82958984375, -0.8059921264648438, -0.7823944091796875, -0.7587966918945312, -0.735198974609375, -0.7116012573242188, -0.6880035400390625, -0.6644058227539062, -0.64080810546875, -0.6172103881835938, -0.5936126708984375, -0.5700149536132812, -0.546417236328125, -0.5228195190429688, -0.4992218017578125, -0.47562408447265625, -0.4520263671875, -0.42842864990234375, -0.4048309326171875, -0.38123321533203125, -0.357635498046875, -0.33403778076171875, -0.3104400634765625, -0.28684234619140625, -0.26324462890625, -0.23964691162109375, -0.2160491943359375, -0.19245147705078125, -0.168853759765625, -0.14525604248046875, -0.1216583251953125, -0.09806060791015625, -0.074462890625, -0.05086517333984375, -0.0272674560546875, -0.00366973876953125, 0.019927978515625, 0.04352569580078125, 0.0671234130859375, 0.09072113037109375, 0.11431884765625, 0.13791656494140625, 0.1615142822265625, 0.18511199951171875, 0.208709716796875, 0.23230743408203125, 0.2559051513671875, 0.27950286865234375, 0.3031005859375, 0.32669830322265625, 0.3502960205078125, 0.37389373779296875, 0.397491455078125, 0.42108917236328125, 0.4446868896484375, 0.46828460693359375, 0.49188232421875, 0.5154800415039062, 0.5390777587890625, 0.5626754760742188, 0.586273193359375, 0.6098709106445312, 0.6334686279296875, 0.6570663452148438, 0.6806640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 4.0, 7.0, 10.0, 12.0, 15.0, 28.0, 30.0, 53.0, 97.0, 164.0, 398.0, 1130.0, 4475.0, 38635.0, 851888.0, 139527.0, 9203.0, 1773.0, 547.0, 240.0, 116.0, 55.0, 50.0, 32.0, 19.0, 15.0, 9.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.3707275390625, -6.132080078125, -5.8934326171875, -5.65478515625, -5.4161376953125, -5.177490234375, -4.9388427734375, -4.7001953125, -4.4615478515625, -4.222900390625, -3.9842529296875, -3.74560546875, -3.5069580078125, -3.268310546875, -3.0296630859375, -2.791015625, -2.5523681640625, -2.313720703125, -2.0750732421875, -1.83642578125, -1.5977783203125, -1.359130859375, -1.1204833984375, -0.8818359375, -0.6431884765625, -0.404541015625, -0.1658935546875, 0.07275390625, 0.3114013671875, 0.550048828125, 0.7886962890625, 1.02734375, 1.2659912109375, 1.504638671875, 1.7432861328125, 1.98193359375, 2.2205810546875, 2.459228515625, 2.6978759765625, 2.9365234375, 3.1751708984375, 3.413818359375, 3.6524658203125, 3.89111328125, 4.1297607421875, 4.368408203125, 4.6070556640625, 4.845703125, 5.0843505859375, 5.322998046875, 5.5616455078125, 5.80029296875, 6.0389404296875, 6.277587890625, 6.5162353515625, 6.7548828125, 6.9935302734375, 7.232177734375, 7.4708251953125, 7.70947265625, 7.9481201171875, 8.186767578125, 8.4254150390625, 8.6640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 5.0, 7.0, 7.0, 12.0, 6.0, 17.0, 12.0, 31.0, 26.0, 26.0, 32.0, 36.0, 37.0, 49.0, 51.0, 49.0, 65.0, 58.0, 63.0, 57.0, 56.0, 60.0, 43.0, 42.0, 33.0, 26.0, 23.0, 18.0, 14.0, 10.0, 8.0, 12.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.0234375, -4.87689208984375, -4.7303466796875, -4.58380126953125, -4.437255859375, -4.29071044921875, -4.1441650390625, -3.99761962890625, -3.85107421875, -3.70452880859375, -3.5579833984375, -3.41143798828125, -3.264892578125, -3.11834716796875, -2.9718017578125, -2.82525634765625, -2.6787109375, -2.53216552734375, -2.3856201171875, -2.23907470703125, -2.092529296875, -1.94598388671875, -1.7994384765625, -1.65289306640625, -1.50634765625, -1.35980224609375, -1.2132568359375, -1.06671142578125, -0.920166015625, -0.77362060546875, -0.6270751953125, -0.48052978515625, -0.333984375, -0.18743896484375, -0.0408935546875, 0.10565185546875, 0.252197265625, 0.39874267578125, 0.5452880859375, 0.69183349609375, 0.83837890625, 0.98492431640625, 1.1314697265625, 1.27801513671875, 1.424560546875, 1.57110595703125, 1.7176513671875, 1.86419677734375, 2.0107421875, 2.15728759765625, 2.3038330078125, 2.45037841796875, 2.596923828125, 2.74346923828125, 2.8900146484375, 3.03656005859375, 3.18310546875, 3.32965087890625, 3.4761962890625, 3.62274169921875, 3.769287109375, 3.91583251953125, 4.0623779296875, 4.20892333984375, 4.35546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 10.0, 7.0, 27.0, 28.0, 35.0, 66.0, 96.0, 236.0, 556.0, 2253.0, 23911.0, 997743.0, 20415.0, 2071.0, 560.0, 249.0, 116.0, 66.0, 30.0, 25.0, 17.0, 14.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3203125, -9.10595703125, -8.8916015625, -8.67724609375, -8.462890625, -8.24853515625, -8.0341796875, -7.81982421875, -7.60546875, -7.39111328125, -7.1767578125, -6.96240234375, -6.748046875, -6.53369140625, -6.3193359375, -6.10498046875, -5.890625, -5.67626953125, -5.4619140625, -5.24755859375, -5.033203125, -4.81884765625, -4.6044921875, -4.39013671875, -4.17578125, -3.96142578125, -3.7470703125, -3.53271484375, -3.318359375, -3.10400390625, -2.8896484375, -2.67529296875, -2.4609375, -2.24658203125, -2.0322265625, -1.81787109375, -1.603515625, -1.38916015625, -1.1748046875, -0.96044921875, -0.74609375, -0.53173828125, -0.3173828125, -0.10302734375, 0.111328125, 0.32568359375, 0.5400390625, 0.75439453125, 0.96875, 1.18310546875, 1.3974609375, 1.61181640625, 1.826171875, 2.04052734375, 2.2548828125, 2.46923828125, 2.68359375, 2.89794921875, 3.1123046875, 3.32666015625, 3.541015625, 3.75537109375, 3.9697265625, 4.18408203125, 4.3984375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 17.0, 15.0, 40.0, 63.0, 125.0, 157.0, 205.0, 149.0, 116.0, 43.0, 32.0, 15.0, 7.0, 6.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000392913818359375, -0.0003774911165237427, -0.00036206841468811035, -0.00034664571285247803, -0.0003312230110168457, -0.0003158003091812134, -0.00030037760734558105, -0.00028495490550994873, -0.0002695322036743164, -0.0002541095018386841, -0.00023868680000305176, -0.00022326409816741943, -0.0002078413963317871, -0.00019241869449615479, -0.00017699599266052246, -0.00016157329082489014, -0.0001461505889892578, -0.0001307278871536255, -0.00011530518531799316, -9.988248348236084e-05, -8.445978164672852e-05, -6.903707981109619e-05, -5.361437797546387e-05, -3.819167613983154e-05, -2.276897430419922e-05, -7.3462724685668945e-06, 8.07642936706543e-06, 2.3499131202697754e-05, 3.892183303833008e-05, 5.43445348739624e-05, 6.976723670959473e-05, 8.518993854522705e-05, 0.00010061264038085938, 0.0001160353422164917, 0.00013145804405212402, 0.00014688074588775635, 0.00016230344772338867, 0.000177726149559021, 0.00019314885139465332, 0.00020857155323028564, 0.00022399425506591797, 0.0002394169569015503, 0.0002548396587371826, 0.00027026236057281494, 0.00028568506240844727, 0.0003011077642440796, 0.0003165304660797119, 0.00033195316791534424, 0.00034737586975097656, 0.0003627985715866089, 0.0003782212734222412, 0.00039364397525787354, 0.00040906667709350586, 0.0004244893789291382, 0.0004399120807647705, 0.00045533478260040283, 0.00047075748443603516, 0.0004861801862716675, 0.0005016028881072998, 0.0005170255899429321, 0.0005324482917785645, 0.0005478709936141968, 0.0005632936954498291, 0.0005787163972854614, 0.0005941390991210938]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 13.0, 27.0, 42.0, 105.0, 271.0, 708.0, 4280.0, 262748.0, 772327.0, 6500.0, 988.0, 309.0, 114.0, 53.0, 33.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.796875, -6.5850830078125, -6.373291015625, -6.1614990234375, -5.94970703125, -5.7379150390625, -5.526123046875, -5.3143310546875, -5.1025390625, -4.8907470703125, -4.678955078125, -4.4671630859375, -4.25537109375, -4.0435791015625, -3.831787109375, -3.6199951171875, -3.408203125, -3.1964111328125, -2.984619140625, -2.7728271484375, -2.56103515625, -2.3492431640625, -2.137451171875, -1.9256591796875, -1.7138671875, -1.5020751953125, -1.290283203125, -1.0784912109375, -0.86669921875, -0.6549072265625, -0.443115234375, -0.2313232421875, -0.01953125, 0.1922607421875, 0.404052734375, 0.6158447265625, 0.82763671875, 1.0394287109375, 1.251220703125, 1.4630126953125, 1.6748046875, 1.8865966796875, 2.098388671875, 2.3101806640625, 2.52197265625, 2.7337646484375, 2.945556640625, 3.1573486328125, 3.369140625, 3.5809326171875, 3.792724609375, 4.0045166015625, 4.21630859375, 4.4281005859375, 4.639892578125, 4.8516845703125, 5.0634765625, 5.2752685546875, 5.487060546875, 5.6988525390625, 5.91064453125, 6.1224365234375, 6.334228515625, 6.5460205078125, 6.7578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 17.0, 33.0, 57.0, 142.0, 263.0, 269.0, 123.0, 56.0, 22.0, 10.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9296875, -9.722320556640625, -9.51495361328125, -9.307586669921875, -9.1002197265625, -8.892852783203125, -8.68548583984375, -8.478118896484375, -8.270751953125, -8.063385009765625, -7.85601806640625, -7.648651123046875, -7.4412841796875, -7.233917236328125, -7.02655029296875, -6.819183349609375, -6.61181640625, -6.404449462890625, -6.19708251953125, -5.989715576171875, -5.7823486328125, -5.574981689453125, -5.36761474609375, -5.160247802734375, -4.952880859375, -4.745513916015625, -4.53814697265625, -4.330780029296875, -4.1234130859375, -3.916046142578125, -3.70867919921875, -3.501312255859375, -3.2939453125, -3.086578369140625, -2.87921142578125, -2.671844482421875, -2.4644775390625, -2.257110595703125, -2.04974365234375, -1.842376708984375, -1.635009765625, -1.427642822265625, -1.22027587890625, -1.012908935546875, -0.8055419921875, -0.598175048828125, -0.39080810546875, -0.183441162109375, 0.02392578125, 0.231292724609375, 0.43865966796875, 0.646026611328125, 0.8533935546875, 1.060760498046875, 1.26812744140625, 1.475494384765625, 1.682861328125, 1.890228271484375, 2.09759521484375, 2.304962158203125, 2.5123291015625, 2.719696044921875, 2.92706298828125, 3.134429931640625, 3.341796875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 31.0, 165.0, 471.0, 284.0, 41.0, 14.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-215.9741973876953, -212.02598571777344, -208.07777404785156, -204.12957763671875, -200.18136596679688, -196.233154296875, -192.28494262695312, -188.33673095703125, -184.38851928710938, -180.4403076171875, -176.49209594726562, -172.54388427734375, -168.59568786621094, -164.64747619628906, -160.6992645263672, -156.7510528564453, -152.8028564453125, -148.85464477539062, -144.90643310546875, -140.95822143554688, -137.01002502441406, -133.0618133544922, -129.1136016845703, -125.16539001464844, -121.21717834472656, -117.26896667480469, -113.32076263427734, -109.37255096435547, -105.4243392944336, -101.47613525390625, -97.52792358398438, -93.5797119140625, -89.6314926147461, -85.68328094482422, -81.73507690429688, -77.786865234375, -73.83865356445312, -69.89044189453125, -65.9422378540039, -61.99402618408203, -58.04581832885742, -54.09761047363281, -50.14939880371094, -46.20119094848633, -42.25298309326172, -38.304771423339844, -34.356563568115234, -30.408353805541992, -26.46014404296875, -22.511934280395508, -18.563724517822266, -14.615516662597656, -10.667306900024414, -6.719097137451172, -2.7708892822265625, 1.1773204803466797, 5.125530242919922, 9.073740005493164, 13.02194881439209, 16.970157623291016, 20.918367385864258, 24.8665771484375, 28.81478500366211, 32.76299285888672, 36.711204528808594]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 3.0, 9.0, 6.0, 17.0, 10.0, 22.0, 25.0, 26.0, 25.0, 31.0, 25.0, 40.0, 30.0, 44.0, 39.0, 53.0, 46.0, 52.0, 50.0, 39.0, 45.0, 45.0, 39.0, 32.0, 28.0, 22.0, 25.0, 23.0, 27.0, 28.0, 13.0, 28.0, 8.0, 14.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.871593475341797, -16.31081199645996, -15.750032424926758, -15.189250946044922, -14.628470420837402, -14.067689895629883, -13.506909370422363, -12.946128845214844, -12.385347366333008, -11.824566841125488, -11.263786315917969, -10.703004837036133, -10.142224311828613, -9.581443786621094, -9.020663261413574, -8.459882736206055, -7.899102210998535, -7.338321685791016, -6.777540683746338, -6.216760158538818, -5.655979156494141, -5.095198631286621, -4.534418106079102, -3.973637342453003, -3.4128565788269043, -2.8520758152008057, -2.291295051574707, -1.7305145263671875, -1.1697337627410889, -0.6089529991149902, -0.0481724739074707, 0.5126082897186279, 1.0733890533447266, 1.6341698169708252, 2.194950580596924, 2.7557311058044434, 3.316511869430542, 3.8772926330566406, 4.43807315826416, 4.99885368347168, 5.559634685516357, 6.120415210723877, 6.681196212768555, 7.241976737976074, 7.802757263183594, 8.36353874206543, 8.924318313598633, 9.485099792480469, 10.045880317687988, 10.606660842895508, 11.167441368103027, 11.728221893310547, 12.289003372192383, 12.849783897399902, 13.410564422607422, 13.971344947814941, 14.532125473022461, 15.09290599822998, 15.6536865234375, 16.214468002319336, 16.77524757385254, 17.336029052734375, 17.896808624267578, 18.457590103149414, 19.01837158203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 23.0, 25.0, 29.0, 49.0, 80.0, 136.0, 299.0, 585.0, 1658.0, 6143.0, 3983055.0, 193570.0, 5781.0, 1565.0, 603.0, 269.0, 136.0, 80.0, 51.0, 40.0, 21.0, 20.0, 6.0, 8.0, 7.0, 3.0, 5.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.872314453125, -7.58056640625, -7.288818359375, -6.9970703125, -6.705322265625, -6.41357421875, -6.121826171875, -5.830078125, -5.538330078125, -5.24658203125, -4.954833984375, -4.6630859375, -4.371337890625, -4.07958984375, -3.787841796875, -3.49609375, -3.204345703125, -2.91259765625, -2.620849609375, -2.3291015625, -2.037353515625, -1.74560546875, -1.453857421875, -1.162109375, -0.870361328125, -0.57861328125, -0.286865234375, 0.0048828125, 0.296630859375, 0.58837890625, 0.880126953125, 1.171875, 1.463623046875, 1.75537109375, 2.047119140625, 2.3388671875, 2.630615234375, 2.92236328125, 3.214111328125, 3.505859375, 3.797607421875, 4.08935546875, 4.381103515625, 4.6728515625, 4.964599609375, 5.25634765625, 5.548095703125, 5.83984375, 6.131591796875, 6.42333984375, 6.715087890625, 7.0068359375, 7.298583984375, 7.59033203125, 7.882080078125, 8.173828125, 8.465576171875, 8.75732421875, 9.049072265625, 9.3408203125, 9.632568359375, 9.92431640625, 10.216064453125, 10.5078125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 15.0, 16.0, 21.0, 21.0, 38.0, 39.0, 51.0, 53.0, 72.0, 78.0, 95.0, 77.0, 59.0, 60.0, 62.0, 56.0, 50.0, 34.0, 17.0, 24.0, 11.0, 10.0, 11.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4306640625, -1.3927841186523438, -1.3549041748046875, -1.3170242309570312, -1.279144287109375, -1.2412643432617188, -1.2033843994140625, -1.1655044555664062, -1.12762451171875, -1.0897445678710938, -1.0518646240234375, -1.0139846801757812, -0.976104736328125, -0.9382247924804688, -0.9003448486328125, -0.8624649047851562, -0.8245849609375, -0.7867050170898438, -0.7488250732421875, -0.7109451293945312, -0.673065185546875, -0.6351852416992188, -0.5973052978515625, -0.5594253540039062, -0.52154541015625, -0.48366546630859375, -0.4457855224609375, -0.40790557861328125, -0.370025634765625, -0.33214569091796875, -0.2942657470703125, -0.25638580322265625, -0.218505859375, -0.18062591552734375, -0.1427459716796875, -0.10486602783203125, -0.066986083984375, -0.02910614013671875, 0.0087738037109375, 0.04665374755859375, 0.08453369140625, 0.12241363525390625, 0.1602935791015625, 0.19817352294921875, 0.236053466796875, 0.27393341064453125, 0.3118133544921875, 0.34969329833984375, 0.3875732421875, 0.42545318603515625, 0.4633331298828125, 0.5012130737304688, 0.539093017578125, 0.5769729614257812, 0.6148529052734375, 0.6527328491210938, 0.69061279296875, 0.7284927368164062, 0.7663726806640625, 0.8042526245117188, 0.842132568359375, 0.8800125122070312, 0.9178924560546875, 0.9557723999023438, 0.99365234375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 7.0, 7.0, 24.0, 33.0, 28.0, 31.0, 52.0, 88.0, 89.0, 116.0, 175.0, 246.0, 319.0, 443.0, 710.0, 1134.0, 1854.0, 3552.0, 8652.0, 38904.0, 4073287.0, 45790.0, 9268.0, 3848.0, 1984.0, 1189.0, 719.0, 496.0, 327.0, 232.0, 184.0, 117.0, 73.0, 64.0, 39.0, 36.0, 33.0, 32.0, 26.0, 21.0, 12.0, 6.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.65234375, -6.46514892578125, -6.2779541015625, -6.09075927734375, -5.903564453125, -5.71636962890625, -5.5291748046875, -5.34197998046875, -5.15478515625, -4.96759033203125, -4.7803955078125, -4.59320068359375, -4.406005859375, -4.21881103515625, -4.0316162109375, -3.84442138671875, -3.6572265625, -3.47003173828125, -3.2828369140625, -3.09564208984375, -2.908447265625, -2.72125244140625, -2.5340576171875, -2.34686279296875, -2.15966796875, -1.97247314453125, -1.7852783203125, -1.59808349609375, -1.410888671875, -1.22369384765625, -1.0364990234375, -0.84930419921875, -0.662109375, -0.47491455078125, -0.2877197265625, -0.10052490234375, 0.086669921875, 0.27386474609375, 0.4610595703125, 0.64825439453125, 0.83544921875, 1.02264404296875, 1.2098388671875, 1.39703369140625, 1.584228515625, 1.77142333984375, 1.9586181640625, 2.14581298828125, 2.3330078125, 2.52020263671875, 2.7073974609375, 2.89459228515625, 3.081787109375, 3.26898193359375, 3.4561767578125, 3.64337158203125, 3.83056640625, 4.01776123046875, 4.2049560546875, 4.39215087890625, 4.579345703125, 4.76654052734375, 4.9537353515625, 5.14093017578125, 5.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 6.0, 17.0, 20.0, 46.0, 115.0, 3691.0, 73.0, 35.0, 24.0, 9.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9365234375, -1.8897247314453125, -1.842926025390625, -1.7961273193359375, -1.74932861328125, -1.7025299072265625, -1.655731201171875, -1.6089324951171875, -1.5621337890625, -1.5153350830078125, -1.468536376953125, -1.4217376708984375, -1.37493896484375, -1.3281402587890625, -1.281341552734375, -1.2345428466796875, -1.187744140625, -1.1409454345703125, -1.094146728515625, -1.0473480224609375, -1.00054931640625, -0.9537506103515625, -0.906951904296875, -0.8601531982421875, -0.8133544921875, -0.7665557861328125, -0.719757080078125, -0.6729583740234375, -0.62615966796875, -0.5793609619140625, -0.532562255859375, -0.4857635498046875, -0.43896484375, -0.3921661376953125, -0.345367431640625, -0.2985687255859375, -0.25177001953125, -0.2049713134765625, -0.158172607421875, -0.1113739013671875, -0.0645751953125, -0.0177764892578125, 0.029022216796875, 0.0758209228515625, 0.12261962890625, 0.1694183349609375, 0.216217041015625, 0.2630157470703125, 0.309814453125, 0.3566131591796875, 0.403411865234375, 0.4502105712890625, 0.49700927734375, 0.5438079833984375, 0.590606689453125, 0.6374053955078125, 0.6842041015625, 0.7310028076171875, 0.777801513671875, 0.8246002197265625, 0.87139892578125, 0.9181976318359375, 0.964996337890625, 1.0117950439453125, 1.05859375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 10.0, 23.0, 26.0, 58.0, 73.0, 100.0, 124.0, 134.0, 134.0, 100.0, 83.0, 56.0, 23.0, 17.0, 12.0, 10.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171369552612305, -3.9306156635284424, -3.7440943717956543, -3.557573080062866, -3.371051788330078, -3.18453049659729, -2.998009204864502, -2.811487913131714, -2.624966621398926, -2.4384453296661377, -2.2519240379333496, -2.0654027462005615, -1.8788814544677734, -1.6923601627349854, -1.5058388710021973, -1.3193175792694092, -1.132796287536621, -0.946274995803833, -0.7597537040710449, -0.5732324123382568, -0.38671112060546875, -0.20018982887268066, -0.013668537139892578, 0.1728527545928955, 0.3593740463256836, 0.5458953380584717, 0.7324166297912598, 0.9189379215240479, 1.105459213256836, 1.291980504989624, 1.478501796722412, 1.6650230884552002, 1.8515443801879883, 2.0380656719207764, 2.2245869636535645, 2.4111082553863525, 2.5976295471191406, 2.7841508388519287, 2.970672130584717, 3.157193422317505, 3.343714714050293, 3.530236005783081, 3.716757297515869, 3.9032785892486572, 4.089799880981445, 4.2763214111328125, 4.4628424644470215, 4.6493635177612305, 4.835885047912598, 5.022406578063965, 5.208927631378174, 5.395448684692383, 5.58197021484375, 5.768491744995117, 5.955012798309326, 6.141533851623535, 6.328055381774902, 6.5145769119262695, 6.7010979652404785, 6.8876190185546875, 7.074140548706055, 7.260662078857422, 7.447183132171631, 7.63370418548584, 7.820225715637207]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 6.0, 3.0, 5.0, 10.0, 4.0, 6.0, 6.0, 10.0, 21.0, 16.0, 15.0, 18.0, 27.0, 29.0, 17.0, 36.0, 27.0, 26.0, 41.0, 35.0, 37.0, 45.0, 43.0, 32.0, 42.0, 42.0, 43.0, 51.0, 39.0, 40.0, 35.0, 31.0, 23.0, 23.0, 15.0, 18.0, 14.0, 6.0, 17.0, 14.0, 11.0, 9.0, 9.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7874960899353027, -2.7028729915618896, -2.6182498931884766, -2.5336267948150635, -2.4490036964416504, -2.3643805980682373, -2.279757499694824, -2.195134401321411, -2.110511302947998, -2.025888204574585, -1.9412651062011719, -1.8566420078277588, -1.7720189094543457, -1.6873958110809326, -1.6027727127075195, -1.5181496143341064, -1.433526635169983, -1.3489035367965698, -1.2642804384231567, -1.1796573400497437, -1.0950342416763306, -1.0104111433029175, -0.9257881045341492, -0.8411650061607361, -0.756541907787323, -0.6719188094139099, -0.5872957110404968, -0.5026726722717285, -0.41804954409599304, -0.33342644572257996, -0.24880337715148926, -0.16418027877807617, -0.07955718040466309, 0.005065910518169403, 0.08968900144100189, 0.17431208491325378, 0.25893518328666687, 0.34355828166007996, 0.42818135023117065, 0.5128044486045837, 0.5974275469779968, 0.6820506453514099, 0.766673743724823, 0.8512967824935913, 0.9359198808670044, 1.0205429792404175, 1.1051660776138306, 1.1897891759872437, 1.2744122743606567, 1.3590353727340698, 1.443658471107483, 1.528281569480896, 1.612904667854309, 1.6975277662277222, 1.7821507453918457, 1.8667738437652588, 1.9513969421386719, 2.036020040512085, 2.120643138885498, 2.205266237258911, 2.289889335632324, 2.3745124340057373, 2.4591355323791504, 2.5437586307525635, 2.6283817291259766]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 10.0, 14.0, 18.0, 27.0, 42.0, 48.0, 71.0, 89.0, 159.0, 221.0, 340.0, 580.0, 934.0, 1706.0, 3164.0, 6451.0, 14456.0, 36355.0, 105030.0, 318039.0, 362406.0, 124304.0, 42032.0, 16466.0, 7375.0, 3437.0, 1963.0, 1034.0, 653.0, 353.0, 230.0, 176.0, 108.0, 73.0, 55.0, 44.0, 24.0, 16.0, 14.0, 10.0, 5.0, 4.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.474609375, -2.3974609375, -2.3203125, -2.2431640625, -2.166015625, -2.0888671875, -2.01171875, -1.9345703125, -1.857421875, -1.7802734375, -1.703125, -1.6259765625, -1.548828125, -1.4716796875, -1.39453125, -1.3173828125, -1.240234375, -1.1630859375, -1.0859375, -1.0087890625, -0.931640625, -0.8544921875, -0.77734375, -0.7001953125, -0.623046875, -0.5458984375, -0.46875, -0.3916015625, -0.314453125, -0.2373046875, -0.16015625, -0.0830078125, -0.005859375, 0.0712890625, 0.1484375, 0.2255859375, 0.302734375, 0.3798828125, 0.45703125, 0.5341796875, 0.611328125, 0.6884765625, 0.765625, 0.8427734375, 0.919921875, 0.9970703125, 1.07421875, 1.1513671875, 1.228515625, 1.3056640625, 1.3828125, 1.4599609375, 1.537109375, 1.6142578125, 1.69140625, 1.7685546875, 1.845703125, 1.9228515625, 2.0, 2.0771484375, 2.154296875, 2.2314453125, 2.30859375, 2.3857421875, 2.462890625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 2.0, 4.0, 7.0, 3.0, 11.0, 12.0, 16.0, 24.0, 27.0, 40.0, 56.0, 52.0, 67.0, 81.0, 74.0, 74.0, 84.0, 64.0, 65.0, 47.0, 44.0, 44.0, 34.0, 16.0, 24.0, 13.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.349609375, -1.3076171875, -1.265625, -1.2236328125, -1.181640625, -1.1396484375, -1.09765625, -1.0556640625, -1.013671875, -0.9716796875, -0.9296875, -0.8876953125, -0.845703125, -0.8037109375, -0.76171875, -0.7197265625, -0.677734375, -0.6357421875, -0.59375, -0.5517578125, -0.509765625, -0.4677734375, -0.42578125, -0.3837890625, -0.341796875, -0.2998046875, -0.2578125, -0.2158203125, -0.173828125, -0.1318359375, -0.08984375, -0.0478515625, -0.005859375, 0.0361328125, 0.078125, 0.1201171875, 0.162109375, 0.2041015625, 0.24609375, 0.2880859375, 0.330078125, 0.3720703125, 0.4140625, 0.4560546875, 0.498046875, 0.5400390625, 0.58203125, 0.6240234375, 0.666015625, 0.7080078125, 0.75, 0.7919921875, 0.833984375, 0.8759765625, 0.91796875, 0.9599609375, 1.001953125, 1.0439453125, 1.0859375, 1.1279296875, 1.169921875, 1.2119140625, 1.25390625, 1.2958984375, 1.337890625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 10.0, 11.0, 8.0, 26.0, 33.0, 22.0, 50.0, 66.0, 144.0, 239.0, 355.0, 870.0, 2655.0, 14020.0, 183069.0, 778291.0, 58905.0, 6756.0, 1695.0, 616.0, 258.0, 145.0, 97.0, 69.0, 41.0, 27.0, 19.0, 16.0, 7.0, 7.0, 7.0, 5.0, 7.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4609375, -7.26617431640625, -7.0714111328125, -6.87664794921875, -6.681884765625, -6.48712158203125, -6.2923583984375, -6.09759521484375, -5.90283203125, -5.70806884765625, -5.5133056640625, -5.31854248046875, -5.123779296875, -4.92901611328125, -4.7342529296875, -4.53948974609375, -4.3447265625, -4.14996337890625, -3.9552001953125, -3.76043701171875, -3.565673828125, -3.37091064453125, -3.1761474609375, -2.98138427734375, -2.78662109375, -2.59185791015625, -2.3970947265625, -2.20233154296875, -2.007568359375, -1.81280517578125, -1.6180419921875, -1.42327880859375, -1.228515625, -1.03375244140625, -0.8389892578125, -0.64422607421875, -0.449462890625, -0.25469970703125, -0.0599365234375, 0.13482666015625, 0.32958984375, 0.52435302734375, 0.7191162109375, 0.91387939453125, 1.108642578125, 1.30340576171875, 1.4981689453125, 1.69293212890625, 1.8876953125, 2.08245849609375, 2.2772216796875, 2.47198486328125, 2.666748046875, 2.86151123046875, 3.0562744140625, 3.25103759765625, 3.44580078125, 3.64056396484375, 3.8353271484375, 4.03009033203125, 4.224853515625, 4.41961669921875, 4.6143798828125, 4.80914306640625, 5.00390625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 9.0, 17.0, 20.0, 23.0, 25.0, 27.0, 32.0, 45.0, 50.0, 38.0, 50.0, 39.0, 54.0, 57.0, 55.0, 62.0, 54.0, 46.0, 51.0, 36.0, 33.0, 27.0, 25.0, 29.0, 16.0, 19.0, 10.0, 9.0, 13.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.875, -5.7144775390625, -5.553955078125, -5.3934326171875, -5.23291015625, -5.0723876953125, -4.911865234375, -4.7513427734375, -4.5908203125, -4.4302978515625, -4.269775390625, -4.1092529296875, -3.94873046875, -3.7882080078125, -3.627685546875, -3.4671630859375, -3.306640625, -3.1461181640625, -2.985595703125, -2.8250732421875, -2.66455078125, -2.5040283203125, -2.343505859375, -2.1829833984375, -2.0224609375, -1.8619384765625, -1.701416015625, -1.5408935546875, -1.38037109375, -1.2198486328125, -1.059326171875, -0.8988037109375, -0.73828125, -0.5777587890625, -0.417236328125, -0.2567138671875, -0.09619140625, 0.0643310546875, 0.224853515625, 0.3853759765625, 0.5458984375, 0.7064208984375, 0.866943359375, 1.0274658203125, 1.18798828125, 1.3485107421875, 1.509033203125, 1.6695556640625, 1.830078125, 1.9906005859375, 2.151123046875, 2.3116455078125, 2.47216796875, 2.6326904296875, 2.793212890625, 2.9537353515625, 3.1142578125, 3.2747802734375, 3.435302734375, 3.5958251953125, 3.75634765625, 3.9168701171875, 4.077392578125, 4.2379150390625, 4.3984375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 4.0, 4.0, 6.0, 6.0, 26.0, 28.0, 23.0, 41.0, 79.0, 125.0, 280.0, 826.0, 3692.0, 57772.0, 950439.0, 31197.0, 2792.0, 635.0, 230.0, 127.0, 57.0, 43.0, 28.0, 33.0, 15.0, 13.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.68377685546875, -5.5277099609375, -5.37164306640625, -5.215576171875, -5.05950927734375, -4.9034423828125, -4.74737548828125, -4.59130859375, -4.43524169921875, -4.2791748046875, -4.12310791015625, -3.967041015625, -3.81097412109375, -3.6549072265625, -3.49884033203125, -3.3427734375, -3.18670654296875, -3.0306396484375, -2.87457275390625, -2.718505859375, -2.56243896484375, -2.4063720703125, -2.25030517578125, -2.09423828125, -1.93817138671875, -1.7821044921875, -1.62603759765625, -1.469970703125, -1.31390380859375, -1.1578369140625, -1.00177001953125, -0.845703125, -0.68963623046875, -0.5335693359375, -0.37750244140625, -0.221435546875, -0.06536865234375, 0.0906982421875, 0.24676513671875, 0.40283203125, 0.55889892578125, 0.7149658203125, 0.87103271484375, 1.027099609375, 1.18316650390625, 1.3392333984375, 1.49530029296875, 1.6513671875, 1.80743408203125, 1.9635009765625, 2.11956787109375, 2.275634765625, 2.43170166015625, 2.5877685546875, 2.74383544921875, 2.89990234375, 3.05596923828125, 3.2120361328125, 3.36810302734375, 3.524169921875, 3.68023681640625, 3.8363037109375, 3.99237060546875, 4.1484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 5.0, 13.0, 11.0, 11.0, 23.0, 27.0, 33.0, 59.0, 74.0, 78.0, 123.0, 125.0, 112.0, 84.0, 70.0, 42.0, 33.0, 20.0, 22.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032901763916015625, -0.00031850486993789673, -0.0003079921007156372, -0.0002974793314933777, -0.00028696656227111816, -0.00027645379304885864, -0.0002659410238265991, -0.0002554282546043396, -0.0002449154853820801, -0.00023440271615982056, -0.00022388994693756104, -0.00021337717771530151, -0.000202864408493042, -0.00019235163927078247, -0.00018183887004852295, -0.00017132610082626343, -0.0001608133316040039, -0.00015030056238174438, -0.00013978779315948486, -0.00012927502393722534, -0.00011876225471496582, -0.0001082494854927063, -9.773671627044678e-05, -8.722394704818726e-05, -7.671117782592773e-05, -6.619840860366821e-05, -5.568563938140869e-05, -4.517287015914917e-05, -3.466010093688965e-05, -2.4147331714630127e-05, -1.3634562492370605e-05, -3.121793270111084e-06, 7.3909759521484375e-06, 1.790374517440796e-05, 2.841651439666748e-05, 3.8929283618927e-05, 4.9442052841186523e-05, 5.9954822063446045e-05, 7.046759128570557e-05, 8.098036050796509e-05, 9.149312973022461e-05, 0.00010200589895248413, 0.00011251866817474365, 0.00012303143739700317, 0.0001335442066192627, 0.00014405697584152222, 0.00015456974506378174, 0.00016508251428604126, 0.00017559528350830078, 0.0001861080527305603, 0.00019662082195281982, 0.00020713359117507935, 0.00021764636039733887, 0.0002281591296195984, 0.0002386718988418579, 0.00024918466806411743, 0.00025969743728637695, 0.0002702102065086365, 0.000280722975730896, 0.0002912357449531555, 0.00030174851417541504, 0.00031226128339767456, 0.0003227740526199341, 0.0003332868218421936, 0.0003437995910644531]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 8.0, 5.0, 15.0, 21.0, 38.0, 56.0, 113.0, 177.0, 384.0, 975.0, 3143.0, 21085.0, 692527.0, 313807.0, 12421.0, 2308.0, 776.0, 320.0, 156.0, 88.0, 53.0, 30.0, 16.0, 9.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.822265625, -3.70947265625, -3.5966796875, -3.48388671875, -3.37109375, -3.25830078125, -3.1455078125, -3.03271484375, -2.919921875, -2.80712890625, -2.6943359375, -2.58154296875, -2.46875, -2.35595703125, -2.2431640625, -2.13037109375, -2.017578125, -1.90478515625, -1.7919921875, -1.67919921875, -1.56640625, -1.45361328125, -1.3408203125, -1.22802734375, -1.115234375, -1.00244140625, -0.8896484375, -0.77685546875, -0.6640625, -0.55126953125, -0.4384765625, -0.32568359375, -0.212890625, -0.10009765625, 0.0126953125, 0.12548828125, 0.23828125, 0.35107421875, 0.4638671875, 0.57666015625, 0.689453125, 0.80224609375, 0.9150390625, 1.02783203125, 1.140625, 1.25341796875, 1.3662109375, 1.47900390625, 1.591796875, 1.70458984375, 1.8173828125, 1.93017578125, 2.04296875, 2.15576171875, 2.2685546875, 2.38134765625, 2.494140625, 2.60693359375, 2.7197265625, 2.83251953125, 2.9453125, 3.05810546875, 3.1708984375, 3.28369140625, 3.396484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 5.0, 10.0, 17.0, 18.0, 35.0, 54.0, 87.0, 98.0, 147.0, 161.0, 128.0, 88.0, 65.0, 27.0, 20.0, 19.0, 11.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.279296875, -3.190948486328125, -3.10260009765625, -3.014251708984375, -2.9259033203125, -2.837554931640625, -2.74920654296875, -2.660858154296875, -2.572509765625, -2.484161376953125, -2.39581298828125, -2.307464599609375, -2.2191162109375, -2.130767822265625, -2.04241943359375, -1.954071044921875, -1.86572265625, -1.777374267578125, -1.68902587890625, -1.600677490234375, -1.5123291015625, -1.423980712890625, -1.33563232421875, -1.247283935546875, -1.158935546875, -1.070587158203125, -0.98223876953125, -0.893890380859375, -0.8055419921875, -0.717193603515625, -0.62884521484375, -0.540496826171875, -0.4521484375, -0.363800048828125, -0.27545166015625, -0.187103271484375, -0.0987548828125, -0.010406494140625, 0.07794189453125, 0.166290283203125, 0.254638671875, 0.342987060546875, 0.43133544921875, 0.519683837890625, 0.6080322265625, 0.696380615234375, 0.78472900390625, 0.873077392578125, 0.96142578125, 1.049774169921875, 1.13812255859375, 1.226470947265625, 1.3148193359375, 1.403167724609375, 1.49151611328125, 1.579864501953125, 1.668212890625, 1.756561279296875, 1.84490966796875, 1.933258056640625, 2.0216064453125, 2.109954833984375, 2.19830322265625, 2.286651611328125, 2.375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 26.0, 103.0, 246.0, 370.0, 192.0, 55.0, 10.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.64690399169922, -36.89484786987305, -34.142791748046875, -31.390737533569336, -28.638681411743164, -25.886625289916992, -23.134571075439453, -20.38251495361328, -17.63045883178711, -14.878402709960938, -12.126347541809082, -9.374292373657227, -6.622236251831055, -3.870180130004883, -1.1181259155273438, 1.6339302062988281, 4.385986328125, 7.138041973114014, 9.890097618103027, 12.642152786254883, 15.394208908081055, 18.146265029907227, 20.898319244384766, 23.650375366210938, 26.40243148803711, 29.15448760986328, 31.906543731689453, 34.658599853515625, 37.41065216064453, 40.16271209716797, 42.914764404296875, 45.66682052612305, 48.41886901855469, 51.17092514038086, 53.92298126220703, 56.67503356933594, 59.427093505859375, 62.17914581298828, 64.93119812011719, 67.68325805664062, 70.43531799316406, 73.18737030029297, 75.9394302368164, 78.69148254394531, 81.44354248046875, 84.19559478759766, 86.94764709472656, 89.69970703125, 92.4517593383789, 95.20381164550781, 97.95587158203125, 100.70792388916016, 103.4599838256836, 106.2120361328125, 108.96409606933594, 111.71614837646484, 114.46820068359375, 117.22025299072266, 119.9723129272461, 122.724365234375, 125.47642517089844, 128.22848510742188, 130.98052978515625, 133.7325897216797, 136.48464965820312]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 6.0, 11.0, 14.0, 7.0, 8.0, 19.0, 26.0, 21.0, 33.0, 25.0, 37.0, 38.0, 46.0, 39.0, 56.0, 64.0, 75.0, 49.0, 54.0, 55.0, 42.0, 46.0, 46.0, 34.0, 20.0, 22.0, 23.0, 9.0, 21.0, 11.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.68273162841797, -21.984506607055664, -21.286283493041992, -20.588058471679688, -19.889835357666016, -19.19161033630371, -18.493385314941406, -17.795162200927734, -17.096939086914062, -16.398714065551758, -15.700490951538086, -15.002265930175781, -14.30404281616211, -13.605817794799805, -12.907593727111816, -12.209369659423828, -11.511144638061523, -10.812920570373535, -10.114696502685547, -9.416471481323242, -8.71824836730957, -8.020023345947266, -7.321799278259277, -6.623575210571289, -5.925351142883301, -5.2271270751953125, -4.528903007507324, -3.8306784629821777, -3.1324543952941895, -2.434230327606201, -1.7360057830810547, -1.0377817153930664, -0.3395576477050781, 0.3586665391921997, 1.0568907260894775, 1.755115032196045, 2.453339099884033, 3.1515631675720215, 3.849787712097168, 4.548011779785156, 5.2462358474731445, 5.944459915161133, 6.642683982849121, 7.340908527374268, 8.039133071899414, 8.737356185913086, 9.43558120727539, 10.133805274963379, 10.832029342651367, 11.530253410339355, 12.228477478027344, 12.926702499389648, 13.62492561340332, 14.323150634765625, 15.021374702453613, 15.719598770141602, 16.417823791503906, 17.11604881286621, 17.814271926879883, 18.512496948242188, 19.21072006225586, 19.908945083618164, 20.60717010498047, 21.30539321899414, 22.003616333007812]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 1.0, 6.0, 8.0, 16.0, 24.0, 31.0, 69.0, 102.0, 159.0, 265.0, 537.0, 1112.0, 3017.0, 10056.0, 382589.0, 3780263.0, 10722.0, 2932.0, 1159.0, 530.0, 243.0, 155.0, 93.0, 54.0, 39.0, 28.0, 18.0, 14.0, 3.0, 9.0, 7.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.05029296875, -6.8154296875, -6.58056640625, -6.345703125, -6.11083984375, -5.8759765625, -5.64111328125, -5.40625, -5.17138671875, -4.9365234375, -4.70166015625, -4.466796875, -4.23193359375, -3.9970703125, -3.76220703125, -3.52734375, -3.29248046875, -3.0576171875, -2.82275390625, -2.587890625, -2.35302734375, -2.1181640625, -1.88330078125, -1.6484375, -1.41357421875, -1.1787109375, -0.94384765625, -0.708984375, -0.47412109375, -0.2392578125, -0.00439453125, 0.23046875, 0.46533203125, 0.7001953125, 0.93505859375, 1.169921875, 1.40478515625, 1.6396484375, 1.87451171875, 2.109375, 2.34423828125, 2.5791015625, 2.81396484375, 3.048828125, 3.28369140625, 3.5185546875, 3.75341796875, 3.98828125, 4.22314453125, 4.4580078125, 4.69287109375, 4.927734375, 5.16259765625, 5.3974609375, 5.63232421875, 5.8671875, 6.10205078125, 6.3369140625, 6.57177734375, 6.806640625, 7.04150390625, 7.2763671875, 7.51123046875, 7.74609375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 6.0, 12.0, 12.0, 17.0, 15.0, 23.0, 34.0, 46.0, 54.0, 49.0, 82.0, 76.0, 79.0, 81.0, 61.0, 74.0, 56.0, 48.0, 46.0, 28.0, 20.0, 21.0, 16.0, 8.0, 3.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4384765625, -1.3957366943359375, -1.352996826171875, -1.3102569580078125, -1.26751708984375, -1.2247772216796875, -1.182037353515625, -1.1392974853515625, -1.0965576171875, -1.0538177490234375, -1.011077880859375, -0.9683380126953125, -0.92559814453125, -0.8828582763671875, -0.840118408203125, -0.7973785400390625, -0.754638671875, -0.7118988037109375, -0.669158935546875, -0.6264190673828125, -0.58367919921875, -0.5409393310546875, -0.498199462890625, -0.4554595947265625, -0.4127197265625, -0.3699798583984375, -0.327239990234375, -0.2845001220703125, -0.24176025390625, -0.1990203857421875, -0.156280517578125, -0.1135406494140625, -0.07080078125, -0.0280609130859375, 0.014678955078125, 0.0574188232421875, 0.10015869140625, 0.1428985595703125, 0.185638427734375, 0.2283782958984375, 0.2711181640625, 0.3138580322265625, 0.356597900390625, 0.3993377685546875, 0.44207763671875, 0.4848175048828125, 0.527557373046875, 0.5702972412109375, 0.613037109375, 0.6557769775390625, 0.698516845703125, 0.7412567138671875, 0.78399658203125, 0.8267364501953125, 0.869476318359375, 0.9122161865234375, 0.9549560546875, 0.9976959228515625, 1.040435791015625, 1.0831756591796875, 1.12591552734375, 1.1686553955078125, 1.211395263671875, 1.2541351318359375, 1.296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 5.0, 8.0, 7.0, 10.0, 12.0, 23.0, 20.0, 37.0, 59.0, 77.0, 105.0, 122.0, 182.0, 286.0, 357.0, 480.0, 691.0, 1020.0, 1606.0, 2339.0, 3626.0, 6008.0, 11599.0, 25829.0, 87407.0, 3773338.0, 202805.0, 39630.0, 15511.0, 7770.0, 4479.0, 2787.0, 1899.0, 1215.0, 857.0, 606.0, 396.0, 317.0, 202.0, 159.0, 106.0, 98.0, 58.0, 38.0, 36.0, 22.0, 14.0, 15.0, 7.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.185546875, -2.111968994140625, -2.03839111328125, -1.964813232421875, -1.8912353515625, -1.817657470703125, -1.74407958984375, -1.670501708984375, -1.596923828125, -1.523345947265625, -1.44976806640625, -1.376190185546875, -1.3026123046875, -1.229034423828125, -1.15545654296875, -1.081878662109375, -1.00830078125, -0.934722900390625, -0.86114501953125, -0.787567138671875, -0.7139892578125, -0.640411376953125, -0.56683349609375, -0.493255615234375, -0.419677734375, -0.346099853515625, -0.27252197265625, -0.198944091796875, -0.1253662109375, -0.051788330078125, 0.02178955078125, 0.095367431640625, 0.1689453125, 0.242523193359375, 0.31610107421875, 0.389678955078125, 0.4632568359375, 0.536834716796875, 0.61041259765625, 0.683990478515625, 0.757568359375, 0.831146240234375, 0.90472412109375, 0.978302001953125, 1.0518798828125, 1.125457763671875, 1.19903564453125, 1.272613525390625, 1.34619140625, 1.419769287109375, 1.49334716796875, 1.566925048828125, 1.6405029296875, 1.714080810546875, 1.78765869140625, 1.861236572265625, 1.934814453125, 2.008392333984375, 2.08197021484375, 2.155548095703125, 2.2291259765625, 2.302703857421875, 2.37628173828125, 2.449859619140625, 2.5234375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 6.0, 11.0, 3.0, 12.0, 16.0, 16.0, 36.0, 37.0, 98.0, 260.0, 3104.0, 204.0, 91.0, 52.0, 33.0, 21.0, 9.0, 13.0, 8.0, 6.0, 5.0, 8.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.56640625, -1.5180816650390625, -1.469757080078125, -1.4214324951171875, -1.37310791015625, -1.3247833251953125, -1.276458740234375, -1.2281341552734375, -1.1798095703125, -1.1314849853515625, -1.083160400390625, -1.0348358154296875, -0.98651123046875, -0.9381866455078125, -0.889862060546875, -0.8415374755859375, -0.793212890625, -0.7448883056640625, -0.696563720703125, -0.6482391357421875, -0.59991455078125, -0.5515899658203125, -0.503265380859375, -0.4549407958984375, -0.4066162109375, -0.3582916259765625, -0.309967041015625, -0.2616424560546875, -0.21331787109375, -0.1649932861328125, -0.116668701171875, -0.0683441162109375, -0.02001953125, 0.0283050537109375, 0.076629638671875, 0.1249542236328125, 0.17327880859375, 0.2216033935546875, 0.269927978515625, 0.3182525634765625, 0.3665771484375, 0.4149017333984375, 0.463226318359375, 0.5115509033203125, 0.55987548828125, 0.6082000732421875, 0.656524658203125, 0.7048492431640625, 0.753173828125, 0.8014984130859375, 0.849822998046875, 0.8981475830078125, 0.94647216796875, 0.9947967529296875, 1.043121337890625, 1.0914459228515625, 1.1397705078125, 1.1880950927734375, 1.236419677734375, 1.2847442626953125, 1.33306884765625, 1.3813934326171875, 1.429718017578125, 1.4780426025390625, 1.5263671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 6.0, 16.0, 44.0, 85.0, 212.0, 248.0, 174.0, 93.0, 62.0, 26.0, 8.0, 11.0, 4.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.936712265014648, -10.510978698730469, -10.085244178771973, -9.659510612487793, -9.233777046203613, -8.808042526245117, -8.382308959960938, -7.956575393676758, -7.53084135055542, -7.105107307434082, -6.679373741149902, -6.2536396980285645, -5.827905654907227, -5.402172088623047, -4.976438045501709, -4.550704002380371, -4.124970436096191, -3.6992366313934326, -3.273502826690674, -2.847768783569336, -2.422034978866577, -1.9963011741638184, -1.5705671310424805, -1.1448333263397217, -0.7190995216369629, -0.2933656573295593, 0.13236820697784424, 0.5581021308898926, 0.9838359355926514, 1.4095697402954102, 1.835303783416748, 2.261037588119507, 2.6867713928222656, 3.1125051975250244, 3.538239002227783, 3.963973045349121, 4.389706611633301, 4.815440654754639, 5.241174697875977, 5.666908264160156, 6.092642307281494, 6.518376350402832, 6.944109916687012, 7.36984395980835, 7.7955780029296875, 8.221311569213867, 8.647045135498047, 9.072779655456543, 9.498513221740723, 9.924246788024902, 10.349981307983398, 10.775714874267578, 11.201448440551758, 11.627182006835938, 12.052916526794434, 12.478650093078613, 12.90438461303711, 13.330118179321289, 13.755852699279785, 14.181586265563965, 14.607319831848145, 15.03305435180664, 15.45878791809082, 15.884521484375, 16.31025505065918]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 8.0, 12.0, 9.0, 9.0, 15.0, 19.0, 25.0, 20.0, 21.0, 25.0, 23.0, 34.0, 32.0, 36.0, 31.0, 31.0, 33.0, 30.0, 47.0, 43.0, 26.0, 37.0, 34.0, 36.0, 34.0, 30.0, 37.0, 27.0, 29.0, 34.0, 26.0, 18.0, 24.0, 13.0, 19.0, 15.0, 11.0, 5.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.657516956329346, -4.501657009124756, -4.345797538757324, -4.189937591552734, -4.0340776443481445, -3.878217935562134, -3.722358226776123, -3.566498279571533, -3.4106385707855225, -3.2547788619995117, -3.098918914794922, -2.943059206008911, -2.7871994972229004, -2.6313395500183105, -2.4754798412323, -2.319620132446289, -2.163760185241699, -2.0079004764556885, -1.8520405292510986, -1.696180820465088, -1.5403209924697876, -1.3844611644744873, -1.2286014556884766, -1.0727416276931763, -0.916881799697876, -0.7610219717025757, -0.6051622033119202, -0.44930240511894226, -0.29344260692596436, -0.13758277893066406, 0.018276989459991455, 0.17413675785064697, 0.32999658584594727, 0.48585638403892517, 0.6417161822319031, 0.7975759506225586, 0.9534357786178589, 1.1092956066131592, 1.26515531539917, 1.4210151433944702, 1.5768749713897705, 1.7327347993850708, 1.888594627380371, 2.044454336166382, 2.2003140449523926, 2.3561739921569824, 2.512033700942993, 2.667893409729004, 2.8237533569335938, 2.9796130657196045, 3.1354730129241943, 3.291332721710205, 3.447192668914795, 3.6030523777008057, 3.7589120864868164, 3.9147720336914062, 4.070631980895996, 4.226491928100586, 4.382351398468018, 4.538211345672607, 4.694071292877197, 4.849930763244629, 5.005790710449219, 5.161650657653809, 5.31751012802124]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 6.0, 15.0, 23.0, 29.0, 32.0, 47.0, 74.0, 120.0, 213.0, 284.0, 545.0, 930.0, 1750.0, 3602.0, 8228.0, 21097.0, 60085.0, 188393.0, 421328.0, 226184.0, 72592.0, 24821.0, 9532.0, 3966.0, 2018.0, 1065.0, 607.0, 334.0, 200.0, 122.0, 97.0, 49.0, 54.0, 23.0, 27.0, 13.0, 7.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.673828125, -2.594207763671875, -2.51458740234375, -2.434967041015625, -2.3553466796875, -2.275726318359375, -2.19610595703125, -2.116485595703125, -2.036865234375, -1.957244873046875, -1.87762451171875, -1.798004150390625, -1.7183837890625, -1.638763427734375, -1.55914306640625, -1.479522705078125, -1.39990234375, -1.320281982421875, -1.24066162109375, -1.161041259765625, -1.0814208984375, -1.001800537109375, -0.92218017578125, -0.842559814453125, -0.762939453125, -0.683319091796875, -0.60369873046875, -0.524078369140625, -0.4444580078125, -0.364837646484375, -0.28521728515625, -0.205596923828125, -0.1259765625, -0.046356201171875, 0.03326416015625, 0.112884521484375, 0.1925048828125, 0.272125244140625, 0.35174560546875, 0.431365966796875, 0.510986328125, 0.590606689453125, 0.67022705078125, 0.749847412109375, 0.8294677734375, 0.909088134765625, 0.98870849609375, 1.068328857421875, 1.14794921875, 1.227569580078125, 1.30718994140625, 1.386810302734375, 1.4664306640625, 1.546051025390625, 1.62567138671875, 1.705291748046875, 1.784912109375, 1.864532470703125, 1.94415283203125, 2.023773193359375, 2.1033935546875, 2.183013916015625, 2.26263427734375, 2.342254638671875, 2.421875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 6.0, 15.0, 13.0, 15.0, 29.0, 36.0, 33.0, 52.0, 45.0, 62.0, 63.0, 73.0, 81.0, 68.0, 58.0, 60.0, 65.0, 48.0, 32.0, 37.0, 30.0, 17.0, 12.0, 11.0, 6.0, 7.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.9970703125, -1.948822021484375, -1.90057373046875, -1.852325439453125, -1.8040771484375, -1.755828857421875, -1.70758056640625, -1.659332275390625, -1.611083984375, -1.562835693359375, -1.51458740234375, -1.466339111328125, -1.4180908203125, -1.369842529296875, -1.32159423828125, -1.273345947265625, -1.22509765625, -1.176849365234375, -1.12860107421875, -1.080352783203125, -1.0321044921875, -0.983856201171875, -0.93560791015625, -0.887359619140625, -0.839111328125, -0.790863037109375, -0.74261474609375, -0.694366455078125, -0.6461181640625, -0.597869873046875, -0.54962158203125, -0.501373291015625, -0.453125, -0.404876708984375, -0.35662841796875, -0.308380126953125, -0.2601318359375, -0.211883544921875, -0.16363525390625, -0.115386962890625, -0.067138671875, -0.018890380859375, 0.02935791015625, 0.077606201171875, 0.1258544921875, 0.174102783203125, 0.22235107421875, 0.270599365234375, 0.31884765625, 0.367095947265625, 0.41534423828125, 0.463592529296875, 0.5118408203125, 0.560089111328125, 0.60833740234375, 0.656585693359375, 0.704833984375, 0.753082275390625, 0.80133056640625, 0.849578857421875, 0.8978271484375, 0.946075439453125, 0.99432373046875, 1.042572021484375, 1.0908203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 6.0, 10.0, 16.0, 22.0, 38.0, 43.0, 74.0, 117.0, 168.0, 378.0, 720.0, 1876.0, 6282.0, 39692.0, 549628.0, 409751.0, 31115.0, 5488.0, 1543.0, 652.0, 357.0, 200.0, 119.0, 72.0, 51.0, 31.0, 26.0, 20.0, 14.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9921875, -4.8197021484375, -4.647216796875, -4.4747314453125, -4.30224609375, -4.1297607421875, -3.957275390625, -3.7847900390625, -3.6123046875, -3.4398193359375, -3.267333984375, -3.0948486328125, -2.92236328125, -2.7498779296875, -2.577392578125, -2.4049072265625, -2.232421875, -2.0599365234375, -1.887451171875, -1.7149658203125, -1.54248046875, -1.3699951171875, -1.197509765625, -1.0250244140625, -0.8525390625, -0.6800537109375, -0.507568359375, -0.3350830078125, -0.16259765625, 0.0098876953125, 0.182373046875, 0.3548583984375, 0.52734375, 0.6998291015625, 0.872314453125, 1.0447998046875, 1.21728515625, 1.3897705078125, 1.562255859375, 1.7347412109375, 1.9072265625, 2.0797119140625, 2.252197265625, 2.4246826171875, 2.59716796875, 2.7696533203125, 2.942138671875, 3.1146240234375, 3.287109375, 3.4595947265625, 3.632080078125, 3.8045654296875, 3.97705078125, 4.1495361328125, 4.322021484375, 4.4945068359375, 4.6669921875, 4.8394775390625, 5.011962890625, 5.1844482421875, 5.35693359375, 5.5294189453125, 5.701904296875, 5.8743896484375, 6.046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 12.0, 18.0, 26.0, 26.0, 36.0, 58.0, 63.0, 76.0, 73.0, 92.0, 73.0, 72.0, 83.0, 73.0, 48.0, 38.0, 34.0, 26.0, 17.0, 17.0, 11.0, 7.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.6590576171875, -7.404052734375, -7.1490478515625, -6.89404296875, -6.6390380859375, -6.384033203125, -6.1290283203125, -5.8740234375, -5.6190185546875, -5.364013671875, -5.1090087890625, -4.85400390625, -4.5989990234375, -4.343994140625, -4.0889892578125, -3.833984375, -3.5789794921875, -3.323974609375, -3.0689697265625, -2.81396484375, -2.5589599609375, -2.303955078125, -2.0489501953125, -1.7939453125, -1.5389404296875, -1.283935546875, -1.0289306640625, -0.77392578125, -0.5189208984375, -0.263916015625, -0.0089111328125, 0.24609375, 0.5010986328125, 0.756103515625, 1.0111083984375, 1.26611328125, 1.5211181640625, 1.776123046875, 2.0311279296875, 2.2861328125, 2.5411376953125, 2.796142578125, 3.0511474609375, 3.30615234375, 3.5611572265625, 3.816162109375, 4.0711669921875, 4.326171875, 4.5811767578125, 4.836181640625, 5.0911865234375, 5.34619140625, 5.6011962890625, 5.856201171875, 6.1112060546875, 6.3662109375, 6.6212158203125, 6.876220703125, 7.1312255859375, 7.38623046875, 7.6412353515625, 7.896240234375, 8.1512451171875, 8.40625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 10.0, 15.0, 24.0, 40.0, 70.0, 127.0, 235.0, 600.0, 2253.0, 18695.0, 630876.0, 380174.0, 12580.0, 1861.0, 522.0, 188.0, 108.0, 70.0, 23.0, 22.0, 21.0, 16.0, 7.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.978515625, -2.897857666015625, -2.81719970703125, -2.736541748046875, -2.6558837890625, -2.575225830078125, -2.49456787109375, -2.413909912109375, -2.333251953125, -2.252593994140625, -2.17193603515625, -2.091278076171875, -2.0106201171875, -1.929962158203125, -1.84930419921875, -1.768646240234375, -1.68798828125, -1.607330322265625, -1.52667236328125, -1.446014404296875, -1.3653564453125, -1.284698486328125, -1.20404052734375, -1.123382568359375, -1.042724609375, -0.962066650390625, -0.88140869140625, -0.800750732421875, -0.7200927734375, -0.639434814453125, -0.55877685546875, -0.478118896484375, -0.3974609375, -0.316802978515625, -0.23614501953125, -0.155487060546875, -0.0748291015625, 0.005828857421875, 0.08648681640625, 0.167144775390625, 0.247802734375, 0.328460693359375, 0.40911865234375, 0.489776611328125, 0.5704345703125, 0.651092529296875, 0.73175048828125, 0.812408447265625, 0.89306640625, 0.973724365234375, 1.05438232421875, 1.135040283203125, 1.2156982421875, 1.296356201171875, 1.37701416015625, 1.457672119140625, 1.538330078125, 1.618988037109375, 1.69964599609375, 1.780303955078125, 1.8609619140625, 1.941619873046875, 2.02227783203125, 2.102935791015625, 2.18359375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 11.0, 22.0, 29.0, 28.0, 33.0, 56.0, 62.0, 83.0, 98.0, 96.0, 97.0, 75.0, 57.0, 50.0, 44.0, 29.0, 27.0, 8.0, 20.0, 13.0, 11.0, 9.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025582313537597656, -0.00024836696684360504, -0.00024091079831123352, -0.000233454629778862, -0.00022599846124649048, -0.00021854229271411896, -0.00021108612418174744, -0.00020362995564937592, -0.0001961737871170044, -0.00018871761858463287, -0.00018126145005226135, -0.00017380528151988983, -0.0001663491129875183, -0.0001588929444551468, -0.00015143677592277527, -0.00014398060739040375, -0.00013652443885803223, -0.0001290682703256607, -0.00012161210179328918, -0.00011415593326091766, -0.00010669976472854614, -9.924359619617462e-05, -9.17874276638031e-05, -8.433125913143158e-05, -7.687509059906006e-05, -6.941892206668854e-05, -6.196275353431702e-05, -5.4506585001945496e-05, -4.7050416469573975e-05, -3.9594247937202454e-05, -3.213807940483093e-05, -2.468191087245941e-05, -1.722574234008789e-05, -9.76957380771637e-06, -2.3134052753448486e-06, 5.142763257026672e-06, 1.2598931789398193e-05, 2.0055100321769714e-05, 2.7511268854141235e-05, 3.4967437386512756e-05, 4.242360591888428e-05, 4.98797744512558e-05, 5.733594298362732e-05, 6.479211151599884e-05, 7.224828004837036e-05, 7.970444858074188e-05, 8.71606171131134e-05, 9.461678564548492e-05, 0.00010207295417785645, 0.00010952912271022797, 0.00011698529124259949, 0.000124441459774971, 0.00013189762830734253, 0.00013935379683971405, 0.00014680996537208557, 0.0001542661339044571, 0.0001617223024368286, 0.00016917847096920013, 0.00017663463950157166, 0.00018409080803394318, 0.0001915469765663147, 0.00019900314509868622, 0.00020645931363105774, 0.00021391548216342926, 0.00022137165069580078]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 11.0, 18.0, 35.0, 48.0, 111.0, 198.0, 398.0, 1191.0, 6655.0, 133986.0, 863880.0, 37313.0, 3305.0, 804.0, 285.0, 133.0, 72.0, 50.0, 22.0, 17.0, 9.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.503082275390625, -1.41632080078125, -1.329559326171875, -1.2427978515625, -1.156036376953125, -1.06927490234375, -0.982513427734375, -0.895751953125, -0.808990478515625, -0.72222900390625, -0.635467529296875, -0.5487060546875, -0.461944580078125, -0.37518310546875, -0.288421630859375, -0.20166015625, -0.114898681640625, -0.02813720703125, 0.058624267578125, 0.1453857421875, 0.232147216796875, 0.31890869140625, 0.405670166015625, 0.492431640625, 0.579193115234375, 0.66595458984375, 0.752716064453125, 0.8394775390625, 0.926239013671875, 1.01300048828125, 1.099761962890625, 1.1865234375, 1.273284912109375, 1.36004638671875, 1.446807861328125, 1.5335693359375, 1.620330810546875, 1.70709228515625, 1.793853759765625, 1.880615234375, 1.967376708984375, 2.05413818359375, 2.140899658203125, 2.2276611328125, 2.314422607421875, 2.40118408203125, 2.487945556640625, 2.57470703125, 2.661468505859375, 2.74822998046875, 2.834991455078125, 2.9217529296875, 3.008514404296875, 3.09527587890625, 3.182037353515625, 3.268798828125, 3.355560302734375, 3.44232177734375, 3.529083251953125, 3.6158447265625, 3.702606201171875, 3.78936767578125, 3.876129150390625, 3.962890625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 4.0, 7.0, 10.0, 9.0, 17.0, 22.0, 22.0, 45.0, 41.0, 65.0, 76.0, 108.0, 87.0, 94.0, 75.0, 82.0, 48.0, 42.0, 33.0, 31.0, 26.0, 11.0, 12.0, 13.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.94921875, -1.8967132568359375, -1.844207763671875, -1.7917022705078125, -1.73919677734375, -1.6866912841796875, -1.634185791015625, -1.5816802978515625, -1.5291748046875, -1.4766693115234375, -1.424163818359375, -1.3716583251953125, -1.31915283203125, -1.2666473388671875, -1.214141845703125, -1.1616363525390625, -1.109130859375, -1.0566253662109375, -1.004119873046875, -0.9516143798828125, -0.89910888671875, -0.8466033935546875, -0.794097900390625, -0.7415924072265625, -0.6890869140625, -0.6365814208984375, -0.584075927734375, -0.5315704345703125, -0.47906494140625, -0.4265594482421875, -0.374053955078125, -0.3215484619140625, -0.26904296875, -0.2165374755859375, -0.164031982421875, -0.1115264892578125, -0.05902099609375, -0.0065155029296875, 0.045989990234375, 0.0984954833984375, 0.1510009765625, 0.2035064697265625, 0.256011962890625, 0.3085174560546875, 0.36102294921875, 0.4135284423828125, 0.466033935546875, 0.5185394287109375, 0.571044921875, 0.6235504150390625, 0.676055908203125, 0.7285614013671875, 0.78106689453125, 0.8335723876953125, 0.886077880859375, 0.9385833740234375, 0.9910888671875, 1.0435943603515625, 1.096099853515625, 1.1486053466796875, 1.20111083984375, 1.2536163330078125, 1.306121826171875, 1.3586273193359375, 1.4111328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 18.0, 70.0, 111.0, 187.0, 201.0, 189.0, 105.0, 63.0, 30.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.119056701660156, -47.69866180419922, -46.27827072143555, -44.85787582397461, -43.43748474121094, -42.01708984375, -40.59669876098633, -39.17630386352539, -37.75591278076172, -36.33551788330078, -34.91512680053711, -33.49473190307617, -32.0743408203125, -30.653947830200195, -29.23355484008789, -27.813159942626953, -26.39276695251465, -24.972373962402344, -23.55198097229004, -22.131587982177734, -20.71119499206543, -19.290802001953125, -17.870407104492188, -16.450016021728516, -15.029622077941895, -13.60922908782959, -12.188836097717285, -10.768442153930664, -9.34804916381836, -7.927656650543213, -6.50726318359375, -5.086870193481445, -3.6664772033691406, -2.246084213256836, -0.8256909847259521, 0.5947022438049316, 2.0150952339172363, 3.435488224029541, 4.855881690979004, 6.276274681091309, 7.696667671203613, 9.117060661315918, 10.537453651428223, 11.957847595214844, 13.378240585327148, 14.798633575439453, 16.219026565551758, 17.639419555664062, 19.059812545776367, 20.480205535888672, 21.900598526000977, 23.32099151611328, 24.741384506225586, 26.16177749633789, 27.582172393798828, 29.0025634765625, 30.422958374023438, 31.843351364135742, 33.26374435424805, 34.684139251708984, 36.104530334472656, 37.524925231933594, 38.945316314697266, 40.3657112121582, 41.786102294921875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 7.0, 8.0, 2.0, 6.0, 14.0, 19.0, 14.0, 13.0, 27.0, 25.0, 25.0, 34.0, 33.0, 38.0, 34.0, 44.0, 40.0, 58.0, 47.0, 59.0, 46.0, 47.0, 37.0, 44.0, 24.0, 36.0, 38.0, 32.0, 27.0, 24.0, 19.0, 16.0, 9.0, 8.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-20.249895095825195, -19.588411331176758, -18.926929473876953, -18.265445709228516, -17.603961944580078, -16.94247817993164, -16.280996322631836, -15.619512557983398, -14.958029747009277, -14.296546936035156, -13.635063171386719, -12.973580360412598, -12.312097549438477, -11.650613784790039, -10.989130973815918, -10.327648162841797, -9.66616439819336, -9.004681587219238, -8.3431978225708, -7.68171501159668, -7.0202317237854, -6.358748435974121, -5.697265625, -5.035782337188721, -4.374299049377441, -3.712815761566162, -3.051332712173462, -2.3898496627807617, -1.7283663749694824, -1.0668830871582031, -0.40540003776550293, 0.25608301162719727, 0.9175643920898438, 1.5790475606918335, 2.2405307292938232, 2.9020137786865234, 3.5634970664978027, 4.224980354309082, 4.886463165283203, 5.547946453094482, 6.209429740905762, 6.870913028717041, 7.53239631652832, 8.193879127502441, 8.855361938476562, 9.516845703125, 10.178328514099121, 10.839811325073242, 11.50129508972168, 12.1627779006958, 12.824261665344238, 13.48574447631836, 14.147228240966797, 14.808711051940918, 15.470193862915039, 16.131677627563477, 16.79315948486328, 17.45464324951172, 18.116125106811523, 18.77760887145996, 19.4390926361084, 20.100574493408203, 20.76205825805664, 21.423542022705078, 22.085025787353516]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 3.0, 4.0, 7.0, 9.0, 4.0, 10.0, 18.0, 24.0, 26.0, 30.0, 47.0, 83.0, 97.0, 232.0, 401.0, 842.0, 1881.0, 4446.0, 11375.0, 35465.0, 206976.0, 3555853.0, 310141.0, 44418.0, 13203.0, 4908.0, 1982.0, 851.0, 414.0, 233.0, 106.0, 74.0, 37.0, 16.0, 24.0, 9.0, 9.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.71875, -2.63775634765625, -2.5567626953125, -2.47576904296875, -2.394775390625, -2.31378173828125, -2.2327880859375, -2.15179443359375, -2.07080078125, -1.98980712890625, -1.9088134765625, -1.82781982421875, -1.746826171875, -1.66583251953125, -1.5848388671875, -1.50384521484375, -1.4228515625, -1.34185791015625, -1.2608642578125, -1.17987060546875, -1.098876953125, -1.01788330078125, -0.9368896484375, -0.85589599609375, -0.77490234375, -0.69390869140625, -0.6129150390625, -0.53192138671875, -0.450927734375, -0.36993408203125, -0.2889404296875, -0.20794677734375, -0.126953125, -0.04595947265625, 0.0350341796875, 0.11602783203125, 0.197021484375, 0.27801513671875, 0.3590087890625, 0.44000244140625, 0.52099609375, 0.60198974609375, 0.6829833984375, 0.76397705078125, 0.844970703125, 0.92596435546875, 1.0069580078125, 1.08795166015625, 1.1689453125, 1.24993896484375, 1.3309326171875, 1.41192626953125, 1.492919921875, 1.57391357421875, 1.6549072265625, 1.73590087890625, 1.81689453125, 1.89788818359375, 1.9788818359375, 2.05987548828125, 2.140869140625, 2.22186279296875, 2.3028564453125, 2.38385009765625, 2.46484375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 8.0, 10.0, 3.0, 19.0, 23.0, 25.0, 34.0, 54.0, 51.0, 48.0, 59.0, 64.0, 81.0, 80.0, 70.0, 60.0, 61.0, 57.0, 45.0, 45.0, 22.0, 22.0, 14.0, 18.0, 8.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.82421875, -1.7809219360351562, -1.7376251220703125, -1.6943283081054688, -1.651031494140625, -1.6077346801757812, -1.5644378662109375, -1.5211410522460938, -1.47784423828125, -1.4345474243164062, -1.3912506103515625, -1.3479537963867188, -1.304656982421875, -1.2613601684570312, -1.2180633544921875, -1.1747665405273438, -1.1314697265625, -1.0881729125976562, -1.0448760986328125, -1.0015792846679688, -0.958282470703125, -0.9149856567382812, -0.8716888427734375, -0.8283920288085938, -0.78509521484375, -0.7417984008789062, -0.6985015869140625, -0.6552047729492188, -0.611907958984375, -0.5686111450195312, -0.5253143310546875, -0.48201751708984375, -0.438720703125, -0.39542388916015625, -0.3521270751953125, -0.30883026123046875, -0.265533447265625, -0.22223663330078125, -0.1789398193359375, -0.13564300537109375, -0.09234619140625, -0.04904937744140625, -0.0057525634765625, 0.03754425048828125, 0.080841064453125, 0.12413787841796875, 0.1674346923828125, 0.21073150634765625, 0.2540283203125, 0.29732513427734375, 0.3406219482421875, 0.38391876220703125, 0.427215576171875, 0.47051239013671875, 0.5138092041015625, 0.5571060180664062, 0.60040283203125, 0.6436996459960938, 0.6869964599609375, 0.7302932739257812, 0.773590087890625, 0.8168869018554688, 0.8601837158203125, 0.9034805297851562, 0.94677734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 8.0, 7.0, 7.0, 15.0, 20.0, 23.0, 37.0, 64.0, 61.0, 111.0, 184.0, 313.0, 487.0, 846.0, 1679.0, 3822.0, 9104.0, 25507.0, 91086.0, 1024587.0, 2842597.0, 139170.0, 33723.0, 11568.0, 4606.0, 1999.0, 1047.0, 581.0, 354.0, 231.0, 149.0, 96.0, 45.0, 42.0, 28.0, 26.0, 13.0, 8.0, 6.0, 13.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.396484375, -2.31695556640625, -2.2374267578125, -2.15789794921875, -2.078369140625, -1.99884033203125, -1.9193115234375, -1.83978271484375, -1.76025390625, -1.68072509765625, -1.6011962890625, -1.52166748046875, -1.442138671875, -1.36260986328125, -1.2830810546875, -1.20355224609375, -1.1240234375, -1.04449462890625, -0.9649658203125, -0.88543701171875, -0.805908203125, -0.72637939453125, -0.6468505859375, -0.56732177734375, -0.48779296875, -0.40826416015625, -0.3287353515625, -0.24920654296875, -0.169677734375, -0.09014892578125, -0.0106201171875, 0.06890869140625, 0.1484375, 0.22796630859375, 0.3074951171875, 0.38702392578125, 0.466552734375, 0.54608154296875, 0.6256103515625, 0.70513916015625, 0.78466796875, 0.86419677734375, 0.9437255859375, 1.02325439453125, 1.102783203125, 1.18231201171875, 1.2618408203125, 1.34136962890625, 1.4208984375, 1.50042724609375, 1.5799560546875, 1.65948486328125, 1.739013671875, 1.81854248046875, 1.8980712890625, 1.97760009765625, 2.05712890625, 2.13665771484375, 2.2161865234375, 2.29571533203125, 2.375244140625, 2.45477294921875, 2.5343017578125, 2.61383056640625, 2.693359375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 12.0, 13.0, 17.0, 25.0, 40.0, 65.0, 92.0, 155.0, 339.0, 936.0, 1457.0, 499.0, 198.0, 72.0, 49.0, 29.0, 23.0, 15.0, 8.0, 6.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.454376220703125, -3.31695556640625, -3.179534912109375, -3.0421142578125, -2.904693603515625, -2.76727294921875, -2.629852294921875, -2.492431640625, -2.355010986328125, -2.21759033203125, -2.080169677734375, -1.9427490234375, -1.805328369140625, -1.66790771484375, -1.530487060546875, -1.39306640625, -1.255645751953125, -1.11822509765625, -0.980804443359375, -0.8433837890625, -0.705963134765625, -0.56854248046875, -0.431121826171875, -0.293701171875, -0.156280517578125, -0.01885986328125, 0.118560791015625, 0.2559814453125, 0.393402099609375, 0.53082275390625, 0.668243408203125, 0.8056640625, 0.943084716796875, 1.08050537109375, 1.217926025390625, 1.3553466796875, 1.492767333984375, 1.63018798828125, 1.767608642578125, 1.905029296875, 2.042449951171875, 2.17987060546875, 2.317291259765625, 2.4547119140625, 2.592132568359375, 2.72955322265625, 2.866973876953125, 3.00439453125, 3.141815185546875, 3.27923583984375, 3.416656494140625, 3.5540771484375, 3.691497802734375, 3.82891845703125, 3.966339111328125, 4.103759765625, 4.241180419921875, 4.37860107421875, 4.516021728515625, 4.6534423828125, 4.790863037109375, 4.92828369140625, 5.065704345703125, 5.203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 10.0, 17.0, 26.0, 60.0, 157.0, 333.0, 277.0, 97.0, 20.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.57215881347656, -30.778039932250977, -28.983922958374023, -27.189804077148438, -25.39568519592285, -23.601566314697266, -21.807449340820312, -20.013330459594727, -18.21921157836914, -16.425092697143555, -14.630974769592285, -12.836856842041016, -11.04273796081543, -9.24862003326416, -7.454502105712891, -5.660383224487305, -3.8662662506103516, -2.072147846221924, -0.2780296802520752, 1.5160884857177734, 3.310206890106201, 5.104325294494629, 6.898443222045898, 8.692562103271484, 10.486680030822754, 12.280797958374023, 14.07491683959961, 15.869034767150879, 17.66315269470215, 19.457271575927734, 21.251388549804688, 23.045509338378906, 24.83962631225586, 26.633745193481445, 28.4278621673584, 30.221981048583984, 32.01609802246094, 33.810218811035156, 35.60433578491211, 37.39845275878906, 39.19257354736328, 40.986690521240234, 42.78081130981445, 44.574928283691406, 46.36904525756836, 48.16316604614258, 49.95728302001953, 51.75140380859375, 53.54551696777344, 55.33963394165039, 57.13375473022461, 58.92787170410156, 60.721988677978516, 62.516109466552734, 64.31022644042969, 66.1043472290039, 67.89846801757812, 69.69258880615234, 71.48670196533203, 73.28082275390625, 75.07494354248047, 76.86905670166016, 78.66317749023438, 80.4572982788086, 82.25141143798828]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 9.0, 4.0, 3.0, 11.0, 21.0, 22.0, 21.0, 27.0, 26.0, 27.0, 38.0, 44.0, 47.0, 63.0, 53.0, 46.0, 64.0, 53.0, 59.0, 55.0, 49.0, 43.0, 47.0, 28.0, 22.0, 28.0, 24.0, 20.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.564776420593262, -12.058303833007812, -11.55183219909668, -11.04535961151123, -10.538887023925781, -10.032415390014648, -9.5259428024292, -9.01947021484375, -8.512998580932617, -8.006525993347168, -7.500054359436035, -6.993581771850586, -6.487109661102295, -5.980637550354004, -5.474164962768555, -4.967692852020264, -4.461220741271973, -3.9547486305236816, -3.4482762813568115, -2.9418039321899414, -2.4353318214416504, -1.9288597106933594, -1.4223873615264893, -0.9159150123596191, -0.4094429016113281, 0.09702932834625244, 0.603501558303833, 1.1099737882614136, 1.6164460182189941, 2.122918128967285, 2.6293904781341553, 3.1358628273010254, 3.642333984375, 4.148806095123291, 4.655278205871582, 5.161750793457031, 5.668222904205322, 6.174695014953613, 6.6811676025390625, 7.1876397132873535, 7.6941118240356445, 8.200584411621094, 8.707056045532227, 9.213528633117676, 9.720001220703125, 10.226472854614258, 10.732945442199707, 11.239418029785156, 11.745889663696289, 12.252362251281738, 12.758833885192871, 13.26530647277832, 13.771778106689453, 14.278250694274902, 14.784723281860352, 15.291194915771484, 15.797667503356934, 16.304140090942383, 16.810611724853516, 17.31708335876465, 17.823556900024414, 18.330028533935547, 18.83650016784668, 19.342973709106445, 19.849445343017578]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 5.0, 14.0, 15.0, 33.0, 32.0, 66.0, 102.0, 163.0, 247.0, 362.0, 640.0, 1059.0, 1792.0, 3225.0, 6500.0, 13215.0, 29657.0, 69907.0, 174387.0, 356119.0, 228748.0, 90598.0, 37691.0, 16633.0, 7988.0, 4084.0, 2137.0, 1214.0, 688.0, 424.0, 283.0, 183.0, 105.0, 69.0, 36.0, 36.0, 20.0, 17.0, 12.0, 9.0, 5.0, 7.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7568359375, -1.6995086669921875, -1.642181396484375, -1.5848541259765625, -1.52752685546875, -1.4701995849609375, -1.412872314453125, -1.3555450439453125, -1.2982177734375, -1.2408905029296875, -1.183563232421875, -1.1262359619140625, -1.06890869140625, -1.0115814208984375, -0.954254150390625, -0.8969268798828125, -0.839599609375, -0.7822723388671875, -0.724945068359375, -0.6676177978515625, -0.61029052734375, -0.5529632568359375, -0.495635986328125, -0.4383087158203125, -0.3809814453125, -0.3236541748046875, -0.266326904296875, -0.2089996337890625, -0.15167236328125, -0.0943450927734375, -0.037017822265625, 0.0203094482421875, 0.07763671875, 0.1349639892578125, 0.192291259765625, 0.2496185302734375, 0.30694580078125, 0.3642730712890625, 0.421600341796875, 0.4789276123046875, 0.5362548828125, 0.5935821533203125, 0.650909423828125, 0.7082366943359375, 0.76556396484375, 0.8228912353515625, 0.880218505859375, 0.9375457763671875, 0.994873046875, 1.0522003173828125, 1.109527587890625, 1.1668548583984375, 1.22418212890625, 1.2815093994140625, 1.338836669921875, 1.3961639404296875, 1.4534912109375, 1.5108184814453125, 1.568145751953125, 1.6254730224609375, 1.68280029296875, 1.7401275634765625, 1.797454833984375, 1.8547821044921875, 1.912109375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 9.0, 15.0, 14.0, 13.0, 24.0, 24.0, 32.0, 35.0, 30.0, 46.0, 40.0, 38.0, 34.0, 37.0, 41.0, 47.0, 48.0, 52.0, 40.0, 44.0, 30.0, 48.0, 46.0, 28.0, 24.0, 22.0, 18.0, 15.0, 15.0, 14.0, 14.0, 8.0, 8.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8349609375, -0.807647705078125, -0.78033447265625, -0.753021240234375, -0.7257080078125, -0.698394775390625, -0.67108154296875, -0.643768310546875, -0.616455078125, -0.589141845703125, -0.56182861328125, -0.534515380859375, -0.5072021484375, -0.479888916015625, -0.45257568359375, -0.425262451171875, -0.39794921875, -0.370635986328125, -0.34332275390625, -0.316009521484375, -0.2886962890625, -0.261383056640625, -0.23406982421875, -0.206756591796875, -0.179443359375, -0.152130126953125, -0.12481689453125, -0.097503662109375, -0.0701904296875, -0.042877197265625, -0.01556396484375, 0.011749267578125, 0.0390625, 0.066375732421875, 0.09368896484375, 0.121002197265625, 0.1483154296875, 0.175628662109375, 0.20294189453125, 0.230255126953125, 0.257568359375, 0.284881591796875, 0.31219482421875, 0.339508056640625, 0.3668212890625, 0.394134521484375, 0.42144775390625, 0.448760986328125, 0.47607421875, 0.503387451171875, 0.53070068359375, 0.558013916015625, 0.5853271484375, 0.612640380859375, 0.63995361328125, 0.667266845703125, 0.694580078125, 0.721893310546875, 0.74920654296875, 0.776519775390625, 0.8038330078125, 0.831146240234375, 0.85845947265625, 0.885772705078125, 0.9130859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 9.0, 7.0, 10.0, 16.0, 14.0, 22.0, 25.0, 51.0, 55.0, 72.0, 121.0, 183.0, 294.0, 414.0, 648.0, 1145.0, 2273.0, 5545.0, 18230.0, 88470.0, 593490.0, 274889.0, 43700.0, 10825.0, 3756.0, 1744.0, 924.0, 570.0, 355.0, 225.0, 145.0, 80.0, 69.0, 44.0, 34.0, 22.0, 25.0, 11.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.989501953125, -2.88916015625, -2.788818359375, -2.6884765625, -2.588134765625, -2.48779296875, -2.387451171875, -2.287109375, -2.186767578125, -2.08642578125, -1.986083984375, -1.8857421875, -1.785400390625, -1.68505859375, -1.584716796875, -1.484375, -1.384033203125, -1.28369140625, -1.183349609375, -1.0830078125, -0.982666015625, -0.88232421875, -0.781982421875, -0.681640625, -0.581298828125, -0.48095703125, -0.380615234375, -0.2802734375, -0.179931640625, -0.07958984375, 0.020751953125, 0.12109375, 0.221435546875, 0.32177734375, 0.422119140625, 0.5224609375, 0.622802734375, 0.72314453125, 0.823486328125, 0.923828125, 1.024169921875, 1.12451171875, 1.224853515625, 1.3251953125, 1.425537109375, 1.52587890625, 1.626220703125, 1.7265625, 1.826904296875, 1.92724609375, 2.027587890625, 2.1279296875, 2.228271484375, 2.32861328125, 2.428955078125, 2.529296875, 2.629638671875, 2.72998046875, 2.830322265625, 2.9306640625, 3.031005859375, 3.13134765625, 3.231689453125, 3.33203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 4.0, 5.0, 9.0, 9.0, 10.0, 10.0, 18.0, 23.0, 16.0, 19.0, 20.0, 27.0, 34.0, 28.0, 30.0, 38.0, 52.0, 46.0, 32.0, 46.0, 45.0, 44.0, 53.0, 39.0, 41.0, 34.0, 36.0, 32.0, 32.0, 23.0, 21.0, 15.0, 20.0, 14.0, 14.0, 12.0, 8.0, 8.0, 5.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-3.47265625, -3.3590087890625, -3.245361328125, -3.1317138671875, -3.01806640625, -2.9044189453125, -2.790771484375, -2.6771240234375, -2.5634765625, -2.4498291015625, -2.336181640625, -2.2225341796875, -2.10888671875, -1.9952392578125, -1.881591796875, -1.7679443359375, -1.654296875, -1.5406494140625, -1.427001953125, -1.3133544921875, -1.19970703125, -1.0860595703125, -0.972412109375, -0.8587646484375, -0.7451171875, -0.6314697265625, -0.517822265625, -0.4041748046875, -0.29052734375, -0.1768798828125, -0.063232421875, 0.0504150390625, 0.1640625, 0.2777099609375, 0.391357421875, 0.5050048828125, 0.61865234375, 0.7322998046875, 0.845947265625, 0.9595947265625, 1.0732421875, 1.1868896484375, 1.300537109375, 1.4141845703125, 1.52783203125, 1.6414794921875, 1.755126953125, 1.8687744140625, 1.982421875, 2.0960693359375, 2.209716796875, 2.3233642578125, 2.43701171875, 2.5506591796875, 2.664306640625, 2.7779541015625, 2.8916015625, 3.0052490234375, 3.118896484375, 3.2325439453125, 3.34619140625, 3.4598388671875, 3.573486328125, 3.6871337890625, 3.80078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 9.0, 12.0, 25.0, 31.0, 48.0, 93.0, 185.0, 384.0, 1061.0, 5088.0, 104755.0, 906967.0, 25915.0, 2618.0, 750.0, 294.0, 132.0, 80.0, 42.0, 21.0, 12.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2734375, -3.190185546875, -3.10693359375, -3.023681640625, -2.9404296875, -2.857177734375, -2.77392578125, -2.690673828125, -2.607421875, -2.524169921875, -2.44091796875, -2.357666015625, -2.2744140625, -2.191162109375, -2.10791015625, -2.024658203125, -1.94140625, -1.858154296875, -1.77490234375, -1.691650390625, -1.6083984375, -1.525146484375, -1.44189453125, -1.358642578125, -1.275390625, -1.192138671875, -1.10888671875, -1.025634765625, -0.9423828125, -0.859130859375, -0.77587890625, -0.692626953125, -0.609375, -0.526123046875, -0.44287109375, -0.359619140625, -0.2763671875, -0.193115234375, -0.10986328125, -0.026611328125, 0.056640625, 0.139892578125, 0.22314453125, 0.306396484375, 0.3896484375, 0.472900390625, 0.55615234375, 0.639404296875, 0.72265625, 0.805908203125, 0.88916015625, 0.972412109375, 1.0556640625, 1.138916015625, 1.22216796875, 1.305419921875, 1.388671875, 1.471923828125, 1.55517578125, 1.638427734375, 1.7216796875, 1.804931640625, 1.88818359375, 1.971435546875, 2.0546875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 15.0, 20.0, 24.0, 35.0, 63.0, 88.0, 128.0, 152.0, 136.0, 103.0, 72.0, 60.0, 35.0, 24.0, 13.0, 6.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00039315223693847656, -0.00038183853030204773, -0.0003705248236656189, -0.00035921111702919006, -0.00034789741039276123, -0.0003365837037563324, -0.00032526999711990356, -0.00031395629048347473, -0.0003026425838470459, -0.00029132887721061707, -0.00028001517057418823, -0.0002687014639377594, -0.00025738775730133057, -0.00024607405066490173, -0.0002347603440284729, -0.00022344663739204407, -0.00021213293075561523, -0.0002008192241191864, -0.00018950551748275757, -0.00017819181084632874, -0.0001668781042098999, -0.00015556439757347107, -0.00014425069093704224, -0.0001329369843006134, -0.00012162327766418457, -0.00011030957102775574, -9.89958643913269e-05, -8.768215775489807e-05, -7.636845111846924e-05, -6.50547444820404e-05, -5.374103784561157e-05, -4.242733120918274e-05, -3.1113624572753906e-05, -1.9799917936325073e-05, -8.48621129989624e-06, 2.8274953365325928e-06, 1.4141201972961426e-05, 2.545490860939026e-05, 3.676861524581909e-05, 4.8082321882247925e-05, 5.939602851867676e-05, 7.070973515510559e-05, 8.202344179153442e-05, 9.333714842796326e-05, 0.00010465085506439209, 0.00011596456170082092, 0.00012727826833724976, 0.0001385919749736786, 0.00014990568161010742, 0.00016121938824653625, 0.0001725330948829651, 0.00018384680151939392, 0.00019516050815582275, 0.0002064742147922516, 0.00021778792142868042, 0.00022910162806510925, 0.00024041533470153809, 0.0002517290413379669, 0.00026304274797439575, 0.0002743564546108246, 0.0002856701612472534, 0.00029698386788368225, 0.0003082975745201111, 0.0003196112811565399, 0.00033092498779296875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 12.0, 18.0, 21.0, 27.0, 39.0, 85.0, 131.0, 264.0, 504.0, 1229.0, 3576.0, 15866.0, 169780.0, 763795.0, 79045.0, 9710.0, 2585.0, 929.0, 434.0, 200.0, 116.0, 68.0, 32.0, 24.0, 18.0, 8.0, 10.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.66015625, -1.6132049560546875, -1.566253662109375, -1.5193023681640625, -1.47235107421875, -1.4253997802734375, -1.378448486328125, -1.3314971923828125, -1.2845458984375, -1.2375946044921875, -1.190643310546875, -1.1436920166015625, -1.09674072265625, -1.0497894287109375, -1.002838134765625, -0.9558868408203125, -0.908935546875, -0.8619842529296875, -0.815032958984375, -0.7680816650390625, -0.72113037109375, -0.6741790771484375, -0.627227783203125, -0.5802764892578125, -0.5333251953125, -0.4863739013671875, -0.439422607421875, -0.3924713134765625, -0.34552001953125, -0.2985687255859375, -0.251617431640625, -0.2046661376953125, -0.15771484375, -0.1107635498046875, -0.063812255859375, -0.0168609619140625, 0.03009033203125, 0.0770416259765625, 0.123992919921875, 0.1709442138671875, 0.2178955078125, 0.2648468017578125, 0.311798095703125, 0.3587493896484375, 0.40570068359375, 0.4526519775390625, 0.499603271484375, 0.5465545654296875, 0.593505859375, 0.6404571533203125, 0.687408447265625, 0.7343597412109375, 0.78131103515625, 0.8282623291015625, 0.875213623046875, 0.9221649169921875, 0.9691162109375, 1.0160675048828125, 1.063018798828125, 1.1099700927734375, 1.15692138671875, 1.2038726806640625, 1.250823974609375, 1.2977752685546875, 1.3447265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 8.0, 17.0, 24.0, 32.0, 32.0, 33.0, 62.0, 73.0, 80.0, 91.0, 80.0, 74.0, 80.0, 59.0, 51.0, 40.0, 42.0, 28.0, 24.0, 16.0, 10.0, 6.0, 4.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.1199798583984375, -1.080780029296875, -1.0415802001953125, -1.00238037109375, -0.9631805419921875, -0.923980712890625, -0.8847808837890625, -0.8455810546875, -0.8063812255859375, -0.767181396484375, -0.7279815673828125, -0.68878173828125, -0.6495819091796875, -0.610382080078125, -0.5711822509765625, -0.531982421875, -0.4927825927734375, -0.453582763671875, -0.4143829345703125, -0.37518310546875, -0.3359832763671875, -0.296783447265625, -0.2575836181640625, -0.2183837890625, -0.1791839599609375, -0.139984130859375, -0.1007843017578125, -0.06158447265625, -0.0223846435546875, 0.016815185546875, 0.0560150146484375, 0.09521484375, 0.1344146728515625, 0.173614501953125, 0.2128143310546875, 0.25201416015625, 0.2912139892578125, 0.330413818359375, 0.3696136474609375, 0.4088134765625, 0.4480133056640625, 0.487213134765625, 0.5264129638671875, 0.56561279296875, 0.6048126220703125, 0.644012451171875, 0.6832122802734375, 0.722412109375, 0.7616119384765625, 0.800811767578125, 0.8400115966796875, 0.87921142578125, 0.9184112548828125, 0.957611083984375, 0.9968109130859375, 1.0360107421875, 1.0752105712890625, 1.114410400390625, 1.1536102294921875, 1.19281005859375, 1.2320098876953125, 1.271209716796875, 1.3104095458984375, 1.349609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 11.0, 13.0, 22.0, 35.0, 75.0, 85.0, 135.0, 138.0, 149.0, 106.0, 75.0, 58.0, 28.0, 22.0, 12.0, 8.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.902667999267578, -19.232820510864258, -18.562973022460938, -17.893125534057617, -17.223278045654297, -16.553428649902344, -15.883581161499023, -15.213733673095703, -14.543886184692383, -13.874038696289062, -13.204191207885742, -12.534342765808105, -11.864495277404785, -11.194647789001465, -10.524799346923828, -9.854951858520508, -9.185104370117188, -8.515256881713867, -7.845408916473389, -7.17556095123291, -6.50571346282959, -5.8358659744262695, -5.166018009185791, -4.4961700439453125, -3.826322555541992, -3.1564748287200928, -2.4866271018981934, -1.816779375076294, -1.1469316482543945, -0.4770839214324951, 0.1927638053894043, 0.8626117706298828, 1.5324573516845703, 2.2023050785064697, 2.872152805328369, 3.5420005321502686, 4.211848258972168, 4.881695747375488, 5.551543712615967, 6.221391677856445, 6.891239166259766, 7.561086654663086, 8.230934143066406, 8.900782585144043, 9.570630073547363, 10.240477561950684, 10.91032600402832, 11.58017349243164, 12.250020980834961, 12.919868469238281, 13.589715957641602, 14.259564399719238, 14.929411888122559, 15.599259376525879, 16.269107818603516, 16.938955307006836, 17.608802795410156, 18.278650283813477, 18.948497772216797, 19.618345260620117, 20.288192749023438, 20.95804214477539, 21.62788963317871, 22.29773712158203, 22.96758460998535]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 3.0, 14.0, 16.0, 15.0, 15.0, 8.0, 12.0, 31.0, 33.0, 38.0, 39.0, 42.0, 35.0, 41.0, 50.0, 63.0, 54.0, 52.0, 49.0, 41.0, 43.0, 36.0, 30.0, 31.0, 23.0, 28.0, 26.0, 10.0, 22.0, 17.0, 10.0, 13.0, 13.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-15.03665542602539, -14.563257217407227, -14.089859008789062, -13.616460800170898, -13.143061637878418, -12.669663429260254, -12.19626522064209, -11.722867012023926, -11.249467849731445, -10.776069641113281, -10.302671432495117, -9.829273223876953, -9.355874061584473, -8.882475852966309, -8.409077644348145, -7.9356794357299805, -7.462281227111816, -6.988883018493652, -6.51548433303833, -6.042086124420166, -5.568687438964844, -5.09528923034668, -4.621891021728516, -4.148492813110352, -3.6750941276550293, -3.201695680618286, -2.728297233581543, -2.254899024963379, -1.7815005779266357, -1.3081021308898926, -0.8347039222717285, -0.36130547523498535, 0.11209297180175781, 0.5854913592338562, 1.0588897466659546, 1.5322880744934082, 2.0056865215301514, 2.4790849685668945, 2.9524831771850586, 3.4258816242218018, 3.899280071258545, 4.372678279876709, 4.846076965332031, 5.319475173950195, 5.792873382568359, 6.266272068023682, 6.739670276641846, 7.213068962097168, 7.686467170715332, 8.159865379333496, 8.63326358795166, 9.10666275024414, 9.580060958862305, 10.053459167480469, 10.526857376098633, 11.000255584716797, 11.473653793334961, 11.947052001953125, 12.420450210571289, 12.893848419189453, 13.367247581481934, 13.840645790100098, 14.314043998718262, 14.787442207336426, 15.260841369628906]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 7.0, 10.0, 11.0, 19.0, 15.0, 33.0, 38.0, 60.0, 96.0, 131.0, 322.0, 1452.0, 21770.0, 4114994.0, 52177.0, 2273.0, 403.0, 157.0, 95.0, 74.0, 41.0, 25.0, 18.0, 17.0, 11.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.285400390625, -7.04736328125, -6.809326171875, -6.5712890625, -6.333251953125, -6.09521484375, -5.857177734375, -5.619140625, -5.381103515625, -5.14306640625, -4.905029296875, -4.6669921875, -4.428955078125, -4.19091796875, -3.952880859375, -3.71484375, -3.476806640625, -3.23876953125, -3.000732421875, -2.7626953125, -2.524658203125, -2.28662109375, -2.048583984375, -1.810546875, -1.572509765625, -1.33447265625, -1.096435546875, -0.8583984375, -0.620361328125, -0.38232421875, -0.144287109375, 0.09375, 0.331787109375, 0.56982421875, 0.807861328125, 1.0458984375, 1.283935546875, 1.52197265625, 1.760009765625, 1.998046875, 2.236083984375, 2.47412109375, 2.712158203125, 2.9501953125, 3.188232421875, 3.42626953125, 3.664306640625, 3.90234375, 4.140380859375, 4.37841796875, 4.616455078125, 4.8544921875, 5.092529296875, 5.33056640625, 5.568603515625, 5.806640625, 6.044677734375, 6.28271484375, 6.520751953125, 6.7587890625, 6.996826171875, 7.23486328125, 7.472900390625, 7.7109375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 11.0, 9.0, 8.0, 22.0, 30.0, 27.0, 31.0, 33.0, 36.0, 44.0, 59.0, 62.0, 53.0, 54.0, 46.0, 55.0, 60.0, 49.0, 61.0, 35.0, 49.0, 27.0, 26.0, 23.0, 23.0, 20.0, 18.0, 8.0, 5.0, 8.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0927734375, -1.0590362548828125, -1.025299072265625, -0.9915618896484375, -0.95782470703125, -0.9240875244140625, -0.890350341796875, -0.8566131591796875, -0.8228759765625, -0.7891387939453125, -0.755401611328125, -0.7216644287109375, -0.68792724609375, -0.6541900634765625, -0.620452880859375, -0.5867156982421875, -0.552978515625, -0.5192413330078125, -0.485504150390625, -0.4517669677734375, -0.41802978515625, -0.3842926025390625, -0.350555419921875, -0.3168182373046875, -0.2830810546875, -0.2493438720703125, -0.215606689453125, -0.1818695068359375, -0.14813232421875, -0.1143951416015625, -0.080657958984375, -0.0469207763671875, -0.01318359375, 0.0205535888671875, 0.054290771484375, 0.0880279541015625, 0.12176513671875, 0.1555023193359375, 0.189239501953125, 0.2229766845703125, 0.2567138671875, 0.2904510498046875, 0.324188232421875, 0.3579254150390625, 0.39166259765625, 0.4253997802734375, 0.459136962890625, 0.4928741455078125, 0.526611328125, 0.5603485107421875, 0.594085693359375, 0.6278228759765625, 0.66156005859375, 0.6952972412109375, 0.729034423828125, 0.7627716064453125, 0.7965087890625, 0.8302459716796875, 0.863983154296875, 0.8977203369140625, 0.93145751953125, 0.9651947021484375, 0.998931884765625, 1.0326690673828125, 1.06640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 13.0, 30.0, 48.0, 87.0, 121.0, 269.0, 437.0, 772.0, 1354.0, 2576.0, 4791.0, 10761.0, 27186.0, 93776.0, 873757.0, 2926121.0, 183498.0, 41490.0, 14274.0, 6197.0, 2980.0, 1576.0, 922.0, 521.0, 293.0, 170.0, 103.0, 61.0, 33.0, 18.0, 13.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.0306396484375, -1.969482421875, -1.9083251953125, -1.84716796875, -1.7860107421875, -1.724853515625, -1.6636962890625, -1.6025390625, -1.5413818359375, -1.480224609375, -1.4190673828125, -1.35791015625, -1.2967529296875, -1.235595703125, -1.1744384765625, -1.11328125, -1.0521240234375, -0.990966796875, -0.9298095703125, -0.86865234375, -0.8074951171875, -0.746337890625, -0.6851806640625, -0.6240234375, -0.5628662109375, -0.501708984375, -0.4405517578125, -0.37939453125, -0.3182373046875, -0.257080078125, -0.1959228515625, -0.134765625, -0.0736083984375, -0.012451171875, 0.0487060546875, 0.10986328125, 0.1710205078125, 0.232177734375, 0.2933349609375, 0.3544921875, 0.4156494140625, 0.476806640625, 0.5379638671875, 0.59912109375, 0.6602783203125, 0.721435546875, 0.7825927734375, 0.84375, 0.9049072265625, 0.966064453125, 1.0272216796875, 1.08837890625, 1.1495361328125, 1.210693359375, 1.2718505859375, 1.3330078125, 1.3941650390625, 1.455322265625, 1.5164794921875, 1.57763671875, 1.6387939453125, 1.699951171875, 1.7611083984375, 1.822265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 7.0, 6.0, 9.0, 8.0, 12.0, 13.0, 21.0, 35.0, 53.0, 49.0, 69.0, 132.0, 238.0, 472.0, 1021.0, 902.0, 442.0, 216.0, 129.0, 57.0, 44.0, 41.0, 20.0, 18.0, 13.0, 9.0, 9.0, 1.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.775390625, -2.70013427734375, -2.6248779296875, -2.54962158203125, -2.474365234375, -2.39910888671875, -2.3238525390625, -2.24859619140625, -2.17333984375, -2.09808349609375, -2.0228271484375, -1.94757080078125, -1.872314453125, -1.79705810546875, -1.7218017578125, -1.64654541015625, -1.5712890625, -1.49603271484375, -1.4207763671875, -1.34552001953125, -1.270263671875, -1.19500732421875, -1.1197509765625, -1.04449462890625, -0.96923828125, -0.89398193359375, -0.8187255859375, -0.74346923828125, -0.668212890625, -0.59295654296875, -0.5177001953125, -0.44244384765625, -0.3671875, -0.29193115234375, -0.2166748046875, -0.14141845703125, -0.066162109375, 0.00909423828125, 0.0843505859375, 0.15960693359375, 0.23486328125, 0.31011962890625, 0.3853759765625, 0.46063232421875, 0.535888671875, 0.61114501953125, 0.6864013671875, 0.76165771484375, 0.8369140625, 0.91217041015625, 0.9874267578125, 1.06268310546875, 1.137939453125, 1.21319580078125, 1.2884521484375, 1.36370849609375, 1.43896484375, 1.51422119140625, 1.5894775390625, 1.66473388671875, 1.739990234375, 1.81524658203125, 1.8905029296875, 1.96575927734375, 2.041015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 15.0, 8.0, 24.0, 60.0, 142.0, 232.0, 223.0, 145.0, 69.0, 37.0, 13.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.63908386230469, -38.83693313598633, -38.03478240966797, -37.232635498046875, -36.430484771728516, -35.628334045410156, -34.8261833190918, -34.02403259277344, -33.22188186645508, -32.41973114013672, -31.617582321166992, -30.815431594848633, -30.013280868530273, -29.211132049560547, -28.408981323242188, -27.606830596923828, -26.804683685302734, -26.002532958984375, -25.20038414001465, -24.39823341369629, -23.59608268737793, -22.793933868408203, -21.991783142089844, -21.189632415771484, -20.387481689453125, -19.585330963134766, -18.78318214416504, -17.98103141784668, -17.17888069152832, -16.376731872558594, -15.574581146240234, -14.772431373596191, -13.970281600952148, -13.168131828308105, -12.365981101989746, -11.563831329345703, -10.76168155670166, -9.959531784057617, -9.157381057739258, -8.355231285095215, -7.553081035614014, -6.7509307861328125, -5.9487810134887695, -5.146630764007568, -4.344480514526367, -3.542330741882324, -2.740180492401123, -1.93803071975708, -1.135880470275879, -0.33373039960861206, 0.4684196710586548, 1.2705698013305664, 2.0727198123931885, 2.8748698234558105, 3.6770200729370117, 4.479169845581055, 5.281320095062256, 6.083470344543457, 6.8856201171875, 7.687770366668701, 8.489920616149902, 9.292070388793945, 10.094221115112305, 10.896369934082031, 11.69852066040039]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 8.0, 1.0, 16.0, 15.0, 22.0, 16.0, 23.0, 22.0, 34.0, 31.0, 43.0, 46.0, 65.0, 62.0, 41.0, 61.0, 51.0, 56.0, 50.0, 51.0, 47.0, 46.0, 40.0, 25.0, 24.0, 26.0, 20.0, 14.0, 9.0, 10.0, 5.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.268362998962402, -13.882357597351074, -13.49635124206543, -13.110345840454102, -12.724340438842773, -12.338335037231445, -11.952329635620117, -11.566323280334473, -11.180317878723145, -10.794312477111816, -10.408306121826172, -10.022300720214844, -9.636295318603516, -9.250289916992188, -8.86428451538086, -8.478278160095215, -8.092272758483887, -7.706267356872559, -7.320261478424072, -6.934255599975586, -6.548250198364258, -6.16224479675293, -5.776238918304443, -5.390233039855957, -5.004227638244629, -4.618222236633301, -4.2322163581848145, -3.8462107181549072, -3.460205078125, -3.0741994380950928, -2.6881937980651855, -2.3021881580352783, -1.9161834716796875, -1.5301778316497803, -1.144172191619873, -0.7581665515899658, -0.3721609115600586, 0.013844728469848633, 0.39985036849975586, 0.7858560085296631, 1.1718616485595703, 1.5578672885894775, 1.9438729286193848, 2.329878568649292, 2.715884208679199, 3.1018898487091064, 3.4878954887390137, 3.873901128768921, 4.259906768798828, 4.645912170410156, 5.031918048858643, 5.417923927307129, 5.803929328918457, 6.189934730529785, 6.5759406089782715, 6.961946487426758, 7.347951889038086, 7.733957290649414, 8.119962692260742, 8.505969047546387, 8.891974449157715, 9.277979850769043, 9.663986206054688, 10.049991607666016, 10.435997009277344]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 16.0, 25.0, 29.0, 60.0, 102.0, 150.0, 266.0, 483.0, 848.0, 1605.0, 2866.0, 5730.0, 12286.0, 28817.0, 74719.0, 212195.0, 400892.0, 190750.0, 67494.0, 26478.0, 11329.0, 5409.0, 2676.0, 1420.0, 793.0, 431.0, 281.0, 162.0, 89.0, 43.0, 30.0, 24.0, 16.0, 13.0, 6.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8125, -1.7529754638671875, -1.693450927734375, -1.6339263916015625, -1.57440185546875, -1.5148773193359375, -1.455352783203125, -1.3958282470703125, -1.3363037109375, -1.2767791748046875, -1.217254638671875, -1.1577301025390625, -1.09820556640625, -1.0386810302734375, -0.979156494140625, -0.9196319580078125, -0.860107421875, -0.8005828857421875, -0.741058349609375, -0.6815338134765625, -0.62200927734375, -0.5624847412109375, -0.502960205078125, -0.4434356689453125, -0.3839111328125, -0.3243865966796875, -0.264862060546875, -0.2053375244140625, -0.14581298828125, -0.0862884521484375, -0.026763916015625, 0.0327606201171875, 0.09228515625, 0.1518096923828125, 0.211334228515625, 0.2708587646484375, 0.33038330078125, 0.3899078369140625, 0.449432373046875, 0.5089569091796875, 0.5684814453125, 0.6280059814453125, 0.687530517578125, 0.7470550537109375, 0.80657958984375, 0.8661041259765625, 0.925628662109375, 0.9851531982421875, 1.044677734375, 1.1042022705078125, 1.163726806640625, 1.2232513427734375, 1.28277587890625, 1.3423004150390625, 1.401824951171875, 1.4613494873046875, 1.5208740234375, 1.5803985595703125, 1.639923095703125, 1.6994476318359375, 1.75897216796875, 1.8184967041015625, 1.878021240234375, 1.9375457763671875, 1.9970703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 5.0, 11.0, 13.0, 10.0, 22.0, 18.0, 26.0, 23.0, 28.0, 32.0, 40.0, 37.0, 36.0, 41.0, 53.0, 42.0, 46.0, 51.0, 41.0, 46.0, 52.0, 33.0, 36.0, 39.0, 35.0, 28.0, 28.0, 26.0, 16.0, 17.0, 8.0, 8.0, 8.0, 5.0, 7.0, 5.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.8406448364257812, -0.8126373291015625, -0.7846298217773438, -0.756622314453125, -0.7286148071289062, -0.7006072998046875, -0.6725997924804688, -0.64459228515625, -0.6165847778320312, -0.5885772705078125, -0.5605697631835938, -0.532562255859375, -0.5045547485351562, -0.4765472412109375, -0.44853973388671875, -0.4205322265625, -0.39252471923828125, -0.3645172119140625, -0.33650970458984375, -0.308502197265625, -0.28049468994140625, -0.2524871826171875, -0.22447967529296875, -0.19647216796875, -0.16846466064453125, -0.1404571533203125, -0.11244964599609375, -0.084442138671875, -0.05643463134765625, -0.0284271240234375, -0.00041961669921875, 0.027587890625, 0.05559539794921875, 0.0836029052734375, 0.11161041259765625, 0.139617919921875, 0.16762542724609375, 0.1956329345703125, 0.22364044189453125, 0.25164794921875, 0.27965545654296875, 0.3076629638671875, 0.33567047119140625, 0.363677978515625, 0.39168548583984375, 0.4196929931640625, 0.44770050048828125, 0.4757080078125, 0.5037155151367188, 0.5317230224609375, 0.5597305297851562, 0.587738037109375, 0.6157455444335938, 0.6437530517578125, 0.6717605590820312, 0.69976806640625, 0.7277755737304688, 0.7557830810546875, 0.7837905883789062, 0.811798095703125, 0.8398056030273438, 0.8678131103515625, 0.8958206176757812, 0.923828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 16.0, 12.0, 13.0, 22.0, 31.0, 41.0, 67.0, 128.0, 220.0, 390.0, 823.0, 2110.0, 7085.0, 35357.0, 296731.0, 626571.0, 62791.0, 11038.0, 2876.0, 1059.0, 496.0, 260.0, 159.0, 85.0, 43.0, 41.0, 26.0, 6.0, 15.0, 4.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.765625, -4.640716552734375, -4.51580810546875, -4.390899658203125, -4.2659912109375, -4.141082763671875, -4.01617431640625, -3.891265869140625, -3.766357421875, -3.641448974609375, -3.51654052734375, -3.391632080078125, -3.2667236328125, -3.141815185546875, -3.01690673828125, -2.891998291015625, -2.76708984375, -2.642181396484375, -2.51727294921875, -2.392364501953125, -2.2674560546875, -2.142547607421875, -2.01763916015625, -1.892730712890625, -1.767822265625, -1.642913818359375, -1.51800537109375, -1.393096923828125, -1.2681884765625, -1.143280029296875, -1.01837158203125, -0.893463134765625, -0.7685546875, -0.643646240234375, -0.51873779296875, -0.393829345703125, -0.2689208984375, -0.144012451171875, -0.01910400390625, 0.105804443359375, 0.230712890625, 0.355621337890625, 0.48052978515625, 0.605438232421875, 0.7303466796875, 0.855255126953125, 0.98016357421875, 1.105072021484375, 1.22998046875, 1.354888916015625, 1.47979736328125, 1.604705810546875, 1.7296142578125, 1.854522705078125, 1.97943115234375, 2.104339599609375, 2.229248046875, 2.354156494140625, 2.47906494140625, 2.603973388671875, 2.7288818359375, 2.853790283203125, 2.97869873046875, 3.103607177734375, 3.228515625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 7.0, 4.0, 12.0, 9.0, 14.0, 20.0, 28.0, 31.0, 33.0, 19.0, 59.0, 57.0, 48.0, 53.0, 62.0, 78.0, 57.0, 44.0, 52.0, 47.0, 47.0, 45.0, 34.0, 36.0, 17.0, 17.0, 20.0, 14.0, 10.0, 6.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2421875, -4.099853515625, -3.95751953125, -3.815185546875, -3.6728515625, -3.530517578125, -3.38818359375, -3.245849609375, -3.103515625, -2.961181640625, -2.81884765625, -2.676513671875, -2.5341796875, -2.391845703125, -2.24951171875, -2.107177734375, -1.96484375, -1.822509765625, -1.68017578125, -1.537841796875, -1.3955078125, -1.253173828125, -1.11083984375, -0.968505859375, -0.826171875, -0.683837890625, -0.54150390625, -0.399169921875, -0.2568359375, -0.114501953125, 0.02783203125, 0.170166015625, 0.3125, 0.454833984375, 0.59716796875, 0.739501953125, 0.8818359375, 1.024169921875, 1.16650390625, 1.308837890625, 1.451171875, 1.593505859375, 1.73583984375, 1.878173828125, 2.0205078125, 2.162841796875, 2.30517578125, 2.447509765625, 2.58984375, 2.732177734375, 2.87451171875, 3.016845703125, 3.1591796875, 3.301513671875, 3.44384765625, 3.586181640625, 3.728515625, 3.870849609375, 4.01318359375, 4.155517578125, 4.2978515625, 4.440185546875, 4.58251953125, 4.724853515625, 4.8671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 16.0, 33.0, 46.0, 121.0, 358.0, 1425.0, 11773.0, 788889.0, 238274.0, 6195.0, 938.0, 243.0, 105.0, 48.0, 21.0, 17.0, 10.0, 7.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.826171875, -2.7315673828125, -2.636962890625, -2.5423583984375, -2.44775390625, -2.3531494140625, -2.258544921875, -2.1639404296875, -2.0693359375, -1.9747314453125, -1.880126953125, -1.7855224609375, -1.69091796875, -1.5963134765625, -1.501708984375, -1.4071044921875, -1.3125, -1.2178955078125, -1.123291015625, -1.0286865234375, -0.93408203125, -0.8394775390625, -0.744873046875, -0.6502685546875, -0.5556640625, -0.4610595703125, -0.366455078125, -0.2718505859375, -0.17724609375, -0.0826416015625, 0.011962890625, 0.1065673828125, 0.201171875, 0.2957763671875, 0.390380859375, 0.4849853515625, 0.57958984375, 0.6741943359375, 0.768798828125, 0.8634033203125, 0.9580078125, 1.0526123046875, 1.147216796875, 1.2418212890625, 1.33642578125, 1.4310302734375, 1.525634765625, 1.6202392578125, 1.71484375, 1.8094482421875, 1.904052734375, 1.9986572265625, 2.09326171875, 2.1878662109375, 2.282470703125, 2.3770751953125, 2.4716796875, 2.5662841796875, 2.660888671875, 2.7554931640625, 2.85009765625, 2.9447021484375, 3.039306640625, 3.1339111328125, 3.228515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 12.0, 10.0, 12.0, 23.0, 25.0, 31.0, 45.0, 43.0, 63.0, 79.0, 93.0, 95.0, 91.0, 85.0, 58.0, 45.0, 40.0, 37.0, 18.0, 16.0, 17.0, 12.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019943714141845703, -0.0001930762082338333, -0.0001867152750492096, -0.00018035434186458588, -0.00017399340867996216, -0.00016763247549533844, -0.00016127154231071472, -0.000154910609126091, -0.00014854967594146729, -0.00014218874275684357, -0.00013582780957221985, -0.00012946687638759613, -0.0001231059432029724, -0.0001167450100183487, -0.00011038407683372498, -0.00010402314364910126, -9.766221046447754e-05, -9.130127727985382e-05, -8.49403440952301e-05, -7.857941091060638e-05, -7.221847772598267e-05, -6.585754454135895e-05, -5.949661135673523e-05, -5.313567817211151e-05, -4.677474498748779e-05, -4.0413811802864075e-05, -3.4052878618240356e-05, -2.7691945433616638e-05, -2.133101224899292e-05, -1.4970079064369202e-05, -8.609145879745483e-06, -2.248212695121765e-06, 4.112720489501953e-06, 1.0473653674125671e-05, 1.683458685874939e-05, 2.3195520043373108e-05, 2.9556453227996826e-05, 3.5917386412620544e-05, 4.227831959724426e-05, 4.863925278186798e-05, 5.50001859664917e-05, 6.136111915111542e-05, 6.772205233573914e-05, 7.408298552036285e-05, 8.044391870498657e-05, 8.680485188961029e-05, 9.316578507423401e-05, 9.952671825885773e-05, 0.00010588765144348145, 0.00011224858462810516, 0.00011860951781272888, 0.0001249704509973526, 0.00013133138418197632, 0.00013769231736660004, 0.00014405325055122375, 0.00015041418373584747, 0.0001567751169204712, 0.0001631360501050949, 0.00016949698328971863, 0.00017585791647434235, 0.00018221884965896606, 0.00018857978284358978, 0.0001949407160282135, 0.00020130164921283722, 0.00020766258239746094]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 3.0, 13.0, 16.0, 36.0, 37.0, 70.0, 157.0, 389.0, 1137.0, 5126.0, 71439.0, 915858.0, 48415.0, 4132.0, 1048.0, 339.0, 142.0, 80.0, 39.0, 32.0, 25.0, 9.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7431640625, -1.6718597412109375, -1.600555419921875, -1.5292510986328125, -1.45794677734375, -1.3866424560546875, -1.315338134765625, -1.2440338134765625, -1.1727294921875, -1.1014251708984375, -1.030120849609375, -0.9588165283203125, -0.88751220703125, -0.8162078857421875, -0.744903564453125, -0.6735992431640625, -0.602294921875, -0.5309906005859375, -0.459686279296875, -0.3883819580078125, -0.31707763671875, -0.2457733154296875, -0.174468994140625, -0.1031646728515625, -0.0318603515625, 0.0394439697265625, 0.110748291015625, 0.1820526123046875, 0.25335693359375, 0.3246612548828125, 0.395965576171875, 0.4672698974609375, 0.53857421875, 0.6098785400390625, 0.681182861328125, 0.7524871826171875, 0.82379150390625, 0.8950958251953125, 0.966400146484375, 1.0377044677734375, 1.1090087890625, 1.1803131103515625, 1.251617431640625, 1.3229217529296875, 1.39422607421875, 1.4655303955078125, 1.536834716796875, 1.6081390380859375, 1.679443359375, 1.7507476806640625, 1.822052001953125, 1.8933563232421875, 1.96466064453125, 2.0359649658203125, 2.107269287109375, 2.1785736083984375, 2.2498779296875, 2.3211822509765625, 2.392486572265625, 2.4637908935546875, 2.53509521484375, 2.6063995361328125, 2.677703857421875, 2.7490081787109375, 2.8203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 8.0, 15.0, 18.0, 19.0, 30.0, 41.0, 51.0, 68.0, 97.0, 103.0, 102.0, 63.0, 81.0, 70.0, 66.0, 38.0, 27.0, 23.0, 18.0, 14.0, 10.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -0.993682861328125, -0.95611572265625, -0.918548583984375, -0.8809814453125, -0.843414306640625, -0.80584716796875, -0.768280029296875, -0.730712890625, -0.693145751953125, -0.65557861328125, -0.618011474609375, -0.5804443359375, -0.542877197265625, -0.50531005859375, -0.467742919921875, -0.43017578125, -0.392608642578125, -0.35504150390625, -0.317474365234375, -0.2799072265625, -0.242340087890625, -0.20477294921875, -0.167205810546875, -0.129638671875, -0.092071533203125, -0.05450439453125, -0.016937255859375, 0.0206298828125, 0.058197021484375, 0.09576416015625, 0.133331298828125, 0.1708984375, 0.208465576171875, 0.24603271484375, 0.283599853515625, 0.3211669921875, 0.358734130859375, 0.39630126953125, 0.433868408203125, 0.471435546875, 0.509002685546875, 0.54656982421875, 0.584136962890625, 0.6217041015625, 0.659271240234375, 0.69683837890625, 0.734405517578125, 0.77197265625, 0.809539794921875, 0.84710693359375, 0.884674072265625, 0.9222412109375, 0.959808349609375, 0.99737548828125, 1.034942626953125, 1.072509765625, 1.110076904296875, 1.14764404296875, 1.185211181640625, 1.2227783203125, 1.260345458984375, 1.29791259765625, 1.335479736328125, 1.373046875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 11.0, 11.0, 27.0, 39.0, 55.0, 83.0, 120.0, 201.0, 150.0, 94.0, 78.0, 46.0, 29.0, 12.0, 15.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.539305686950684, -14.880812644958496, -14.222319602966309, -13.563826560974121, -12.905333518981934, -12.246840476989746, -11.588347434997559, -10.929854393005371, -10.271361351013184, -9.612868309020996, -8.954375267028809, -8.295882225036621, -7.637389183044434, -6.978896141052246, -6.320403099060059, -5.661910057067871, -5.003417015075684, -4.344923973083496, -3.6864309310913086, -3.027937889099121, -2.3694448471069336, -1.710951805114746, -1.0524587631225586, -0.3939657211303711, 0.2645273208618164, 0.9230203628540039, 1.5815134048461914, 2.240006446838379, 2.8984994888305664, 3.556992530822754, 4.215485572814941, 4.873978614807129, 5.532472610473633, 6.19096565246582, 6.849458694458008, 7.507951736450195, 8.166444778442383, 8.82493782043457, 9.483430862426758, 10.141923904418945, 10.800416946411133, 11.45890998840332, 12.117403030395508, 12.775896072387695, 13.434389114379883, 14.09288215637207, 14.751375198364258, 15.409868240356445, 16.068361282348633, 16.72685432434082, 17.385347366333008, 18.043840408325195, 18.702333450317383, 19.36082649230957, 20.019319534301758, 20.677812576293945, 21.336305618286133, 21.99479866027832, 22.653291702270508, 23.311784744262695, 23.970277786254883, 24.62877082824707, 25.287263870239258, 25.945756912231445, 26.604249954223633]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 14.0, 9.0, 25.0, 21.0, 25.0, 31.0, 35.0, 38.0, 43.0, 54.0, 61.0, 71.0, 89.0, 73.0, 78.0, 46.0, 45.0, 44.0, 42.0, 31.0, 29.0, 18.0, 24.0, 15.0, 10.0, 10.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.44171142578125, -16.763444900512695, -16.085180282592773, -15.406913757324219, -14.728647232055664, -14.050381660461426, -13.372116088867188, -12.693849563598633, -12.015583992004395, -11.337318420410156, -10.659051895141602, -9.980786323547363, -9.302520751953125, -8.62425422668457, -7.945988655090332, -7.2677226066589355, -6.589456558227539, -5.911190509796143, -5.232924461364746, -4.554658889770508, -3.8763928413391113, -3.198126792907715, -2.5198612213134766, -1.84159517288208, -1.1633291244506836, -0.48506319522857666, 0.19320273399353027, 0.8714685440063477, 1.5497345924377441, 2.2280006408691406, 2.906266212463379, 3.5845322608947754, 4.262798309326172, 4.941064357757568, 5.619330406188965, 6.297595977783203, 6.9758620262146, 7.654128074645996, 8.332393646240234, 9.010660171508789, 9.688925743103027, 10.367191314697266, 11.04545783996582, 11.723723411560059, 12.401988983154297, 13.080255508422852, 13.75852108001709, 14.436786651611328, 15.115053176879883, 15.793318748474121, 16.47158432006836, 17.149850845336914, 17.82811737060547, 18.50638198852539, 19.184648513793945, 19.8629150390625, 20.541179656982422, 21.219446182250977, 21.8977108001709, 22.575977325439453, 23.254243850708008, 23.932510375976562, 24.610774993896484, 25.28904151916504, 25.967308044433594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 9.0, 28.0, 52.0, 95.0, 197.0, 488.0, 943.0, 2039.0, 4648.0, 11742.0, 38726.0, 220064.0, 2615336.0, 1161433.0, 102436.0, 22942.0, 7627.0, 2852.0, 1324.0, 597.0, 318.0, 170.0, 77.0, 33.0, 26.0, 18.0, 17.0, 10.0, 4.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.85498046875, -0.8069839477539062, -0.7589874267578125, -0.7109909057617188, -0.662994384765625, -0.6149978637695312, -0.5670013427734375, -0.5190048217773438, -0.47100830078125, -0.42301177978515625, -0.3750152587890625, -0.32701873779296875, -0.279022216796875, -0.23102569580078125, -0.1830291748046875, -0.13503265380859375, -0.0870361328125, -0.03903961181640625, 0.0089569091796875, 0.05695343017578125, 0.104949951171875, 0.15294647216796875, 0.2009429931640625, 0.24893951416015625, 0.29693603515625, 0.34493255615234375, 0.3929290771484375, 0.44092559814453125, 0.488922119140625, 0.5369186401367188, 0.5849151611328125, 0.6329116821289062, 0.680908203125, 0.7289047241210938, 0.7769012451171875, 0.8248977661132812, 0.872894287109375, 0.9208908081054688, 0.9688873291015625, 1.0168838500976562, 1.06488037109375, 1.1128768920898438, 1.1608734130859375, 1.2088699340820312, 1.256866455078125, 1.3048629760742188, 1.3528594970703125, 1.4008560180664062, 1.4488525390625, 1.4968490600585938, 1.5448455810546875, 1.5928421020507812, 1.640838623046875, 1.6888351440429688, 1.7368316650390625, 1.7848281860351562, 1.83282470703125, 1.8808212280273438, 1.9288177490234375, 1.9768142700195312, 2.024810791015625, 2.0728073120117188, 2.1208038330078125, 2.1688003540039062, 2.216796875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 2.0, 12.0, 20.0, 38.0, 54.0, 73.0, 97.0, 128.0, 141.0, 116.0, 109.0, 76.0, 55.0, 42.0, 16.0, 17.0, 13.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.7780609130859375, -0.711395263671875, -0.6447296142578125, -0.57806396484375, -0.5113983154296875, -0.444732666015625, -0.3780670166015625, -0.3114013671875, -0.2447357177734375, -0.178070068359375, -0.1114044189453125, -0.04473876953125, 0.0219268798828125, 0.088592529296875, 0.1552581787109375, 0.221923828125, 0.2885894775390625, 0.355255126953125, 0.4219207763671875, 0.48858642578125, 0.5552520751953125, 0.621917724609375, 0.6885833740234375, 0.7552490234375, 0.8219146728515625, 0.888580322265625, 0.9552459716796875, 1.02191162109375, 1.0885772705078125, 1.155242919921875, 1.2219085693359375, 1.28857421875, 1.3552398681640625, 1.421905517578125, 1.4885711669921875, 1.55523681640625, 1.6219024658203125, 1.688568115234375, 1.7552337646484375, 1.8218994140625, 1.8885650634765625, 1.955230712890625, 2.0218963623046875, 2.08856201171875, 2.1552276611328125, 2.221893310546875, 2.2885589599609375, 2.355224609375, 2.4218902587890625, 2.488555908203125, 2.5552215576171875, 2.62188720703125, 2.6885528564453125, 2.755218505859375, 2.8218841552734375, 2.8885498046875, 2.9552154541015625, 3.021881103515625, 3.0885467529296875, 3.15521240234375, 3.2218780517578125, 3.288543701171875, 3.3552093505859375, 3.421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 8.0, 14.0, 23.0, 27.0, 46.0, 89.0, 134.0, 255.0, 557.0, 1352.0, 3544.0, 10954.0, 43393.0, 287998.0, 3404462.0, 370387.0, 51505.0, 12910.0, 3985.0, 1384.0, 599.0, 259.0, 135.0, 84.0, 59.0, 40.0, 21.0, 16.0, 8.0, 7.0, 7.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.365234375, -2.29473876953125, -2.2242431640625, -2.15374755859375, -2.083251953125, -2.01275634765625, -1.9422607421875, -1.87176513671875, -1.80126953125, -1.73077392578125, -1.6602783203125, -1.58978271484375, -1.519287109375, -1.44879150390625, -1.3782958984375, -1.30780029296875, -1.2373046875, -1.16680908203125, -1.0963134765625, -1.02581787109375, -0.955322265625, -0.88482666015625, -0.8143310546875, -0.74383544921875, -0.67333984375, -0.60284423828125, -0.5323486328125, -0.46185302734375, -0.391357421875, -0.32086181640625, -0.2503662109375, -0.17987060546875, -0.109375, -0.03887939453125, 0.0316162109375, 0.10211181640625, 0.172607421875, 0.24310302734375, 0.3135986328125, 0.38409423828125, 0.45458984375, 0.52508544921875, 0.5955810546875, 0.66607666015625, 0.736572265625, 0.80706787109375, 0.8775634765625, 0.94805908203125, 1.0185546875, 1.08905029296875, 1.1595458984375, 1.23004150390625, 1.300537109375, 1.37103271484375, 1.4415283203125, 1.51202392578125, 1.58251953125, 1.65301513671875, 1.7235107421875, 1.79400634765625, 1.864501953125, 1.93499755859375, 2.0054931640625, 2.07598876953125, 2.146484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0, 2.0, 9.0, 11.0, 13.0, 14.0, 12.0, 17.0, 26.0, 31.0, 54.0, 57.0, 81.0, 126.0, 147.0, 253.0, 432.0, 612.0, 665.0, 504.0, 306.0, 172.0, 128.0, 96.0, 56.0, 46.0, 39.0, 29.0, 19.0, 20.0, 21.0, 11.0, 11.0, 13.0, 5.0, 7.0, 2.0, 8.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.05078125, -1.992645263671875, -1.93450927734375, -1.876373291015625, -1.8182373046875, -1.760101318359375, -1.70196533203125, -1.643829345703125, -1.585693359375, -1.527557373046875, -1.46942138671875, -1.411285400390625, -1.3531494140625, -1.295013427734375, -1.23687744140625, -1.178741455078125, -1.12060546875, -1.062469482421875, -1.00433349609375, -0.946197509765625, -0.8880615234375, -0.829925537109375, -0.77178955078125, -0.713653564453125, -0.655517578125, -0.597381591796875, -0.53924560546875, -0.481109619140625, -0.4229736328125, -0.364837646484375, -0.30670166015625, -0.248565673828125, -0.1904296875, -0.132293701171875, -0.07415771484375, -0.016021728515625, 0.0421142578125, 0.100250244140625, 0.15838623046875, 0.216522216796875, 0.274658203125, 0.332794189453125, 0.39093017578125, 0.449066162109375, 0.5072021484375, 0.565338134765625, 0.62347412109375, 0.681610107421875, 0.73974609375, 0.797882080078125, 0.85601806640625, 0.914154052734375, 0.9722900390625, 1.030426025390625, 1.08856201171875, 1.146697998046875, 1.204833984375, 1.262969970703125, 1.32110595703125, 1.379241943359375, 1.4373779296875, 1.495513916015625, 1.55364990234375, 1.611785888671875, 1.669921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 18.0, 49.0, 116.0, 193.0, 214.0, 172.0, 111.0, 41.0, 23.0, 16.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-31.580284118652344, -30.81976318359375, -30.059242248535156, -29.298721313476562, -28.53820037841797, -27.777679443359375, -27.01715850830078, -26.256637573242188, -25.496116638183594, -24.735595703125, -23.975074768066406, -23.214553833007812, -22.45403289794922, -21.693511962890625, -20.93299102783203, -20.172470092773438, -19.411951065063477, -18.651430130004883, -17.89090919494629, -17.130388259887695, -16.3698673248291, -15.609346389770508, -14.84882640838623, -14.088305473327637, -13.327784538269043, -12.56726360321045, -11.806742668151855, -11.046222686767578, -10.285701751708984, -9.52518081665039, -8.764659881591797, -8.004138946533203, -7.243618011474609, -6.483097076416016, -5.722576141357422, -4.962055683135986, -4.201534748077393, -3.441013813018799, -2.6804933547973633, -1.9199724197387695, -1.1594514846801758, -0.3989306688308716, 0.3615901470184326, 1.1221108436584473, 1.882631778717041, 2.6431527137756348, 3.4036731719970703, 4.164194107055664, 4.924715042114258, 5.685235977172852, 6.445756912231445, 7.206277370452881, 7.966798305511475, 8.727319717407227, 9.487839698791504, 10.248360633850098, 11.008881568908691, 11.769402503967285, 12.529923439025879, 13.290443420410156, 14.05096435546875, 14.811485290527344, 15.572006225585938, 16.33252716064453, 17.093048095703125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 15.0, 22.0, 21.0, 15.0, 24.0, 41.0, 33.0, 42.0, 34.0, 48.0, 41.0, 48.0, 50.0, 45.0, 52.0, 44.0, 51.0, 51.0, 34.0, 47.0, 41.0, 33.0, 20.0, 17.0, 28.0, 18.0, 9.0, 17.0, 10.0, 5.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.478168487548828, -11.137365341186523, -10.796563148498535, -10.45576000213623, -10.114957809448242, -9.774154663085938, -9.43335247039795, -9.092549324035645, -8.751747131347656, -8.410943984985352, -8.070141792297363, -7.729339122772217, -7.38853645324707, -7.047733783721924, -6.706931114196777, -6.366127967834473, -6.025325298309326, -5.68452262878418, -5.343719959259033, -5.002917289733887, -4.66211462020874, -4.321311950683594, -3.980509042739868, -3.6397063732147217, -3.298903703689575, -2.9581010341644287, -2.6172983646392822, -2.2764954566955566, -1.9356929063796997, -1.5948902368545532, -1.2540874481201172, -0.9132847785949707, -0.5724821090698242, -0.23167940974235535, 0.10912328958511353, 0.4499260187149048, 0.7907286882400513, 1.1315313577651978, 1.4723341464996338, 1.8131368160247803, 2.1539394855499268, 2.4947421550750732, 2.8355448246002197, 3.1763477325439453, 3.517150402069092, 3.8579530715942383, 4.198755741119385, 4.539558410644531, 4.880361080169678, 5.221163749694824, 5.561966419219971, 5.902769088745117, 6.243571758270264, 6.58437442779541, 6.925177574157715, 7.265979766845703, 7.606782913208008, 7.947585582733154, 8.2883882522583, 8.629191398620605, 8.969993591308594, 9.310796737670898, 9.651598930358887, 9.992402076721191, 10.33320426940918]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 7.0, 5.0, 8.0, 21.0, 13.0, 33.0, 64.0, 84.0, 174.0, 321.0, 641.0, 1426.0, 3627.0, 9617.0, 28351.0, 86737.0, 264087.0, 406790.0, 164965.0, 53396.0, 17473.0, 6184.0, 2441.0, 1041.0, 474.0, 238.0, 137.0, 63.0, 47.0, 25.0, 17.0, 11.0, 9.0, 8.0, 8.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.203125, -2.14068603515625, -2.0782470703125, -2.01580810546875, -1.953369140625, -1.89093017578125, -1.8284912109375, -1.76605224609375, -1.70361328125, -1.64117431640625, -1.5787353515625, -1.51629638671875, -1.453857421875, -1.39141845703125, -1.3289794921875, -1.26654052734375, -1.2041015625, -1.14166259765625, -1.0792236328125, -1.01678466796875, -0.954345703125, -0.89190673828125, -0.8294677734375, -0.76702880859375, -0.70458984375, -0.64215087890625, -0.5797119140625, -0.51727294921875, -0.454833984375, -0.39239501953125, -0.3299560546875, -0.26751708984375, -0.205078125, -0.14263916015625, -0.0802001953125, -0.01776123046875, 0.044677734375, 0.10711669921875, 0.1695556640625, 0.23199462890625, 0.29443359375, 0.35687255859375, 0.4193115234375, 0.48175048828125, 0.544189453125, 0.60662841796875, 0.6690673828125, 0.73150634765625, 0.7939453125, 0.85638427734375, 0.9188232421875, 0.98126220703125, 1.043701171875, 1.10614013671875, 1.1685791015625, 1.23101806640625, 1.29345703125, 1.35589599609375, 1.4183349609375, 1.48077392578125, 1.543212890625, 1.60565185546875, 1.6680908203125, 1.73052978515625, 1.79296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 12.0, 21.0, 34.0, 51.0, 51.0, 76.0, 88.0, 84.0, 100.0, 85.0, 100.0, 76.0, 54.0, 42.0, 29.0, 29.0, 27.0, 16.0, 5.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77099609375, -0.7218093872070312, -0.6726226806640625, -0.6234359741210938, -0.574249267578125, -0.5250625610351562, -0.4758758544921875, -0.42668914794921875, -0.37750244140625, -0.32831573486328125, -0.2791290283203125, -0.22994232177734375, -0.180755615234375, -0.13156890869140625, -0.0823822021484375, -0.03319549560546875, 0.0159912109375, 0.06517791748046875, 0.1143646240234375, 0.16355133056640625, 0.212738037109375, 0.26192474365234375, 0.3111114501953125, 0.36029815673828125, 0.40948486328125, 0.45867156982421875, 0.5078582763671875, 0.5570449829101562, 0.606231689453125, 0.6554183959960938, 0.7046051025390625, 0.7537918090820312, 0.802978515625, 0.8521652221679688, 0.9013519287109375, 0.9505386352539062, 0.999725341796875, 1.0489120483398438, 1.0980987548828125, 1.1472854614257812, 1.19647216796875, 1.2456588745117188, 1.2948455810546875, 1.3440322875976562, 1.393218994140625, 1.4424057006835938, 1.4915924072265625, 1.5407791137695312, 1.5899658203125, 1.6391525268554688, 1.6883392333984375, 1.7375259399414062, 1.786712646484375, 1.8358993530273438, 1.8850860595703125, 1.9342727661132812, 1.98345947265625, 2.0326461791992188, 2.0818328857421875, 2.1310195922851562, 2.180206298828125, 2.2293930053710938, 2.2785797119140625, 2.3277664184570312, 2.376953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 9.0, 10.0, 13.0, 17.0, 23.0, 29.0, 48.0, 75.0, 101.0, 186.0, 254.0, 427.0, 731.0, 1283.0, 2716.0, 7987.0, 45481.0, 571413.0, 368546.0, 36856.0, 6942.0, 2417.0, 1221.0, 666.0, 416.0, 256.0, 151.0, 92.0, 66.0, 50.0, 27.0, 18.0, 14.0, 11.0, 4.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.361328125, -3.252716064453125, -3.14410400390625, -3.035491943359375, -2.9268798828125, -2.818267822265625, -2.70965576171875, -2.601043701171875, -2.492431640625, -2.383819580078125, -2.27520751953125, -2.166595458984375, -2.0579833984375, -1.949371337890625, -1.84075927734375, -1.732147216796875, -1.62353515625, -1.514923095703125, -1.40631103515625, -1.297698974609375, -1.1890869140625, -1.080474853515625, -0.97186279296875, -0.863250732421875, -0.754638671875, -0.646026611328125, -0.53741455078125, -0.428802490234375, -0.3201904296875, -0.211578369140625, -0.10296630859375, 0.005645751953125, 0.1142578125, 0.222869873046875, 0.33148193359375, 0.440093994140625, 0.5487060546875, 0.657318115234375, 0.76593017578125, 0.874542236328125, 0.983154296875, 1.091766357421875, 1.20037841796875, 1.308990478515625, 1.4176025390625, 1.526214599609375, 1.63482666015625, 1.743438720703125, 1.85205078125, 1.960662841796875, 2.06927490234375, 2.177886962890625, 2.2864990234375, 2.395111083984375, 2.50372314453125, 2.612335205078125, 2.720947265625, 2.829559326171875, 2.93817138671875, 3.046783447265625, 3.1553955078125, 3.264007568359375, 3.37261962890625, 3.481231689453125, 3.58984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 9.0, 7.0, 6.0, 9.0, 23.0, 12.0, 17.0, 25.0, 26.0, 20.0, 30.0, 33.0, 39.0, 41.0, 40.0, 39.0, 54.0, 47.0, 66.0, 48.0, 57.0, 51.0, 49.0, 44.0, 37.0, 27.0, 27.0, 21.0, 17.0, 18.0, 16.0, 12.0, 10.0, 6.0, 5.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.26171875, -4.147064208984375, -4.03240966796875, -3.917755126953125, -3.8031005859375, -3.688446044921875, -3.57379150390625, -3.459136962890625, -3.344482421875, -3.229827880859375, -3.11517333984375, -3.000518798828125, -2.8858642578125, -2.771209716796875, -2.65655517578125, -2.541900634765625, -2.42724609375, -2.312591552734375, -2.19793701171875, -2.083282470703125, -1.9686279296875, -1.853973388671875, -1.73931884765625, -1.624664306640625, -1.510009765625, -1.395355224609375, -1.28070068359375, -1.166046142578125, -1.0513916015625, -0.936737060546875, -0.82208251953125, -0.707427978515625, -0.5927734375, -0.478118896484375, -0.36346435546875, -0.248809814453125, -0.1341552734375, -0.019500732421875, 0.09515380859375, 0.209808349609375, 0.324462890625, 0.439117431640625, 0.55377197265625, 0.668426513671875, 0.7830810546875, 0.897735595703125, 1.01239013671875, 1.127044677734375, 1.24169921875, 1.356353759765625, 1.47100830078125, 1.585662841796875, 1.7003173828125, 1.814971923828125, 1.92962646484375, 2.044281005859375, 2.158935546875, 2.273590087890625, 2.38824462890625, 2.502899169921875, 2.6175537109375, 2.732208251953125, 2.84686279296875, 2.961517333984375, 3.076171875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 8.0, 10.0, 22.0, 21.0, 25.0, 71.0, 100.0, 229.0, 516.0, 1386.0, 4948.0, 32447.0, 669582.0, 311970.0, 21460.0, 3771.0, 1038.0, 478.0, 219.0, 104.0, 53.0, 28.0, 18.0, 14.0, 14.0, 6.0, 5.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.281768798828125, -1.24029541015625, -1.198822021484375, -1.1573486328125, -1.115875244140625, -1.07440185546875, -1.032928466796875, -0.991455078125, -0.949981689453125, -0.90850830078125, -0.867034912109375, -0.8255615234375, -0.784088134765625, -0.74261474609375, -0.701141357421875, -0.65966796875, -0.618194580078125, -0.57672119140625, -0.535247802734375, -0.4937744140625, -0.452301025390625, -0.41082763671875, -0.369354248046875, -0.327880859375, -0.286407470703125, -0.24493408203125, -0.203460693359375, -0.1619873046875, -0.120513916015625, -0.07904052734375, -0.037567138671875, 0.00390625, 0.045379638671875, 0.08685302734375, 0.128326416015625, 0.1697998046875, 0.211273193359375, 0.25274658203125, 0.294219970703125, 0.335693359375, 0.377166748046875, 0.41864013671875, 0.460113525390625, 0.5015869140625, 0.543060302734375, 0.58453369140625, 0.626007080078125, 0.66748046875, 0.708953857421875, 0.75042724609375, 0.791900634765625, 0.8333740234375, 0.874847412109375, 0.91632080078125, 0.957794189453125, 0.999267578125, 1.040740966796875, 1.08221435546875, 1.123687744140625, 1.1651611328125, 1.206634521484375, 1.24810791015625, 1.289581298828125, 1.3310546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 17.0, 14.0, 14.0, 25.0, 30.0, 33.0, 33.0, 45.0, 43.0, 60.0, 86.0, 97.0, 115.0, 80.0, 64.0, 50.0, 35.0, 32.0, 22.0, 21.0, 20.0, 12.0, 8.0, 5.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019812583923339844, -0.00019183196127414703, -0.00018553808331489563, -0.00017924420535564423, -0.00017295032739639282, -0.00016665644943714142, -0.00016036257147789001, -0.0001540686935186386, -0.0001477748155593872, -0.0001414809376001358, -0.0001351870596408844, -0.000128893181681633, -0.0001225993037223816, -0.00011630542576313019, -0.00011001154780387878, -0.00010371766984462738, -9.742379188537598e-05, -9.112991392612457e-05, -8.483603596687317e-05, -7.854215800762177e-05, -7.224828004837036e-05, -6.595440208911896e-05, -5.9660524129867554e-05, -5.336664617061615e-05, -4.7072768211364746e-05, -4.077889025211334e-05, -3.448501229286194e-05, -2.8191134333610535e-05, -2.189725637435913e-05, -1.5603378415107727e-05, -9.309500455856323e-06, -3.0156224966049194e-06, 3.2782554626464844e-06, 9.572133421897888e-06, 1.5866011381149292e-05, 2.2159889340400696e-05, 2.84537672996521e-05, 3.4747645258903503e-05, 4.104152321815491e-05, 4.733540117740631e-05, 5.3629279136657715e-05, 5.992315709590912e-05, 6.621703505516052e-05, 7.251091301441193e-05, 7.880479097366333e-05, 8.509866893291473e-05, 9.139254689216614e-05, 9.768642485141754e-05, 0.00010398030281066895, 0.00011027418076992035, 0.00011656805872917175, 0.00012286193668842316, 0.00012915581464767456, 0.00013544969260692596, 0.00014174357056617737, 0.00014803744852542877, 0.00015433132648468018, 0.00016062520444393158, 0.00016691908240318298, 0.0001732129603624344, 0.0001795068383216858, 0.0001858007162809372, 0.0001920945942401886, 0.00019838847219944, 0.0002046823501586914]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 13.0, 16.0, 18.0, 26.0, 46.0, 52.0, 88.0, 142.0, 208.0, 393.0, 641.0, 1216.0, 2767.0, 8675.0, 42972.0, 536250.0, 401098.0, 40143.0, 8356.0, 2769.0, 1142.0, 597.0, 313.0, 203.0, 108.0, 72.0, 57.0, 44.0, 37.0, 18.0, 13.0, 13.0, 5.0, 8.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.84130859375, -0.8122787475585938, -0.7832489013671875, -0.7542190551757812, -0.725189208984375, -0.6961593627929688, -0.6671295166015625, -0.6380996704101562, -0.60906982421875, -0.5800399780273438, -0.5510101318359375, -0.5219802856445312, -0.492950439453125, -0.46392059326171875, -0.4348907470703125, -0.40586090087890625, -0.3768310546875, -0.34780120849609375, -0.3187713623046875, -0.28974151611328125, -0.260711669921875, -0.23168182373046875, -0.2026519775390625, -0.17362213134765625, -0.14459228515625, -0.11556243896484375, -0.0865325927734375, -0.05750274658203125, -0.028472900390625, 0.00055694580078125, 0.0295867919921875, 0.05861663818359375, 0.087646484375, 0.11667633056640625, 0.1457061767578125, 0.17473602294921875, 0.203765869140625, 0.23279571533203125, 0.2618255615234375, 0.29085540771484375, 0.31988525390625, 0.34891510009765625, 0.3779449462890625, 0.40697479248046875, 0.436004638671875, 0.46503448486328125, 0.4940643310546875, 0.5230941772460938, 0.5521240234375, 0.5811538696289062, 0.6101837158203125, 0.6392135620117188, 0.668243408203125, 0.6972732543945312, 0.7263031005859375, 0.7553329467773438, 0.78436279296875, 0.8133926391601562, 0.8424224853515625, 0.8714523315429688, 0.900482177734375, 0.9295120239257812, 0.9585418701171875, 0.9875717163085938, 1.0166015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 10.0, 8.0, 16.0, 20.0, 23.0, 30.0, 50.0, 41.0, 72.0, 72.0, 105.0, 117.0, 96.0, 90.0, 58.0, 46.0, 39.0, 26.0, 20.0, 13.0, 13.0, 9.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4248046875, -1.3896102905273438, -1.3544158935546875, -1.3192214965820312, -1.284027099609375, -1.2488327026367188, -1.2136383056640625, -1.1784439086914062, -1.14324951171875, -1.1080551147460938, -1.0728607177734375, -1.0376663208007812, -1.002471923828125, -0.9672775268554688, -0.9320831298828125, -0.8968887329101562, -0.8616943359375, -0.8264999389648438, -0.7913055419921875, -0.7561111450195312, -0.720916748046875, -0.6857223510742188, -0.6505279541015625, -0.6153335571289062, -0.58013916015625, -0.5449447631835938, -0.5097503662109375, -0.47455596923828125, -0.439361572265625, -0.40416717529296875, -0.3689727783203125, -0.33377838134765625, -0.298583984375, -0.26338958740234375, -0.2281951904296875, -0.19300079345703125, -0.157806396484375, -0.12261199951171875, -0.0874176025390625, -0.05222320556640625, -0.01702880859375, 0.01816558837890625, 0.0533599853515625, 0.08855438232421875, 0.123748779296875, 0.15894317626953125, 0.1941375732421875, 0.22933197021484375, 0.2645263671875, 0.29972076416015625, 0.3349151611328125, 0.37010955810546875, 0.405303955078125, 0.44049835205078125, 0.4756927490234375, 0.5108871459960938, 0.54608154296875, 0.5812759399414062, 0.6164703369140625, 0.6516647338867188, 0.686859130859375, 0.7220535278320312, 0.7572479248046875, 0.7924423217773438, 0.82763671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 10.0, 25.0, 41.0, 97.0, 192.0, 289.0, 180.0, 84.0, 40.0, 14.0, 6.0, 3.0, 9.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.92029571533203, -37.045204162597656, -36.17011642456055, -35.29502487182617, -34.41993713378906, -33.54484558105469, -32.66975402832031, -31.794666290283203, -30.919574737548828, -30.044485092163086, -29.169395446777344, -28.29430389404297, -27.419214248657227, -26.544124603271484, -25.669034957885742, -24.7939453125, -23.918855667114258, -23.043766021728516, -22.168676376342773, -21.29358673095703, -20.418495178222656, -19.543405532836914, -18.668315887451172, -17.79322624206543, -16.918136596679688, -16.043046951293945, -15.167956352233887, -14.292866706848145, -13.417776107788086, -12.542686462402344, -11.667596817016602, -10.79250717163086, -9.917417526245117, -9.042327880859375, -8.167237281799316, -7.292147636413574, -6.417057514190674, -5.541967391967773, -4.666877746582031, -3.791787624359131, -2.9166975021362305, -2.04160737991333, -1.1665174961090088, -0.2914276123046875, 0.5836625099182129, 1.4587526321411133, 2.3338422775268555, 3.208932399749756, 4.084022521972656, 4.959112644195557, 5.834202766418457, 6.709292411804199, 7.5843825340271, 8.45947265625, 9.334562301635742, 10.209651947021484, 11.084742546081543, 11.959832191467285, 12.834922790527344, 13.710012435913086, 14.585102081298828, 15.460192680358887, 16.335281372070312, 17.210372924804688, 18.08546257019043]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 9.0, 12.0, 6.0, 10.0, 14.0, 17.0, 23.0, 20.0, 26.0, 19.0, 31.0, 24.0, 33.0, 44.0, 45.0, 58.0, 58.0, 69.0, 71.0, 62.0, 43.0, 42.0, 35.0, 31.0, 30.0, 24.0, 26.0, 22.0, 12.0, 18.0, 18.0, 10.0, 4.0, 8.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.888710975646973, -12.457301139831543, -12.02589225769043, -11.594482421875, -11.16307258605957, -10.73166275024414, -10.300252914428711, -9.868844032287598, -9.437434196472168, -9.006024360656738, -8.574615478515625, -8.143205642700195, -7.711795806884766, -7.280385971069336, -6.8489766120910645, -6.417567253112793, -5.986157417297363, -5.554747581481934, -5.123338222503662, -4.691928863525391, -4.260519027709961, -3.8291094303131104, -3.3976998329162598, -2.966290235519409, -2.5348806381225586, -2.103471040725708, -1.6720614433288574, -1.2406518459320068, -0.8092422485351562, -0.37783265113830566, 0.05357694625854492, 0.4849865436553955, 0.9163951873779297, 1.3478047847747803, 1.7792143821716309, 2.2106239795684814, 2.642033576965332, 3.0734431743621826, 3.504852771759033, 3.936262369155884, 4.367671966552734, 4.799081802368164, 5.2304911613464355, 5.661900520324707, 6.093310356140137, 6.524720191955566, 6.956129550933838, 7.387538909912109, 7.818948745727539, 8.250358581542969, 8.681768417358398, 9.113177299499512, 9.544587135314941, 9.975996971130371, 10.407405853271484, 10.838815689086914, 11.270225524902344, 11.701635360717773, 12.133045196533203, 12.564454078674316, 12.995863914489746, 13.427273750305176, 13.858682632446289, 14.290092468261719, 14.721502304077148]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 16.0, 20.0, 24.0, 25.0, 45.0, 94.0, 158.0, 241.0, 485.0, 958.0, 2032.0, 4491.0, 10132.0, 26980.0, 89324.0, 477701.0, 2426237.0, 949897.0, 144556.0, 36879.0, 13305.0, 5555.0, 2472.0, 1238.0, 547.0, 305.0, 214.0, 110.0, 85.0, 37.0, 36.0, 18.0, 10.0, 20.0, 4.0, 6.0, 6.0, 3.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8154296875, -0.783660888671875, -0.75189208984375, -0.720123291015625, -0.6883544921875, -0.656585693359375, -0.62481689453125, -0.593048095703125, -0.561279296875, -0.529510498046875, -0.49774169921875, -0.465972900390625, -0.4342041015625, -0.402435302734375, -0.37066650390625, -0.338897705078125, -0.30712890625, -0.275360107421875, -0.24359130859375, -0.211822509765625, -0.1800537109375, -0.148284912109375, -0.11651611328125, -0.084747314453125, -0.052978515625, -0.021209716796875, 0.01055908203125, 0.042327880859375, 0.0740966796875, 0.105865478515625, 0.13763427734375, 0.169403076171875, 0.201171875, 0.232940673828125, 0.26470947265625, 0.296478271484375, 0.3282470703125, 0.360015869140625, 0.39178466796875, 0.423553466796875, 0.455322265625, 0.487091064453125, 0.51885986328125, 0.550628662109375, 0.5823974609375, 0.614166259765625, 0.64593505859375, 0.677703857421875, 0.70947265625, 0.741241455078125, 0.77301025390625, 0.804779052734375, 0.8365478515625, 0.868316650390625, 0.90008544921875, 0.931854248046875, 0.963623046875, 0.995391845703125, 1.02716064453125, 1.058929443359375, 1.0906982421875, 1.122467041015625, 1.15423583984375, 1.186004638671875, 1.2177734375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 13.0, 21.0, 24.0, 24.0, 42.0, 33.0, 56.0, 53.0, 78.0, 69.0, 71.0, 84.0, 56.0, 85.0, 61.0, 52.0, 43.0, 33.0, 25.0, 26.0, 15.0, 13.0, 11.0, 8.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.6947860717773438, -0.6566619873046875, -0.6185379028320312, -0.580413818359375, -0.5422897338867188, -0.5041656494140625, -0.46604156494140625, -0.42791748046875, -0.38979339599609375, -0.3516693115234375, -0.31354522705078125, -0.275421142578125, -0.23729705810546875, -0.1991729736328125, -0.16104888916015625, -0.1229248046875, -0.08480072021484375, -0.0466766357421875, -0.00855255126953125, 0.029571533203125, 0.06769561767578125, 0.1058197021484375, 0.14394378662109375, 0.18206787109375, 0.22019195556640625, 0.2583160400390625, 0.29644012451171875, 0.334564208984375, 0.37268829345703125, 0.4108123779296875, 0.44893646240234375, 0.487060546875, 0.5251846313476562, 0.5633087158203125, 0.6014328002929688, 0.639556884765625, 0.6776809692382812, 0.7158050537109375, 0.7539291381835938, 0.79205322265625, 0.8301773071289062, 0.8683013916015625, 0.9064254760742188, 0.944549560546875, 0.9826736450195312, 1.0207977294921875, 1.0589218139648438, 1.0970458984375, 1.1351699829101562, 1.1732940673828125, 1.2114181518554688, 1.249542236328125, 1.2876663208007812, 1.3257904052734375, 1.3639144897460938, 1.40203857421875, 1.4401626586914062, 1.4782867431640625, 1.5164108276367188, 1.554534912109375, 1.5926589965820312, 1.6307830810546875, 1.6689071655273438, 1.70703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 1.0, 10.0, 8.0, 14.0, 39.0, 54.0, 62.0, 107.0, 168.0, 314.0, 576.0, 1274.0, 3093.0, 9739.0, 40062.0, 276098.0, 3371719.0, 421601.0, 51465.0, 11668.0, 3495.0, 1329.0, 652.0, 310.0, 181.0, 96.0, 50.0, 36.0, 13.0, 8.0, 12.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7158203125, -1.657806396484375, -1.59979248046875, -1.541778564453125, -1.4837646484375, -1.425750732421875, -1.36773681640625, -1.309722900390625, -1.251708984375, -1.193695068359375, -1.13568115234375, -1.077667236328125, -1.0196533203125, -0.961639404296875, -0.90362548828125, -0.845611572265625, -0.78759765625, -0.729583740234375, -0.67156982421875, -0.613555908203125, -0.5555419921875, -0.497528076171875, -0.43951416015625, -0.381500244140625, -0.323486328125, -0.265472412109375, -0.20745849609375, -0.149444580078125, -0.0914306640625, -0.033416748046875, 0.02459716796875, 0.082611083984375, 0.140625, 0.198638916015625, 0.25665283203125, 0.314666748046875, 0.3726806640625, 0.430694580078125, 0.48870849609375, 0.546722412109375, 0.604736328125, 0.662750244140625, 0.72076416015625, 0.778778076171875, 0.8367919921875, 0.894805908203125, 0.95281982421875, 1.010833740234375, 1.06884765625, 1.126861572265625, 1.18487548828125, 1.242889404296875, 1.3009033203125, 1.358917236328125, 1.41693115234375, 1.474945068359375, 1.532958984375, 1.590972900390625, 1.64898681640625, 1.707000732421875, 1.7650146484375, 1.823028564453125, 1.88104248046875, 1.939056396484375, 1.9970703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 10.0, 14.0, 23.0, 33.0, 45.0, 55.0, 92.0, 155.0, 339.0, 604.0, 983.0, 783.0, 396.0, 189.0, 117.0, 63.0, 44.0, 28.0, 33.0, 18.0, 14.0, 10.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.69769287109375, -2.6219482421875, -2.54620361328125, -2.470458984375, -2.39471435546875, -2.3189697265625, -2.24322509765625, -2.16748046875, -2.09173583984375, -2.0159912109375, -1.94024658203125, -1.864501953125, -1.78875732421875, -1.7130126953125, -1.63726806640625, -1.5615234375, -1.48577880859375, -1.4100341796875, -1.33428955078125, -1.258544921875, -1.18280029296875, -1.1070556640625, -1.03131103515625, -0.95556640625, -0.87982177734375, -0.8040771484375, -0.72833251953125, -0.652587890625, -0.57684326171875, -0.5010986328125, -0.42535400390625, -0.349609375, -0.27386474609375, -0.1981201171875, -0.12237548828125, -0.046630859375, 0.02911376953125, 0.1048583984375, 0.18060302734375, 0.25634765625, 0.33209228515625, 0.4078369140625, 0.48358154296875, 0.559326171875, 0.63507080078125, 0.7108154296875, 0.78656005859375, 0.8623046875, 0.93804931640625, 1.0137939453125, 1.08953857421875, 1.165283203125, 1.24102783203125, 1.3167724609375, 1.39251708984375, 1.46826171875, 1.54400634765625, 1.6197509765625, 1.69549560546875, 1.771240234375, 1.84698486328125, 1.9227294921875, 1.99847412109375, 2.07421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 24.0, 85.0, 179.0, 262.0, 204.0, 127.0, 58.0, 19.0, 9.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.72513198852539, -17.968921661376953, -17.21271324157715, -16.45650291442871, -15.700294494628906, -14.944084167480469, -14.187874794006348, -13.431665420532227, -12.675456047058105, -11.919246673583984, -11.163037300109863, -10.406827926635742, -9.650617599487305, -8.8944091796875, -8.138198852539062, -7.381989479064941, -6.62578010559082, -5.869570732116699, -5.113361358642578, -4.357151508331299, -3.6009421348571777, -2.8447327613830566, -2.0885229110717773, -1.3323135375976562, -0.5761041641235352, 0.1801053285598755, 0.9363148212432861, 1.6925244331359863, 2.4487338066101074, 3.2049431800842285, 3.961153030395508, 4.717362403869629, 5.47357177734375, 6.229781150817871, 6.985990524291992, 7.7422003746032715, 8.498409271240234, 9.254619598388672, 10.010828971862793, 10.767038345336914, 11.523247718811035, 12.279457092285156, 13.035666465759277, 13.791875839233398, 14.548086166381836, 15.30429458618164, 16.060504913330078, 16.816715240478516, 17.57292366027832, 18.329133987426758, 19.085342407226562, 19.841552734375, 20.597761154174805, 21.353971481323242, 22.110179901123047, 22.866390228271484, 23.622600555419922, 24.37881088256836, 25.135019302368164, 25.8912296295166, 26.647438049316406, 27.403648376464844, 28.15985870361328, 28.916067123413086, 29.67227554321289]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 14.0, 22.0, 22.0, 30.0, 13.0, 25.0, 28.0, 37.0, 36.0, 35.0, 43.0, 51.0, 65.0, 44.0, 50.0, 49.0, 56.0, 40.0, 41.0, 48.0, 34.0, 27.0, 25.0, 28.0, 22.0, 18.0, 12.0, 16.0, 8.0, 5.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.177300453186035, -10.868707656860352, -10.560114860534668, -10.251522064208984, -9.9429292678833, -9.634336471557617, -9.32574462890625, -9.017151832580566, -8.708559036254883, -8.3999662399292, -8.091373443603516, -7.782780647277832, -7.474188327789307, -7.165595531463623, -6.8570027351379395, -6.548410415649414, -6.239817142486572, -5.931224346160889, -5.622631549835205, -5.31403923034668, -5.005446434020996, -4.6968536376953125, -4.388260841369629, -4.079668045043945, -3.771075487136841, -3.4624826908111572, -3.1538901329040527, -2.845297336578369, -2.5367045402526855, -2.228111982345581, -1.9195191860198975, -1.610926628112793, -1.3023338317871094, -0.9937411546707153, -0.6851484179496765, -0.3765556812286377, -0.06796300411224365, 0.2406296730041504, 0.549222469329834, 0.8578150272369385, 1.166407823562622, 1.4750005006790161, 1.7835931777954102, 2.0921859741210938, 2.4007787704467773, 2.709371328353882, 3.0179641246795654, 3.32655668258667, 3.6351494789123535, 3.943742275238037, 4.252335071563721, 4.560927391052246, 4.86952018737793, 5.178112983703613, 5.486705780029297, 5.7952985763549805, 6.103891372680664, 6.412484169006348, 6.721076965332031, 7.029669761657715, 7.33826208114624, 7.646854877471924, 7.955447673797607, 8.264039993286133, 8.572632789611816]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 12.0, 15.0, 32.0, 32.0, 43.0, 63.0, 103.0, 159.0, 222.0, 345.0, 484.0, 712.0, 1168.0, 1704.0, 2983.0, 5153.0, 9270.0, 17337.0, 33627.0, 66909.0, 137550.0, 254224.0, 248897.0, 132060.0, 64629.0, 32186.0, 16674.0, 8987.0, 5018.0, 2861.0, 1702.0, 1160.0, 728.0, 495.0, 305.0, 209.0, 146.0, 109.0, 83.0, 48.0, 44.0, 21.0, 5.0, 7.0, 8.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0537109375, -1.0185546875, -0.9833984375, -0.9482421875, -0.9130859375, -0.8779296875, -0.8427734375, -0.8076171875, -0.7724609375, -0.7373046875, -0.7021484375, -0.6669921875, -0.6318359375, -0.5966796875, -0.5615234375, -0.5263671875, -0.4912109375, -0.4560546875, -0.4208984375, -0.3857421875, -0.3505859375, -0.3154296875, -0.2802734375, -0.2451171875, -0.2099609375, -0.1748046875, -0.1396484375, -0.1044921875, -0.0693359375, -0.0341796875, 0.0009765625, 0.0361328125, 0.0712890625, 0.1064453125, 0.1416015625, 0.1767578125, 0.2119140625, 0.2470703125, 0.2822265625, 0.3173828125, 0.3525390625, 0.3876953125, 0.4228515625, 0.4580078125, 0.4931640625, 0.5283203125, 0.5634765625, 0.5986328125, 0.6337890625, 0.6689453125, 0.7041015625, 0.7392578125, 0.7744140625, 0.8095703125, 0.8447265625, 0.8798828125, 0.9150390625, 0.9501953125, 0.9853515625, 1.0205078125, 1.0556640625, 1.0908203125, 1.1259765625, 1.1611328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 8.0, 9.0, 11.0, 15.0, 14.0, 24.0, 30.0, 28.0, 19.0, 36.0, 43.0, 30.0, 45.0, 59.0, 41.0, 56.0, 54.0, 51.0, 50.0, 35.0, 37.0, 50.0, 47.0, 24.0, 28.0, 22.0, 23.0, 21.0, 13.0, 14.0, 16.0, 15.0, 6.0, 8.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.703094482421875, -0.67767333984375, -0.652252197265625, -0.6268310546875, -0.601409912109375, -0.57598876953125, -0.550567626953125, -0.525146484375, -0.499725341796875, -0.47430419921875, -0.448883056640625, -0.4234619140625, -0.398040771484375, -0.37261962890625, -0.347198486328125, -0.32177734375, -0.296356201171875, -0.27093505859375, -0.245513916015625, -0.2200927734375, -0.194671630859375, -0.16925048828125, -0.143829345703125, -0.118408203125, -0.092987060546875, -0.06756591796875, -0.042144775390625, -0.0167236328125, 0.008697509765625, 0.03411865234375, 0.059539794921875, 0.0849609375, 0.110382080078125, 0.13580322265625, 0.161224365234375, 0.1866455078125, 0.212066650390625, 0.23748779296875, 0.262908935546875, 0.288330078125, 0.313751220703125, 0.33917236328125, 0.364593505859375, 0.3900146484375, 0.415435791015625, 0.44085693359375, 0.466278076171875, 0.49169921875, 0.517120361328125, 0.54254150390625, 0.567962646484375, 0.5933837890625, 0.618804931640625, 0.64422607421875, 0.669647216796875, 0.695068359375, 0.720489501953125, 0.74591064453125, 0.771331787109375, 0.7967529296875, 0.822174072265625, 0.84759521484375, 0.873016357421875, 0.8984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 17.0, 11.0, 27.0, 31.0, 43.0, 64.0, 87.0, 123.0, 213.0, 323.0, 469.0, 765.0, 1460.0, 3537.0, 11727.0, 69582.0, 647388.0, 266089.0, 33926.0, 7151.0, 2489.0, 1221.0, 646.0, 390.0, 227.0, 140.0, 110.0, 63.0, 49.0, 49.0, 32.0, 21.0, 11.0, 14.0, 9.0, 10.0, 2.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.055328369140625, -2.96221923828125, -2.869110107421875, -2.7760009765625, -2.682891845703125, -2.58978271484375, -2.496673583984375, -2.403564453125, -2.310455322265625, -2.21734619140625, -2.124237060546875, -2.0311279296875, -1.938018798828125, -1.84490966796875, -1.751800537109375, -1.65869140625, -1.565582275390625, -1.47247314453125, -1.379364013671875, -1.2862548828125, -1.193145751953125, -1.10003662109375, -1.006927490234375, -0.913818359375, -0.820709228515625, -0.72760009765625, -0.634490966796875, -0.5413818359375, -0.448272705078125, -0.35516357421875, -0.262054443359375, -0.1689453125, -0.075836181640625, 0.01727294921875, 0.110382080078125, 0.2034912109375, 0.296600341796875, 0.38970947265625, 0.482818603515625, 0.575927734375, 0.669036865234375, 0.76214599609375, 0.855255126953125, 0.9483642578125, 1.041473388671875, 1.13458251953125, 1.227691650390625, 1.32080078125, 1.413909912109375, 1.50701904296875, 1.600128173828125, 1.6932373046875, 1.786346435546875, 1.87945556640625, 1.972564697265625, 2.065673828125, 2.158782958984375, 2.25189208984375, 2.345001220703125, 2.4381103515625, 2.531219482421875, 2.62432861328125, 2.717437744140625, 2.810546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 6.0, 11.0, 8.0, 8.0, 18.0, 13.0, 15.0, 21.0, 13.0, 22.0, 27.0, 24.0, 38.0, 33.0, 38.0, 51.0, 35.0, 37.0, 44.0, 53.0, 47.0, 51.0, 43.0, 50.0, 28.0, 31.0, 31.0, 36.0, 35.0, 18.0, 18.0, 21.0, 9.0, 12.0, 6.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.884765625, -2.795745849609375, -2.70672607421875, -2.617706298828125, -2.5286865234375, -2.439666748046875, -2.35064697265625, -2.261627197265625, -2.172607421875, -2.083587646484375, -1.99456787109375, -1.905548095703125, -1.8165283203125, -1.727508544921875, -1.63848876953125, -1.549468994140625, -1.46044921875, -1.371429443359375, -1.28240966796875, -1.193389892578125, -1.1043701171875, -1.015350341796875, -0.92633056640625, -0.837310791015625, -0.748291015625, -0.659271240234375, -0.57025146484375, -0.481231689453125, -0.3922119140625, -0.303192138671875, -0.21417236328125, -0.125152587890625, -0.0361328125, 0.052886962890625, 0.14190673828125, 0.230926513671875, 0.3199462890625, 0.408966064453125, 0.49798583984375, 0.587005615234375, 0.676025390625, 0.765045166015625, 0.85406494140625, 0.943084716796875, 1.0321044921875, 1.121124267578125, 1.21014404296875, 1.299163818359375, 1.38818359375, 1.477203369140625, 1.56622314453125, 1.655242919921875, 1.7442626953125, 1.833282470703125, 1.92230224609375, 2.011322021484375, 2.100341796875, 2.189361572265625, 2.27838134765625, 2.367401123046875, 2.4564208984375, 2.545440673828125, 2.63446044921875, 2.723480224609375, 2.8125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 9.0, 11.0, 12.0, 25.0, 33.0, 26.0, 59.0, 90.0, 193.0, 379.0, 863.0, 2259.0, 9281.0, 73025.0, 778609.0, 161874.0, 16230.0, 3508.0, 1122.0, 410.0, 214.0, 111.0, 73.0, 34.0, 24.0, 19.0, 10.0, 6.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1240234375, -1.0906219482421875, -1.057220458984375, -1.0238189697265625, -0.99041748046875, -0.9570159912109375, -0.923614501953125, -0.8902130126953125, -0.8568115234375, -0.8234100341796875, -0.790008544921875, -0.7566070556640625, -0.72320556640625, -0.6898040771484375, -0.656402587890625, -0.6230010986328125, -0.589599609375, -0.5561981201171875, -0.522796630859375, -0.4893951416015625, -0.45599365234375, -0.4225921630859375, -0.389190673828125, -0.3557891845703125, -0.3223876953125, -0.2889862060546875, -0.255584716796875, -0.2221832275390625, -0.18878173828125, -0.1553802490234375, -0.121978759765625, -0.0885772705078125, -0.05517578125, -0.0217742919921875, 0.011627197265625, 0.0450286865234375, 0.07843017578125, 0.1118316650390625, 0.145233154296875, 0.1786346435546875, 0.2120361328125, 0.2454376220703125, 0.278839111328125, 0.3122406005859375, 0.34564208984375, 0.3790435791015625, 0.412445068359375, 0.4458465576171875, 0.479248046875, 0.5126495361328125, 0.546051025390625, 0.5794525146484375, 0.61285400390625, 0.6462554931640625, 0.679656982421875, 0.7130584716796875, 0.7464599609375, 0.7798614501953125, 0.813262939453125, 0.8466644287109375, 0.88006591796875, 0.9134674072265625, 0.946868896484375, 0.9802703857421875, 1.013671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 7.0, 12.0, 12.0, 16.0, 28.0, 33.0, 46.0, 57.0, 68.0, 84.0, 68.0, 85.0, 74.0, 75.0, 62.0, 57.0, 33.0, 33.0, 22.0, 14.0, 15.0, 10.0, 13.0, 11.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018405914306640625, -0.0001781173050403595, -0.00017217546701431274, -0.000166233628988266, -0.00016029179096221924, -0.00015434995293617249, -0.00014840811491012573, -0.00014246627688407898, -0.00013652443885803223, -0.00013058260083198547, -0.00012464076280593872, -0.00011869892477989197, -0.00011275708675384521, -0.00010681524872779846, -0.00010087341070175171, -9.493157267570496e-05, -8.89897346496582e-05, -8.304789662361145e-05, -7.71060585975647e-05, -7.116422057151794e-05, -6.522238254547119e-05, -5.928054451942444e-05, -5.3338706493377686e-05, -4.739686846733093e-05, -4.145503044128418e-05, -3.551319241523743e-05, -2.9571354389190674e-05, -2.362951636314392e-05, -1.7687678337097168e-05, -1.1745840311050415e-05, -5.804002285003662e-06, 1.3783574104309082e-07, 6.079673767089844e-06, 1.2021511793136597e-05, 1.796334981918335e-05, 2.3905187845230103e-05, 2.9847025871276855e-05, 3.578886389732361e-05, 4.173070192337036e-05, 4.7672539949417114e-05, 5.361437797546387e-05, 5.955621600151062e-05, 6.549805402755737e-05, 7.143989205360413e-05, 7.738173007965088e-05, 8.332356810569763e-05, 8.926540613174438e-05, 9.520724415779114e-05, 0.00010114908218383789, 0.00010709092020988464, 0.0001130327582359314, 0.00011897459626197815, 0.0001249164342880249, 0.00013085827231407166, 0.0001368001103401184, 0.00014274194836616516, 0.00014868378639221191, 0.00015462562441825867, 0.00016056746244430542, 0.00016650930047035217, 0.00017245113849639893, 0.00017839297652244568, 0.00018433481454849243, 0.00019027665257453918, 0.00019621849060058594]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 11.0, 26.0, 18.0, 54.0, 117.0, 223.0, 679.0, 2542.0, 22177.0, 914988.0, 100972.0, 4995.0, 1082.0, 360.0, 152.0, 63.0, 31.0, 21.0, 14.0, 12.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6025390625, -1.5485687255859375, -1.494598388671875, -1.4406280517578125, -1.38665771484375, -1.3326873779296875, -1.278717041015625, -1.2247467041015625, -1.1707763671875, -1.1168060302734375, -1.062835693359375, -1.0088653564453125, -0.95489501953125, -0.9009246826171875, -0.846954345703125, -0.7929840087890625, -0.739013671875, -0.6850433349609375, -0.631072998046875, -0.5771026611328125, -0.52313232421875, -0.4691619873046875, -0.415191650390625, -0.3612213134765625, -0.3072509765625, -0.2532806396484375, -0.199310302734375, -0.1453399658203125, -0.09136962890625, -0.0373992919921875, 0.016571044921875, 0.0705413818359375, 0.12451171875, 0.1784820556640625, 0.232452392578125, 0.2864227294921875, 0.34039306640625, 0.3943634033203125, 0.448333740234375, 0.5023040771484375, 0.5562744140625, 0.6102447509765625, 0.664215087890625, 0.7181854248046875, 0.77215576171875, 0.8261260986328125, 0.880096435546875, 0.9340667724609375, 0.988037109375, 1.0420074462890625, 1.095977783203125, 1.1499481201171875, 1.20391845703125, 1.2578887939453125, 1.311859130859375, 1.3658294677734375, 1.4197998046875, 1.4737701416015625, 1.527740478515625, 1.5817108154296875, 1.63568115234375, 1.6896514892578125, 1.743621826171875, 1.7975921630859375, 1.8515625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 5.0, 8.0, 13.0, 9.0, 13.0, 21.0, 19.0, 14.0, 30.0, 34.0, 51.0, 53.0, 66.0, 70.0, 65.0, 73.0, 62.0, 75.0, 47.0, 52.0, 42.0, 38.0, 25.0, 17.0, 19.0, 18.0, 9.0, 7.0, 9.0, 6.0, 8.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7041015625, -0.682708740234375, -0.66131591796875, -0.639923095703125, -0.6185302734375, -0.597137451171875, -0.57574462890625, -0.554351806640625, -0.532958984375, -0.511566162109375, -0.49017333984375, -0.468780517578125, -0.4473876953125, -0.425994873046875, -0.40460205078125, -0.383209228515625, -0.36181640625, -0.340423583984375, -0.31903076171875, -0.297637939453125, -0.2762451171875, -0.254852294921875, -0.23345947265625, -0.212066650390625, -0.190673828125, -0.169281005859375, -0.14788818359375, -0.126495361328125, -0.1051025390625, -0.083709716796875, -0.06231689453125, -0.040924072265625, -0.01953125, 0.001861572265625, 0.02325439453125, 0.044647216796875, 0.0660400390625, 0.087432861328125, 0.10882568359375, 0.130218505859375, 0.151611328125, 0.173004150390625, 0.19439697265625, 0.215789794921875, 0.2371826171875, 0.258575439453125, 0.27996826171875, 0.301361083984375, 0.32275390625, 0.344146728515625, 0.36553955078125, 0.386932373046875, 0.4083251953125, 0.429718017578125, 0.45111083984375, 0.472503662109375, 0.493896484375, 0.515289306640625, 0.53668212890625, 0.558074951171875, 0.5794677734375, 0.600860595703125, 0.62225341796875, 0.643646240234375, 0.6650390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 12.0, 38.0, 149.0, 411.0, 222.0, 103.0, 30.0, 18.0, 6.0, 7.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.858558654785156, -24.712966918945312, -23.5673770904541, -22.42178726196289, -21.276195526123047, -20.130603790283203, -18.985013961791992, -17.83942413330078, -16.693832397460938, -15.54824161529541, -14.402650833129883, -13.257060050964355, -12.111469268798828, -10.9658784866333, -9.820287704467773, -8.674696922302246, -7.529106140136719, -6.383515357971191, -5.237924575805664, -4.092333793640137, -2.9467430114746094, -1.801152229309082, -0.6555614471435547, 0.49002933502197266, 1.6356201171875, 2.7812108993530273, 3.9268016815185547, 5.072392463684082, 6.217983245849609, 7.363574028015137, 8.509164810180664, 9.654755592346191, 10.800350189208984, 11.945940971374512, 13.091531753540039, 14.237122535705566, 15.382713317871094, 16.528305053710938, 17.67389488220215, 18.81948471069336, 19.965076446533203, 21.110668182373047, 22.256258010864258, 23.40184783935547, 24.547439575195312, 25.693031311035156, 26.838621139526367, 27.984210968017578, 29.129802703857422, 30.275394439697266, 31.420984268188477, 32.56657409667969, 33.71216583251953, 34.857757568359375, 36.00334930419922, 37.1489372253418, 38.29452896118164, 39.440120697021484, 40.58570861816406, 41.731300354003906, 42.87689208984375, 44.022483825683594, 45.16807556152344, 46.313663482666016, 47.45925521850586]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 5.0, 3.0, 7.0, 7.0, 5.0, 10.0, 12.0, 13.0, 10.0, 17.0, 16.0, 25.0, 24.0, 21.0, 25.0, 24.0, 33.0, 40.0, 46.0, 78.0, 79.0, 61.0, 56.0, 48.0, 39.0, 37.0, 35.0, 35.0, 26.0, 29.0, 25.0, 25.0, 17.0, 12.0, 9.0, 13.0, 6.0, 6.0, 7.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.429621696472168, -12.039679527282715, -11.649737358093262, -11.259795188903809, -10.869853019714355, -10.479910850524902, -10.089967727661133, -9.70002555847168, -9.310083389282227, -8.920141220092773, -8.53019905090332, -8.140256881713867, -7.750314712524414, -7.360372543334961, -6.97042989730835, -6.5804877281188965, -6.190546035766602, -5.800603866577148, -5.410661697387695, -5.020719528198242, -4.630777359008789, -4.240835189819336, -3.8508925437927246, -3.4609503746032715, -3.0710082054138184, -2.6810660362243652, -2.291123867034912, -1.9011814594268799, -1.5112392902374268, -1.1212971210479736, -0.7313547134399414, -0.3414125442504883, 0.04853057861328125, 0.43847280740737915, 0.828415036201477, 1.2183573246002197, 1.6082994937896729, 1.998241662979126, 2.388184070587158, 2.7781262397766113, 3.1680684089660645, 3.5580105781555176, 3.9479527473449707, 4.337895393371582, 4.727837562561035, 5.117779731750488, 5.507721900939941, 5.8976640701293945, 6.287606239318848, 6.677548408508301, 7.067490577697754, 7.457432746887207, 7.84737491607666, 8.237317085266113, 8.627260208129883, 9.017202377319336, 9.407144546508789, 9.797086715698242, 10.187028884887695, 10.576971054077148, 10.966913223266602, 11.356855392456055, 11.746797561645508, 12.136739730834961, 12.526681900024414]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 10.0, 27.0, 20.0, 24.0, 60.0, 72.0, 123.0, 200.0, 284.0, 503.0, 883.0, 1444.0, 2802.0, 5946.0, 13826.0, 42492.0, 184426.0, 1073995.0, 2234653.0, 497093.0, 92105.0, 24763.0, 9310.0, 4232.0, 2138.0, 1159.0, 638.0, 377.0, 239.0, 130.0, 101.0, 64.0, 49.0, 29.0, 23.0, 15.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7539138793945312, -0.7290191650390625, -0.7041244506835938, -0.679229736328125, -0.6543350219726562, -0.6294403076171875, -0.6045455932617188, -0.57965087890625, -0.5547561645507812, -0.5298614501953125, -0.5049667358398438, -0.480072021484375, -0.45517730712890625, -0.4302825927734375, -0.40538787841796875, -0.3804931640625, -0.35559844970703125, -0.3307037353515625, -0.30580902099609375, -0.280914306640625, -0.25601959228515625, -0.2311248779296875, -0.20623016357421875, -0.18133544921875, -0.15644073486328125, -0.1315460205078125, -0.10665130615234375, -0.081756591796875, -0.05686187744140625, -0.0319671630859375, -0.00707244873046875, 0.017822265625, 0.04271697998046875, 0.0676116943359375, 0.09250640869140625, 0.117401123046875, 0.14229583740234375, 0.1671905517578125, 0.19208526611328125, 0.21697998046875, 0.24187469482421875, 0.2667694091796875, 0.29166412353515625, 0.316558837890625, 0.34145355224609375, 0.3663482666015625, 0.39124298095703125, 0.4161376953125, 0.44103240966796875, 0.4659271240234375, 0.49082183837890625, 0.515716552734375, 0.5406112670898438, 0.5655059814453125, 0.5904006958007812, 0.61529541015625, 0.6401901245117188, 0.6650848388671875, 0.6899795532226562, 0.714874267578125, 0.7397689819335938, 0.7646636962890625, 0.7895584106445312, 0.814453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 11.0, 13.0, 14.0, 22.0, 21.0, 20.0, 29.0, 31.0, 41.0, 48.0, 32.0, 46.0, 39.0, 50.0, 46.0, 59.0, 47.0, 47.0, 39.0, 48.0, 31.0, 34.0, 24.0, 26.0, 30.0, 24.0, 18.0, 13.0, 17.0, 11.0, 4.0, 9.0, 7.0, 11.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7236328125, -0.7010879516601562, -0.6785430908203125, -0.6559982299804688, -0.633453369140625, -0.6109085083007812, -0.5883636474609375, -0.5658187866210938, -0.54327392578125, -0.5207290649414062, -0.4981842041015625, -0.47563934326171875, -0.453094482421875, -0.43054962158203125, -0.4080047607421875, -0.38545989990234375, -0.3629150390625, -0.34037017822265625, -0.3178253173828125, -0.29528045654296875, -0.272735595703125, -0.25019073486328125, -0.2276458740234375, -0.20510101318359375, -0.18255615234375, -0.16001129150390625, -0.1374664306640625, -0.11492156982421875, -0.092376708984375, -0.06983184814453125, -0.0472869873046875, -0.02474212646484375, -0.002197265625, 0.02034759521484375, 0.0428924560546875, 0.06543731689453125, 0.087982177734375, 0.11052703857421875, 0.1330718994140625, 0.15561676025390625, 0.17816162109375, 0.20070648193359375, 0.2232513427734375, 0.24579620361328125, 0.268341064453125, 0.29088592529296875, 0.3134307861328125, 0.33597564697265625, 0.3585205078125, 0.38106536865234375, 0.4036102294921875, 0.42615509033203125, 0.448699951171875, 0.47124481201171875, 0.4937896728515625, 0.5163345336914062, 0.53887939453125, 0.5614242553710938, 0.5839691162109375, 0.6065139770507812, 0.629058837890625, 0.6516036987304688, 0.6741485595703125, 0.6966934204101562, 0.71923828125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 14.0, 6.0, 12.0, 19.0, 33.0, 51.0, 88.0, 185.0, 444.0, 1016.0, 3227.0, 15988.0, 258172.0, 3818673.0, 84023.0, 8742.0, 2123.0, 742.0, 348.0, 165.0, 77.0, 59.0, 22.0, 22.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.046875, -2.963043212890625, -2.87921142578125, -2.795379638671875, -2.7115478515625, -2.627716064453125, -2.54388427734375, -2.460052490234375, -2.376220703125, -2.292388916015625, -2.20855712890625, -2.124725341796875, -2.0408935546875, -1.957061767578125, -1.87322998046875, -1.789398193359375, -1.70556640625, -1.621734619140625, -1.53790283203125, -1.454071044921875, -1.3702392578125, -1.286407470703125, -1.20257568359375, -1.118743896484375, -1.034912109375, -0.951080322265625, -0.86724853515625, -0.783416748046875, -0.6995849609375, -0.615753173828125, -0.53192138671875, -0.448089599609375, -0.3642578125, -0.280426025390625, -0.19659423828125, -0.112762451171875, -0.0289306640625, 0.054901123046875, 0.13873291015625, 0.222564697265625, 0.306396484375, 0.390228271484375, 0.47406005859375, 0.557891845703125, 0.6417236328125, 0.725555419921875, 0.80938720703125, 0.893218994140625, 0.97705078125, 1.060882568359375, 1.14471435546875, 1.228546142578125, 1.3123779296875, 1.396209716796875, 1.48004150390625, 1.563873291015625, 1.647705078125, 1.731536865234375, 1.81536865234375, 1.899200439453125, 1.9830322265625, 2.066864013671875, 2.15069580078125, 2.234527587890625, 2.318359375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 13.0, 15.0, 20.0, 25.0, 53.0, 80.0, 188.0, 399.0, 961.0, 1114.0, 623.0, 257.0, 113.0, 78.0, 43.0, 29.0, 17.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3046875, -2.228515625, -2.15234375, -2.076171875, -2.0, -1.923828125, -1.84765625, -1.771484375, -1.6953125, -1.619140625, -1.54296875, -1.466796875, -1.390625, -1.314453125, -1.23828125, -1.162109375, -1.0859375, -1.009765625, -0.93359375, -0.857421875, -0.78125, -0.705078125, -0.62890625, -0.552734375, -0.4765625, -0.400390625, -0.32421875, -0.248046875, -0.171875, -0.095703125, -0.01953125, 0.056640625, 0.1328125, 0.208984375, 0.28515625, 0.361328125, 0.4375, 0.513671875, 0.58984375, 0.666015625, 0.7421875, 0.818359375, 0.89453125, 0.970703125, 1.046875, 1.123046875, 1.19921875, 1.275390625, 1.3515625, 1.427734375, 1.50390625, 1.580078125, 1.65625, 1.732421875, 1.80859375, 1.884765625, 1.9609375, 2.037109375, 2.11328125, 2.189453125, 2.265625, 2.341796875, 2.41796875, 2.494140625, 2.5703125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 7.0, 5.0, 11.0, 17.0, 23.0, 92.0, 269.0, 360.0, 156.0, 38.0, 16.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.908599853515625, -32.048179626464844, -31.187755584716797, -30.327335357666016, -29.4669132232666, -28.606491088867188, -27.746068954467773, -26.88564682006836, -26.025226593017578, -25.164804458618164, -24.30438232421875, -23.44396209716797, -22.583539962768555, -21.72311782836914, -20.862695693969727, -20.002273559570312, -19.14185333251953, -18.281431198120117, -17.421009063720703, -16.560588836669922, -15.700166702270508, -14.839744567871094, -13.97932243347168, -13.118901252746582, -12.258478164672852, -11.398056030273438, -10.53763484954834, -9.677212715148926, -8.816791534423828, -7.956369400024414, -7.095947742462158, -6.235526084899902, -5.375104904174805, -4.514683246612549, -3.654261589050293, -2.793839693069458, -1.9334180355072021, -1.0729961395263672, -0.21257448196411133, 0.6478471755981445, 1.5082688331604004, 2.3686904907226562, 3.229112148284912, 4.089533805847168, 4.949955940246582, 5.810377597808838, 6.670799255371094, 7.53122091293335, 8.391642570495605, 9.25206470489502, 10.112485885620117, 10.972908020019531, 11.833329200744629, 12.693751335144043, 13.55417251586914, 14.414594650268555, 15.275016784667969, 16.135438919067383, 16.995861053466797, 17.856281280517578, 18.716703414916992, 19.577125549316406, 20.43754768371582, 21.297969818115234, 22.158390045166016]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 3.0, 12.0, 18.0, 32.0, 16.0, 36.0, 31.0, 49.0, 57.0, 48.0, 65.0, 77.0, 66.0, 64.0, 75.0, 45.0, 50.0, 46.0, 32.0, 42.0, 24.0, 23.0, 19.0, 17.0, 11.0, 10.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.094115257263184, -9.781542778015137, -9.468969345092773, -9.156396865844727, -8.84382438659668, -8.531250953674316, -8.21867847442627, -7.9061055183410645, -7.593532562255859, -7.280959606170654, -6.968386650085449, -6.655814170837402, -6.343241214752197, -6.030668258666992, -5.718095779418945, -5.40552282333374, -5.092949867248535, -4.78037691116333, -4.467803955078125, -4.155231475830078, -3.842658519744873, -3.530085563659668, -3.217512845993042, -2.904940128326416, -2.592367172241211, -2.279794216156006, -1.9672214984893799, -1.6546486616134644, -1.3420758247375488, -1.0295029878616333, -0.7169301509857178, -0.4043574333190918, -0.09178352355957031, 0.22078931331634521, 0.5333621501922607, 0.8459349870681763, 1.1585078239440918, 1.4710806608200073, 1.7836534976959229, 2.096226215362549, 2.408799171447754, 2.721372127532959, 3.033944845199585, 3.346517562866211, 3.659090518951416, 3.971663475036621, 4.284235954284668, 4.596808910369873, 4.909381866455078, 5.221954822540283, 5.534527778625488, 5.847100257873535, 6.15967321395874, 6.472246170043945, 6.784818649291992, 7.097391605377197, 7.409964561462402, 7.722537517547607, 8.035110473632812, 8.34768295288086, 8.660255432128906, 8.97282886505127, 9.285401344299316, 9.59797477722168, 9.910547256469727]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 12.0, 8.0, 16.0, 19.0, 21.0, 36.0, 74.0, 90.0, 142.0, 241.0, 363.0, 591.0, 995.0, 1786.0, 3337.0, 6807.0, 14807.0, 33433.0, 79379.0, 180526.0, 296466.0, 233994.0, 110274.0, 46216.0, 20034.0, 9019.0, 4417.0, 2271.0, 1218.0, 730.0, 437.0, 286.0, 163.0, 114.0, 78.0, 42.0, 34.0, 31.0, 14.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.97900390625, -0.9481124877929688, -0.9172210693359375, -0.8863296508789062, -0.855438232421875, -0.8245468139648438, -0.7936553955078125, -0.7627639770507812, -0.73187255859375, -0.7009811401367188, -0.6700897216796875, -0.6391983032226562, -0.608306884765625, -0.5774154663085938, -0.5465240478515625, -0.5156326293945312, -0.4847412109375, -0.45384979248046875, -0.4229583740234375, -0.39206695556640625, -0.361175537109375, -0.33028411865234375, -0.2993927001953125, -0.26850128173828125, -0.23760986328125, -0.20671844482421875, -0.1758270263671875, -0.14493560791015625, -0.114044189453125, -0.08315277099609375, -0.0522613525390625, -0.02136993408203125, 0.009521484375, 0.04041290283203125, 0.0713043212890625, 0.10219573974609375, 0.133087158203125, 0.16397857666015625, 0.1948699951171875, 0.22576141357421875, 0.25665283203125, 0.28754425048828125, 0.3184356689453125, 0.34932708740234375, 0.380218505859375, 0.41110992431640625, 0.4420013427734375, 0.47289276123046875, 0.5037841796875, 0.5346755981445312, 0.5655670166015625, 0.5964584350585938, 0.627349853515625, 0.6582412719726562, 0.6891326904296875, 0.7200241088867188, 0.75091552734375, 0.7818069458007812, 0.8126983642578125, 0.8435897827148438, 0.874481201171875, 0.9053726196289062, 0.9362640380859375, 0.9671554565429688, 0.998046875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 16.0, 19.0, 18.0, 19.0, 14.0, 29.0, 35.0, 31.0, 41.0, 44.0, 42.0, 44.0, 58.0, 51.0, 50.0, 46.0, 52.0, 53.0, 39.0, 44.0, 37.0, 28.0, 21.0, 25.0, 16.0, 12.0, 18.0, 13.0, 20.0, 5.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7451171875, -0.72198486328125, -0.6988525390625, -0.67572021484375, -0.652587890625, -0.62945556640625, -0.6063232421875, -0.58319091796875, -0.56005859375, -0.53692626953125, -0.5137939453125, -0.49066162109375, -0.467529296875, -0.44439697265625, -0.4212646484375, -0.39813232421875, -0.375, -0.35186767578125, -0.3287353515625, -0.30560302734375, -0.282470703125, -0.25933837890625, -0.2362060546875, -0.21307373046875, -0.18994140625, -0.16680908203125, -0.1436767578125, -0.12054443359375, -0.097412109375, -0.07427978515625, -0.0511474609375, -0.02801513671875, -0.0048828125, 0.01824951171875, 0.0413818359375, 0.06451416015625, 0.087646484375, 0.11077880859375, 0.1339111328125, 0.15704345703125, 0.18017578125, 0.20330810546875, 0.2264404296875, 0.24957275390625, 0.272705078125, 0.29583740234375, 0.3189697265625, 0.34210205078125, 0.365234375, 0.38836669921875, 0.4114990234375, 0.43463134765625, 0.457763671875, 0.48089599609375, 0.5040283203125, 0.52716064453125, 0.55029296875, 0.57342529296875, 0.5965576171875, 0.61968994140625, 0.642822265625, 0.66595458984375, 0.6890869140625, 0.71221923828125, 0.7353515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 5.0, 8.0, 10.0, 9.0, 9.0, 17.0, 15.0, 18.0, 31.0, 49.0, 69.0, 103.0, 201.0, 487.0, 1432.0, 5799.0, 36506.0, 324454.0, 612595.0, 55555.0, 8111.0, 1840.0, 604.0, 227.0, 125.0, 78.0, 39.0, 43.0, 19.0, 24.0, 15.0, 13.0, 12.0, 5.0, 6.0, 8.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.3017578125, -2.22265625, -2.1435546875, -2.064453125, -1.9853515625, -1.90625, -1.8271484375, -1.748046875, -1.6689453125, -1.58984375, -1.5107421875, -1.431640625, -1.3525390625, -1.2734375, -1.1943359375, -1.115234375, -1.0361328125, -0.95703125, -0.8779296875, -0.798828125, -0.7197265625, -0.640625, -0.5615234375, -0.482421875, -0.4033203125, -0.32421875, -0.2451171875, -0.166015625, -0.0869140625, -0.0078125, 0.0712890625, 0.150390625, 0.2294921875, 0.30859375, 0.3876953125, 0.466796875, 0.5458984375, 0.625, 0.7041015625, 0.783203125, 0.8623046875, 0.94140625, 1.0205078125, 1.099609375, 1.1787109375, 1.2578125, 1.3369140625, 1.416015625, 1.4951171875, 1.57421875, 1.6533203125, 1.732421875, 1.8115234375, 1.890625, 1.9697265625, 2.048828125, 2.1279296875, 2.20703125, 2.2861328125, 2.365234375, 2.4443359375, 2.5234375, 2.6025390625, 2.681640625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 10.0, 12.0, 11.0, 23.0, 33.0, 23.0, 30.0, 51.0, 45.0, 58.0, 56.0, 59.0, 64.0, 63.0, 54.0, 59.0, 52.0, 57.0, 50.0, 36.0, 28.0, 27.0, 18.0, 21.0, 13.0, 7.0, 6.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.389404296875, -3.28662109375, -3.183837890625, -3.0810546875, -2.978271484375, -2.87548828125, -2.772705078125, -2.669921875, -2.567138671875, -2.46435546875, -2.361572265625, -2.2587890625, -2.156005859375, -2.05322265625, -1.950439453125, -1.84765625, -1.744873046875, -1.64208984375, -1.539306640625, -1.4365234375, -1.333740234375, -1.23095703125, -1.128173828125, -1.025390625, -0.922607421875, -0.81982421875, -0.717041015625, -0.6142578125, -0.511474609375, -0.40869140625, -0.305908203125, -0.203125, -0.100341796875, 0.00244140625, 0.105224609375, 0.2080078125, 0.310791015625, 0.41357421875, 0.516357421875, 0.619140625, 0.721923828125, 0.82470703125, 0.927490234375, 1.0302734375, 1.133056640625, 1.23583984375, 1.338623046875, 1.44140625, 1.544189453125, 1.64697265625, 1.749755859375, 1.8525390625, 1.955322265625, 2.05810546875, 2.160888671875, 2.263671875, 2.366455078125, 2.46923828125, 2.572021484375, 2.6748046875, 2.777587890625, 2.88037109375, 2.983154296875, 3.0859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 8.0, 25.0, 25.0, 34.0, 39.0, 91.0, 139.0, 254.0, 501.0, 1274.0, 3378.0, 10005.0, 36723.0, 163043.0, 621321.0, 159946.0, 36131.0, 9916.0, 3241.0, 1278.0, 549.0, 278.0, 130.0, 83.0, 38.0, 23.0, 24.0, 11.0, 13.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4465293884277344, -0.43138885498046875, -0.4162483215332031, -0.4011077880859375, -0.3859672546386719, -0.37082672119140625, -0.3556861877441406, -0.340545654296875, -0.3254051208496094, -0.31026458740234375, -0.2951240539550781, -0.2799835205078125, -0.2648429870605469, -0.24970245361328125, -0.23456192016601562, -0.21942138671875, -0.20428085327148438, -0.18914031982421875, -0.17399978637695312, -0.1588592529296875, -0.14371871948242188, -0.12857818603515625, -0.11343765258789062, -0.098297119140625, -0.08315658569335938, -0.06801605224609375, -0.052875518798828125, -0.0377349853515625, -0.022594451904296875, -0.00745391845703125, 0.007686614990234375, 0.0228271484375, 0.037967681884765625, 0.05310821533203125, 0.06824874877929688, 0.0833892822265625, 0.09852981567382812, 0.11367034912109375, 0.12881088256835938, 0.143951416015625, 0.15909194946289062, 0.17423248291015625, 0.18937301635742188, 0.2045135498046875, 0.21965408325195312, 0.23479461669921875, 0.24993515014648438, 0.26507568359375, 0.2802162170410156, 0.29535675048828125, 0.3104972839355469, 0.3256378173828125, 0.3407783508300781, 0.35591888427734375, 0.3710594177246094, 0.386199951171875, 0.4013404846191406, 0.41648101806640625, 0.4316215515136719, 0.4467620849609375, 0.4619026184082031, 0.47704315185546875, 0.4921836853027344, 0.50732421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 8.0, 5.0, 14.0, 19.0, 24.0, 54.0, 63.0, 82.0, 109.0, 125.0, 115.0, 117.0, 68.0, 63.0, 31.0, 25.0, 22.0, 13.0, 8.0, 9.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.00021123886108398438, -0.00020457059144973755, -0.00019790232181549072, -0.0001912340521812439, -0.00018456578254699707, -0.00017789751291275024, -0.00017122924327850342, -0.0001645609736442566, -0.00015789270401000977, -0.00015122443437576294, -0.0001445561647415161, -0.0001378878951072693, -0.00013121962547302246, -0.00012455135583877563, -0.00011788308620452881, -0.00011121481657028198, -0.00010454654693603516, -9.787827730178833e-05, -9.12100076675415e-05, -8.454173803329468e-05, -7.787346839904785e-05, -7.120519876480103e-05, -6.45369291305542e-05, -5.786865949630737e-05, -5.120038986206055e-05, -4.453212022781372e-05, -3.7863850593566895e-05, -3.119558095932007e-05, -2.4527311325073242e-05, -1.7859041690826416e-05, -1.119077205657959e-05, -4.522502422332764e-06, 2.1457672119140625e-06, 8.814036846160889e-06, 1.5482306480407715e-05, 2.215057611465454e-05, 2.8818845748901367e-05, 3.548711538314819e-05, 4.215538501739502e-05, 4.8823654651641846e-05, 5.549192428588867e-05, 6.21601939201355e-05, 6.882846355438232e-05, 7.549673318862915e-05, 8.216500282287598e-05, 8.88332724571228e-05, 9.550154209136963e-05, 0.00010216981172561646, 0.00010883808135986328, 0.00011550635099411011, 0.00012217462062835693, 0.00012884289026260376, 0.00013551115989685059, 0.0001421794295310974, 0.00014884769916534424, 0.00015551596879959106, 0.0001621842384338379, 0.00016885250806808472, 0.00017552077770233154, 0.00018218904733657837, 0.0001888573169708252, 0.00019552558660507202, 0.00020219385623931885, 0.00020886212587356567, 0.0002155303955078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 7.0, 18.0, 23.0, 39.0, 106.0, 149.0, 436.0, 1149.0, 5420.0, 40981.0, 612718.0, 350628.0, 30737.0, 4331.0, 1097.0, 396.0, 146.0, 69.0, 36.0, 25.0, 19.0, 4.0, 8.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.467041015625, -0.4423789978027344, -0.41771697998046875, -0.3930549621582031, -0.3683929443359375, -0.3437309265136719, -0.31906890869140625, -0.2944068908691406, -0.269744873046875, -0.24508285522460938, -0.22042083740234375, -0.19575881958007812, -0.1710968017578125, -0.14643478393554688, -0.12177276611328125, -0.09711074829101562, -0.07244873046875, -0.047786712646484375, -0.02312469482421875, 0.001537322998046875, 0.0261993408203125, 0.050861358642578125, 0.07552337646484375, 0.10018539428710938, 0.124847412109375, 0.14950942993164062, 0.17417144775390625, 0.19883346557617188, 0.2234954833984375, 0.24815750122070312, 0.27281951904296875, 0.2974815368652344, 0.3221435546875, 0.3468055725097656, 0.37146759033203125, 0.3961296081542969, 0.4207916259765625, 0.4454536437988281, 0.47011566162109375, 0.4947776794433594, 0.519439697265625, 0.5441017150878906, 0.5687637329101562, 0.5934257507324219, 0.6180877685546875, 0.6427497863769531, 0.6674118041992188, 0.6920738220214844, 0.71673583984375, 0.7413978576660156, 0.7660598754882812, 0.7907218933105469, 0.8153839111328125, 0.8400459289550781, 0.8647079467773438, 0.8893699645996094, 0.914031982421875, 0.9386940002441406, 0.9633560180664062, 0.9880180358886719, 1.0126800537109375, 1.0373420715332031, 1.0620040893554688, 1.0866661071777344, 1.111328125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 7.0, 12.0, 13.0, 23.0, 20.0, 34.0, 50.0, 56.0, 64.0, 58.0, 82.0, 74.0, 92.0, 83.0, 53.0, 54.0, 41.0, 47.0, 28.0, 31.0, 24.0, 16.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483154296875, -0.4644050598144531, -0.44565582275390625, -0.4269065856933594, -0.4081573486328125, -0.3894081115722656, -0.37065887451171875, -0.3519096374511719, -0.333160400390625, -0.3144111633300781, -0.29566192626953125, -0.2769126892089844, -0.2581634521484375, -0.23941421508789062, -0.22066497802734375, -0.20191574096679688, -0.18316650390625, -0.16441726684570312, -0.14566802978515625, -0.12691879272460938, -0.1081695556640625, -0.08942031860351562, -0.07067108154296875, -0.051921844482421875, -0.033172607421875, -0.014423370361328125, 0.00432586669921875, 0.023075103759765625, 0.0418243408203125, 0.060573577880859375, 0.07932281494140625, 0.09807205200195312, 0.1168212890625, 0.13557052612304688, 0.15431976318359375, 0.17306900024414062, 0.1918182373046875, 0.21056747436523438, 0.22931671142578125, 0.24806594848632812, 0.266815185546875, 0.2855644226074219, 0.30431365966796875, 0.3230628967285156, 0.3418121337890625, 0.3605613708496094, 0.37931060791015625, 0.3980598449707031, 0.41680908203125, 0.4355583190917969, 0.45430755615234375, 0.4730567932128906, 0.4918060302734375, 0.5105552673339844, 0.5293045043945312, 0.5480537414550781, 0.566802978515625, 0.5855522155761719, 0.6043014526367188, 0.6230506896972656, 0.6417999267578125, 0.6605491638183594, 0.6792984008789062, 0.6980476379394531, 0.716796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 15.0, 37.0, 66.0, 142.0, 284.0, 192.0, 106.0, 71.0, 39.0, 17.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.829614639282227, -10.303720474243164, -9.777827262878418, -9.251933097839355, -8.72603988647461, -8.200145721435547, -7.674251556396484, -7.14835786819458, -6.622464179992676, -6.0965704917907715, -5.570676803588867, -5.044782638549805, -4.5188889503479, -3.992995262145996, -3.4671013355255127, -2.9412074089050293, -2.415313720703125, -1.8894199132919312, -1.3635261058807373, -0.8376322984695435, -0.3117384910583496, 0.2141551971435547, 0.7400491237640381, 1.2659430503845215, 1.7918367385864258, 2.31773042678833, 2.8436243534088135, 3.369518280029297, 3.895411968231201, 4.4213056564331055, 4.947199821472168, 5.473093509674072, 5.998987197875977, 6.524880886077881, 7.050774574279785, 7.576668739318848, 8.102561950683594, 8.628456115722656, 9.154350280761719, 9.680244445800781, 10.206137657165527, 10.73203182220459, 11.257925033569336, 11.783819198608398, 12.309713363647461, 12.835606575012207, 13.36150074005127, 13.887393951416016, 14.413288116455078, 14.93918228149414, 15.465075492858887, 15.99096965789795, 16.516862869262695, 17.042757034301758, 17.56865119934082, 18.094545364379883, 18.620437622070312, 19.146331787109375, 19.672225952148438, 20.198118209838867, 20.72401237487793, 21.249906539916992, 21.775800704956055, 22.301694869995117, 22.82758903503418]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 8.0, 9.0, 14.0, 13.0, 15.0, 24.0, 27.0, 21.0, 27.0, 29.0, 38.0, 33.0, 26.0, 49.0, 61.0, 69.0, 58.0, 61.0, 56.0, 37.0, 38.0, 20.0, 34.0, 30.0, 24.0, 20.0, 21.0, 12.0, 12.0, 13.0, 10.0, 9.0, 9.0, 6.0, 10.0, 7.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.875619888305664, -8.588136672973633, -8.300653457641602, -8.01317024230957, -7.725686550140381, -7.438202857971191, -7.15071964263916, -6.863236427307129, -6.575753211975098, -6.288269996643066, -6.000786304473877, -5.713303089141846, -5.4258198738098145, -5.138336181640625, -4.850852966308594, -4.5633697509765625, -4.275886058807373, -3.9884026050567627, -3.7009193897247314, -3.413435935974121, -3.12595272064209, -2.8384692668914795, -2.550985813140869, -2.263502597808838, -1.9760191440582275, -1.6885358095169067, -1.401052474975586, -1.1135690212249756, -0.8260856866836548, -0.538602352142334, -0.25111889839172363, 0.03636431694030762, 0.32384777069091797, 0.6113311052322388, 0.8988144993782043, 1.18629789352417, 1.4737812280654907, 1.7612645626068115, 2.048748016357422, 2.336231231689453, 2.6237146854400635, 2.911198139190674, 3.198681354522705, 3.4861648082733154, 3.773648262023926, 4.061131477355957, 4.348614692687988, 4.6360979080200195, 4.923581600189209, 5.21106481552124, 5.49854850769043, 5.786031723022461, 6.073514938354492, 6.360998153686523, 6.648481845855713, 6.935965061187744, 7.223448753356934, 7.510931968688965, 7.798415660858154, 8.085899353027344, 8.373382568359375, 8.660865783691406, 8.948348999023438, 9.235832214355469, 9.5233154296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 9.0, 16.0, 20.0, 19.0, 32.0, 69.0, 75.0, 115.0, 161.0, 257.0, 475.0, 898.0, 1673.0, 3843.0, 10289.0, 39402.0, 208683.0, 1352319.0, 2129339.0, 362050.0, 60850.0, 14313.0, 4905.0, 2032.0, 1044.0, 534.0, 324.0, 171.0, 93.0, 70.0, 55.0, 35.0, 34.0, 15.0, 13.0, 8.0, 9.0, 4.0, 5.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.87646484375, -0.8522186279296875, -0.827972412109375, -0.8037261962890625, -0.77947998046875, -0.7552337646484375, -0.730987548828125, -0.7067413330078125, -0.6824951171875, -0.6582489013671875, -0.634002685546875, -0.6097564697265625, -0.58551025390625, -0.5612640380859375, -0.537017822265625, -0.5127716064453125, -0.488525390625, -0.4642791748046875, -0.440032958984375, -0.4157867431640625, -0.39154052734375, -0.3672943115234375, -0.343048095703125, -0.3188018798828125, -0.2945556640625, -0.2703094482421875, -0.246063232421875, -0.2218170166015625, -0.19757080078125, -0.1733245849609375, -0.149078369140625, -0.1248321533203125, -0.1005859375, -0.0763397216796875, -0.052093505859375, -0.0278472900390625, -0.00360107421875, 0.0206451416015625, 0.044891357421875, 0.0691375732421875, 0.0933837890625, 0.1176300048828125, 0.141876220703125, 0.1661224365234375, 0.19036865234375, 0.2146148681640625, 0.238861083984375, 0.2631072998046875, 0.287353515625, 0.3115997314453125, 0.335845947265625, 0.3600921630859375, 0.38433837890625, 0.4085845947265625, 0.432830810546875, 0.4570770263671875, 0.4813232421875, 0.5055694580078125, 0.529815673828125, 0.5540618896484375, 0.57830810546875, 0.6025543212890625, 0.626800537109375, 0.6510467529296875, 0.67529296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 2.0, 11.0, 13.0, 19.0, 13.0, 16.0, 21.0, 23.0, 32.0, 42.0, 41.0, 41.0, 50.0, 52.0, 61.0, 56.0, 47.0, 47.0, 60.0, 38.0, 42.0, 37.0, 42.0, 22.0, 26.0, 27.0, 18.0, 22.0, 17.0, 7.0, 8.0, 11.0, 8.0, 9.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74072265625, -0.7177658081054688, -0.6948089599609375, -0.6718521118164062, -0.648895263671875, -0.6259384155273438, -0.6029815673828125, -0.5800247192382812, -0.55706787109375, -0.5341110229492188, -0.5111541748046875, -0.48819732666015625, -0.465240478515625, -0.44228363037109375, -0.4193267822265625, -0.39636993408203125, -0.3734130859375, -0.35045623779296875, -0.3274993896484375, -0.30454254150390625, -0.281585693359375, -0.25862884521484375, -0.2356719970703125, -0.21271514892578125, -0.18975830078125, -0.16680145263671875, -0.1438446044921875, -0.12088775634765625, -0.097930908203125, -0.07497406005859375, -0.0520172119140625, -0.02906036376953125, -0.006103515625, 0.01685333251953125, 0.0398101806640625, 0.06276702880859375, 0.085723876953125, 0.10868072509765625, 0.1316375732421875, 0.15459442138671875, 0.17755126953125, 0.20050811767578125, 0.2234649658203125, 0.24642181396484375, 0.269378662109375, 0.29233551025390625, 0.3152923583984375, 0.33824920654296875, 0.3612060546875, 0.38416290283203125, 0.4071197509765625, 0.43007659912109375, 0.453033447265625, 0.47599029541015625, 0.4989471435546875, 0.5219039916992188, 0.54486083984375, 0.5678176879882812, 0.5907745361328125, 0.6137313842773438, 0.636688232421875, 0.6596450805664062, 0.6826019287109375, 0.7055587768554688, 0.728515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 11.0, 16.0, 26.0, 47.0, 80.0, 221.0, 569.0, 1941.0, 15393.0, 2673641.0, 1487501.0, 12095.0, 1803.0, 501.0, 211.0, 88.0, 51.0, 26.0, 21.0, 10.0, 9.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287109375, -3.193084716796875, -3.09906005859375, -3.005035400390625, -2.9110107421875, -2.816986083984375, -2.72296142578125, -2.628936767578125, -2.534912109375, -2.440887451171875, -2.34686279296875, -2.252838134765625, -2.1588134765625, -2.064788818359375, -1.97076416015625, -1.876739501953125, -1.78271484375, -1.688690185546875, -1.59466552734375, -1.500640869140625, -1.4066162109375, -1.312591552734375, -1.21856689453125, -1.124542236328125, -1.030517578125, -0.936492919921875, -0.84246826171875, -0.748443603515625, -0.6544189453125, -0.560394287109375, -0.46636962890625, -0.372344970703125, -0.2783203125, -0.184295654296875, -0.09027099609375, 0.003753662109375, 0.0977783203125, 0.191802978515625, 0.28582763671875, 0.379852294921875, 0.473876953125, 0.567901611328125, 0.66192626953125, 0.755950927734375, 0.8499755859375, 0.944000244140625, 1.03802490234375, 1.132049560546875, 1.22607421875, 1.320098876953125, 1.41412353515625, 1.508148193359375, 1.6021728515625, 1.696197509765625, 1.79022216796875, 1.884246826171875, 1.978271484375, 2.072296142578125, 2.16632080078125, 2.260345458984375, 2.3543701171875, 2.448394775390625, 2.54241943359375, 2.636444091796875, 2.73046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 18.0, 21.0, 30.0, 46.0, 97.0, 208.0, 381.0, 706.0, 1024.0, 772.0, 357.0, 179.0, 84.0, 49.0, 27.0, 17.0, 11.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6875, -1.63031005859375, -1.5731201171875, -1.51593017578125, -1.458740234375, -1.40155029296875, -1.3443603515625, -1.28717041015625, -1.22998046875, -1.17279052734375, -1.1156005859375, -1.05841064453125, -1.001220703125, -0.94403076171875, -0.8868408203125, -0.82965087890625, -0.7724609375, -0.71527099609375, -0.6580810546875, -0.60089111328125, -0.543701171875, -0.48651123046875, -0.4293212890625, -0.37213134765625, -0.31494140625, -0.25775146484375, -0.2005615234375, -0.14337158203125, -0.086181640625, -0.02899169921875, 0.0281982421875, 0.08538818359375, 0.142578125, 0.19976806640625, 0.2569580078125, 0.31414794921875, 0.371337890625, 0.42852783203125, 0.4857177734375, 0.54290771484375, 0.60009765625, 0.65728759765625, 0.7144775390625, 0.77166748046875, 0.828857421875, 0.88604736328125, 0.9432373046875, 1.00042724609375, 1.0576171875, 1.11480712890625, 1.1719970703125, 1.22918701171875, 1.286376953125, 1.34356689453125, 1.4007568359375, 1.45794677734375, 1.51513671875, 1.57232666015625, 1.6295166015625, 1.68670654296875, 1.743896484375, 1.80108642578125, 1.8582763671875, 1.91546630859375, 1.97265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 14.0, 16.0, 29.0, 80.0, 177.0, 273.0, 225.0, 112.0, 43.0, 20.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.249588966369629, -11.735588073730469, -11.221586227416992, -10.707585334777832, -10.193584442138672, -9.679582595825195, -9.165581703186035, -8.651580810546875, -8.137578964233398, -7.62357759475708, -7.109576225280762, -6.595575332641602, -6.081573963165283, -5.567572593688965, -5.053571701049805, -4.539570331573486, -4.025568962097168, -3.5115675926208496, -2.9975664615631104, -2.483565330505371, -1.9695639610290527, -1.4555625915527344, -0.9415614604949951, -0.42756032943725586, 0.0864410400390625, 0.6004422903060913, 1.1144435405731201, 1.628444790840149, 2.1424460411071777, 2.656447410583496, 3.1704485416412354, 3.6844496726989746, 4.198451995849609, 4.712453365325928, 5.226454734802246, 5.740455627441406, 6.254456996917725, 6.768458366394043, 7.282459259033203, 7.7964606285095215, 8.31046199798584, 8.824462890625, 9.338464736938477, 9.852465629577637, 10.366466522216797, 10.880468368530273, 11.394469261169434, 11.908470153808594, 12.42247200012207, 12.93647289276123, 13.450474739074707, 13.964475631713867, 14.478477478027344, 14.992478370666504, 15.506479263305664, 16.02048110961914, 16.534481048583984, 17.04848289489746, 17.562482833862305, 18.07648468017578, 18.590486526489258, 19.104488372802734, 19.618488311767578, 20.132490158081055, 20.64649200439453]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 7.0, 7.0, 12.0, 10.0, 17.0, 16.0, 30.0, 31.0, 39.0, 33.0, 35.0, 32.0, 46.0, 47.0, 45.0, 40.0, 41.0, 54.0, 59.0, 53.0, 44.0, 40.0, 41.0, 25.0, 38.0, 21.0, 16.0, 24.0, 18.0, 14.0, 12.0, 9.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.983738422393799, -4.802912712097168, -4.622087478637695, -4.4412617683410645, -4.260436058044434, -4.079610824584961, -3.89878511428833, -3.717959403991699, -3.5371339321136475, -3.3563084602355957, -3.175482749938965, -2.994657278060913, -2.8138318061828613, -2.6330060958862305, -2.4521806240081787, -2.271355152130127, -2.090529441833496, -1.9097038507461548, -1.7288782596588135, -1.5480527877807617, -1.3672271966934204, -1.186401605606079, -1.0055761337280273, -0.824750542640686, -0.6439249515533447, -0.4630993902683258, -0.2822738289833069, -0.10144829750061035, 0.07937729358673096, 0.26020288467407227, 0.441028356552124, 0.6218539476394653, 0.8026790618896484, 0.9835046529769897, 1.164330244064331, 1.3451557159423828, 1.5259813070297241, 1.7068068981170654, 1.8876323699951172, 2.068458080291748, 2.2492835521698, 2.4301090240478516, 2.6109347343444824, 2.791760206222534, 2.972585678100586, 3.153411388397217, 3.3342368602752686, 3.5150623321533203, 3.695888042449951, 3.876713514328003, 4.057538986206055, 4.2383646965026855, 4.419190406799316, 4.600015640258789, 4.78084135055542, 4.961667060852051, 5.142492294311523, 5.323318004608154, 5.504143238067627, 5.684968948364258, 5.865794658660889, 6.0466203689575195, 6.227445602416992, 6.408271312713623, 6.589097023010254]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 10.0, 17.0, 19.0, 26.0, 70.0, 71.0, 66.0, 159.0, 222.0, 322.0, 489.0, 768.0, 1168.0, 1896.0, 3236.0, 5826.0, 10407.0, 20004.0, 39576.0, 81575.0, 163870.0, 256893.0, 220489.0, 119997.0, 58609.0, 28863.0, 14755.0, 7974.0, 4327.0, 2527.0, 1502.0, 957.0, 612.0, 384.0, 273.0, 161.0, 102.0, 90.0, 73.0, 39.0, 34.0, 16.0, 14.0, 13.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.810546875, -0.7865447998046875, -0.762542724609375, -0.7385406494140625, -0.71453857421875, -0.6905364990234375, -0.666534423828125, -0.6425323486328125, -0.6185302734375, -0.5945281982421875, -0.570526123046875, -0.5465240478515625, -0.52252197265625, -0.4985198974609375, -0.474517822265625, -0.4505157470703125, -0.426513671875, -0.4025115966796875, -0.378509521484375, -0.3545074462890625, -0.33050537109375, -0.3065032958984375, -0.282501220703125, -0.2584991455078125, -0.2344970703125, -0.2104949951171875, -0.186492919921875, -0.1624908447265625, -0.13848876953125, -0.1144866943359375, -0.090484619140625, -0.0664825439453125, -0.04248046875, -0.0184783935546875, 0.005523681640625, 0.0295257568359375, 0.05352783203125, 0.0775299072265625, 0.101531982421875, 0.1255340576171875, 0.1495361328125, 0.1735382080078125, 0.197540283203125, 0.2215423583984375, 0.24554443359375, 0.2695465087890625, 0.293548583984375, 0.3175506591796875, 0.341552734375, 0.3655548095703125, 0.389556884765625, 0.4135589599609375, 0.43756103515625, 0.4615631103515625, 0.485565185546875, 0.5095672607421875, 0.5335693359375, 0.5575714111328125, 0.581573486328125, 0.6055755615234375, 0.62957763671875, 0.6535797119140625, 0.677581787109375, 0.7015838623046875, 0.7255859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 9.0, 16.0, 13.0, 18.0, 19.0, 25.0, 23.0, 41.0, 39.0, 45.0, 49.0, 53.0, 50.0, 52.0, 57.0, 48.0, 51.0, 56.0, 40.0, 52.0, 37.0, 36.0, 30.0, 28.0, 25.0, 17.0, 14.0, 8.0, 6.0, 4.0, 6.0, 4.0, 5.0, 4.0, 3.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8056640625, -0.7816848754882812, -0.7577056884765625, -0.7337265014648438, -0.709747314453125, -0.6857681274414062, -0.6617889404296875, -0.6378097534179688, -0.61383056640625, -0.5898513793945312, -0.5658721923828125, -0.5418930053710938, -0.517913818359375, -0.49393463134765625, -0.4699554443359375, -0.44597625732421875, -0.4219970703125, -0.39801788330078125, -0.3740386962890625, -0.35005950927734375, -0.326080322265625, -0.30210113525390625, -0.2781219482421875, -0.25414276123046875, -0.23016357421875, -0.20618438720703125, -0.1822052001953125, -0.15822601318359375, -0.134246826171875, -0.11026763916015625, -0.0862884521484375, -0.06230926513671875, -0.038330078125, -0.01435089111328125, 0.0096282958984375, 0.03360748291015625, 0.057586669921875, 0.08156585693359375, 0.1055450439453125, 0.12952423095703125, 0.15350341796875, 0.17748260498046875, 0.2014617919921875, 0.22544097900390625, 0.249420166015625, 0.27339935302734375, 0.2973785400390625, 0.32135772705078125, 0.3453369140625, 0.36931610107421875, 0.3932952880859375, 0.41727447509765625, 0.441253662109375, 0.46523284912109375, 0.4892120361328125, 0.5131912231445312, 0.53717041015625, 0.5611495971679688, 0.5851287841796875, 0.6091079711914062, 0.633087158203125, 0.6570663452148438, 0.6810455322265625, 0.7050247192382812, 0.72900390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 4.0, 9.0, 4.0, 20.0, 14.0, 13.0, 29.0, 36.0, 41.0, 73.0, 81.0, 113.0, 169.0, 282.0, 391.0, 745.0, 1515.0, 4141.0, 15672.0, 86314.0, 678226.0, 215450.0, 33016.0, 7276.0, 2320.0, 1035.0, 564.0, 337.0, 228.0, 124.0, 86.0, 53.0, 38.0, 29.0, 31.0, 24.0, 8.0, 13.0, 5.0, 7.0, 9.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9765625, -1.91796875, -1.859375, -1.80078125, -1.7421875, -1.68359375, -1.625, -1.56640625, -1.5078125, -1.44921875, -1.390625, -1.33203125, -1.2734375, -1.21484375, -1.15625, -1.09765625, -1.0390625, -0.98046875, -0.921875, -0.86328125, -0.8046875, -0.74609375, -0.6875, -0.62890625, -0.5703125, -0.51171875, -0.453125, -0.39453125, -0.3359375, -0.27734375, -0.21875, -0.16015625, -0.1015625, -0.04296875, 0.015625, 0.07421875, 0.1328125, 0.19140625, 0.25, 0.30859375, 0.3671875, 0.42578125, 0.484375, 0.54296875, 0.6015625, 0.66015625, 0.71875, 0.77734375, 0.8359375, 0.89453125, 0.953125, 1.01171875, 1.0703125, 1.12890625, 1.1875, 1.24609375, 1.3046875, 1.36328125, 1.421875, 1.48046875, 1.5390625, 1.59765625, 1.65625, 1.71484375, 1.7734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 3.0, 16.0, 7.0, 8.0, 19.0, 25.0, 25.0, 38.0, 27.0, 39.0, 55.0, 46.0, 51.0, 70.0, 61.0, 64.0, 57.0, 53.0, 54.0, 37.0, 37.0, 29.0, 32.0, 27.0, 27.0, 26.0, 9.0, 13.0, 11.0, 6.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.79010009765625, -2.7032470703125, -2.61639404296875, -2.529541015625, -2.44268798828125, -2.3558349609375, -2.26898193359375, -2.18212890625, -2.09527587890625, -2.0084228515625, -1.92156982421875, -1.834716796875, -1.74786376953125, -1.6610107421875, -1.57415771484375, -1.4873046875, -1.40045166015625, -1.3135986328125, -1.22674560546875, -1.139892578125, -1.05303955078125, -0.9661865234375, -0.87933349609375, -0.79248046875, -0.70562744140625, -0.6187744140625, -0.53192138671875, -0.445068359375, -0.35821533203125, -0.2713623046875, -0.18450927734375, -0.09765625, -0.01080322265625, 0.0760498046875, 0.16290283203125, 0.249755859375, 0.33660888671875, 0.4234619140625, 0.51031494140625, 0.59716796875, 0.68402099609375, 0.7708740234375, 0.85772705078125, 0.944580078125, 1.03143310546875, 1.1182861328125, 1.20513916015625, 1.2919921875, 1.37884521484375, 1.4656982421875, 1.55255126953125, 1.639404296875, 1.72625732421875, 1.8131103515625, 1.89996337890625, 1.98681640625, 2.07366943359375, 2.1605224609375, 2.24737548828125, 2.334228515625, 2.42108154296875, 2.5079345703125, 2.59478759765625, 2.681640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 5.0, 6.0, 15.0, 12.0, 16.0, 37.0, 36.0, 67.0, 83.0, 109.0, 212.0, 330.0, 581.0, 1185.0, 2582.0, 7035.0, 22117.0, 90240.0, 659935.0, 203209.0, 41131.0, 11842.0, 4111.0, 1745.0, 800.0, 396.0, 242.0, 161.0, 92.0, 54.0, 49.0, 28.0, 24.0, 24.0, 10.0, 10.0, 6.0, 2.0, 7.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.385009765625, -0.3711280822753906, -0.35724639892578125, -0.3433647155761719, -0.3294830322265625, -0.3156013488769531, -0.30171966552734375, -0.2878379821777344, -0.273956298828125, -0.2600746154785156, -0.24619293212890625, -0.23231124877929688, -0.2184295654296875, -0.20454788208007812, -0.19066619873046875, -0.17678451538085938, -0.16290283203125, -0.14902114868164062, -0.13513946533203125, -0.12125778198242188, -0.1073760986328125, -0.09349441528320312, -0.07961273193359375, -0.06573104858398438, -0.051849365234375, -0.037967681884765625, -0.02408599853515625, -0.010204315185546875, 0.0036773681640625, 0.017559051513671875, 0.03144073486328125, 0.045322418212890625, 0.0592041015625, 0.07308578491210938, 0.08696746826171875, 0.10084915161132812, 0.1147308349609375, 0.12861251831054688, 0.14249420166015625, 0.15637588500976562, 0.170257568359375, 0.18413925170898438, 0.19802093505859375, 0.21190261840820312, 0.2257843017578125, 0.23966598510742188, 0.25354766845703125, 0.2674293518066406, 0.28131103515625, 0.2951927185058594, 0.30907440185546875, 0.3229560852050781, 0.3368377685546875, 0.3507194519042969, 0.36460113525390625, 0.3784828186035156, 0.392364501953125, 0.4062461853027344, 0.42012786865234375, 0.4340095520019531, 0.4478912353515625, 0.4617729187011719, 0.47565460205078125, 0.4895362854003906, 0.50341796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 11.0, 10.0, 16.0, 18.0, 20.0, 16.0, 42.0, 47.0, 60.0, 69.0, 65.0, 104.0, 85.0, 78.0, 68.0, 60.0, 47.0, 38.0, 16.0, 26.0, 18.0, 20.0, 12.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00014901161193847656, -0.00014521274715662003, -0.0001414138823747635, -0.00013761501759290695, -0.00013381615281105042, -0.00013001728802919388, -0.00012621842324733734, -0.0001224195584654808, -0.00011862069368362427, -0.00011482182890176773, -0.0001110229641199112, -0.00010722409933805466, -0.00010342523455619812, -9.962636977434158e-05, -9.582750499248505e-05, -9.202864021062851e-05, -8.822977542877197e-05, -8.443091064691544e-05, -8.06320458650589e-05, -7.683318108320236e-05, -7.303431630134583e-05, -6.923545151948929e-05, -6.543658673763275e-05, -6.163772195577621e-05, -5.783885717391968e-05, -5.403999239206314e-05, -5.0241127610206604e-05, -4.644226282835007e-05, -4.264339804649353e-05, -3.8844533264636993e-05, -3.5045668482780457e-05, -3.124680370092392e-05, -2.7447938919067383e-05, -2.3649074137210846e-05, -1.985020935535431e-05, -1.6051344573497772e-05, -1.2252479791641235e-05, -8.453615009784698e-06, -4.654750227928162e-06, -8.558854460716248e-07, 2.942979335784912e-06, 6.741844117641449e-06, 1.0540708899497986e-05, 1.4339573681354523e-05, 1.813843846321106e-05, 2.1937303245067596e-05, 2.5736168026924133e-05, 2.953503280878067e-05, 3.333389759063721e-05, 3.7132762372493744e-05, 4.093162715435028e-05, 4.473049193620682e-05, 4.8529356718063354e-05, 5.232822149991989e-05, 5.612708628177643e-05, 5.9925951063632965e-05, 6.37248158454895e-05, 6.752368062734604e-05, 7.132254540920258e-05, 7.512141019105911e-05, 7.892027497291565e-05, 8.271913975477219e-05, 8.651800453662872e-05, 9.031686931848526e-05, 9.41157341003418e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 7.0, 13.0, 20.0, 37.0, 55.0, 112.0, 201.0, 435.0, 964.0, 3040.0, 14739.0, 134793.0, 805328.0, 75304.0, 9809.0, 2134.0, 799.0, 359.0, 168.0, 101.0, 42.0, 34.0, 15.0, 12.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.63330078125, -0.612457275390625, -0.59161376953125, -0.570770263671875, -0.5499267578125, -0.529083251953125, -0.50823974609375, -0.487396240234375, -0.466552734375, -0.445709228515625, -0.42486572265625, -0.404022216796875, -0.3831787109375, -0.362335205078125, -0.34149169921875, -0.320648193359375, -0.2998046875, -0.278961181640625, -0.25811767578125, -0.237274169921875, -0.2164306640625, -0.195587158203125, -0.17474365234375, -0.153900146484375, -0.133056640625, -0.112213134765625, -0.09136962890625, -0.070526123046875, -0.0496826171875, -0.028839111328125, -0.00799560546875, 0.012847900390625, 0.03369140625, 0.054534912109375, 0.07537841796875, 0.096221923828125, 0.1170654296875, 0.137908935546875, 0.15875244140625, 0.179595947265625, 0.200439453125, 0.221282958984375, 0.24212646484375, 0.262969970703125, 0.2838134765625, 0.304656982421875, 0.32550048828125, 0.346343994140625, 0.3671875, 0.388031005859375, 0.40887451171875, 0.429718017578125, 0.4505615234375, 0.471405029296875, 0.49224853515625, 0.513092041015625, 0.533935546875, 0.554779052734375, 0.57562255859375, 0.596466064453125, 0.6173095703125, 0.638153076171875, 0.65899658203125, 0.679840087890625, 0.70068359375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 5.0, 13.0, 17.0, 19.0, 34.0, 28.0, 44.0, 70.0, 96.0, 111.0, 121.0, 98.0, 93.0, 70.0, 49.0, 29.0, 26.0, 19.0, 14.0, 13.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6136093139648438, -0.5934295654296875, -0.5732498168945312, -0.553070068359375, -0.5328903198242188, -0.5127105712890625, -0.49253082275390625, -0.47235107421875, -0.45217132568359375, -0.4319915771484375, -0.41181182861328125, -0.391632080078125, -0.37145233154296875, -0.3512725830078125, -0.33109283447265625, -0.3109130859375, -0.29073333740234375, -0.2705535888671875, -0.25037384033203125, -0.230194091796875, -0.21001434326171875, -0.1898345947265625, -0.16965484619140625, -0.14947509765625, -0.12929534912109375, -0.1091156005859375, -0.08893585205078125, -0.068756103515625, -0.04857635498046875, -0.0283966064453125, -0.00821685791015625, 0.011962890625, 0.03214263916015625, 0.0523223876953125, 0.07250213623046875, 0.092681884765625, 0.11286163330078125, 0.1330413818359375, 0.15322113037109375, 0.17340087890625, 0.19358062744140625, 0.2137603759765625, 0.23394012451171875, 0.254119873046875, 0.27429962158203125, 0.2944793701171875, 0.31465911865234375, 0.3348388671875, 0.35501861572265625, 0.3751983642578125, 0.39537811279296875, 0.415557861328125, 0.43573760986328125, 0.4559173583984375, 0.47609710693359375, 0.49627685546875, 0.5164566040039062, 0.5366363525390625, 0.5568161010742188, 0.576995849609375, 0.5971755981445312, 0.6173553466796875, 0.6375350952148438, 0.65771484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 12.0, 18.0, 42.0, 90.0, 165.0, 344.0, 159.0, 72.0, 47.0, 22.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.959232330322266, -18.452219009399414, -17.94520378112793, -17.438190460205078, -16.931175231933594, -16.424161911010742, -15.91714859008789, -15.410134315490723, -14.903120040893555, -14.396105766296387, -13.889091491699219, -13.382078170776367, -12.8750638961792, -12.368049621582031, -11.86103630065918, -11.354022026062012, -10.847007751464844, -10.339993476867676, -9.832979202270508, -9.325965881347656, -8.818951606750488, -8.31193733215332, -7.8049235343933105, -7.297909736633301, -6.790895462036133, -6.283881187438965, -5.776867389678955, -5.269853591918945, -4.762839317321777, -4.255825042724609, -3.7488112449645996, -3.2417972087860107, -2.7347822189331055, -2.2277681827545166, -1.7207541465759277, -1.2137401103973389, -0.70672607421875, -0.19971203804016113, 0.30730199813842773, 0.8143160343170166, 1.3213300704956055, 1.8283441066741943, 2.335358142852783, 2.842372179031372, 3.349386215209961, 3.85640025138855, 4.363414287567139, 4.870428085327148, 5.377442359924316, 5.884456634521484, 6.391470432281494, 6.898484230041504, 7.405498504638672, 7.91251277923584, 8.419527053833008, 8.92654037475586, 9.433554649353027, 9.940568923950195, 10.447582244873047, 10.954596519470215, 11.461610794067383, 11.96862506866455, 12.475639343261719, 12.98265266418457, 13.489666938781738]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 0.0, 4.0, 13.0, 5.0, 8.0, 10.0, 14.0, 19.0, 20.0, 24.0, 18.0, 25.0, 21.0, 29.0, 29.0, 41.0, 49.0, 85.0, 80.0, 94.0, 61.0, 42.0, 45.0, 38.0, 28.0, 22.0, 27.0, 17.0, 17.0, 16.0, 19.0, 13.0, 15.0, 6.0, 9.0, 6.0, 6.0, 5.0, 1.0, 5.0, 1.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.47958755493164, -10.18771743774414, -9.895848274230957, -9.603978157043457, -9.312108993530273, -9.020238876342773, -8.72836971282959, -8.43649959564209, -8.144630432128906, -7.8527607917785645, -7.560891151428223, -7.269021511077881, -6.977151870727539, -6.685282230377197, -6.3934125900268555, -6.1015424728393555, -5.809672832489014, -5.517803192138672, -5.22593355178833, -4.934063911437988, -4.6421942710876465, -4.350324630737305, -4.058454513549805, -3.766585111618042, -3.4747154712677, -3.1828458309173584, -2.8909761905670166, -2.5991063117980957, -2.307236671447754, -2.015367031097412, -1.7234973907470703, -1.4316277503967285, -1.1397581100463867, -0.8478884696960449, -0.5560187697410583, -0.2641490697860718, 0.02772057056427002, 0.3195902109146118, 0.6114599704742432, 0.903329610824585, 1.1951992511749268, 1.4870688915252686, 1.7789385318756104, 2.0708084106445312, 2.362678050994873, 2.654547691345215, 2.9464173316955566, 3.2382869720458984, 3.5301566123962402, 3.822026252746582, 4.113895893096924, 4.405765533447266, 4.697635173797607, 4.989504814147949, 5.281374931335449, 5.573244094848633, 5.865114212036133, 6.156983852386475, 6.448853492736816, 6.740723133087158, 7.0325927734375, 7.324462413787842, 7.616332054138184, 7.908202171325684, 8.200071334838867]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 21.0, 30.0, 48.0, 73.0, 160.0, 279.0, 506.0, 1073.0, 2337.0, 6035.0, 18746.0, 78093.0, 444032.0, 2119130.0, 1251516.0, 211707.0, 42015.0, 11443.0, 3933.0, 1639.0, 722.0, 362.0, 196.0, 64.0, 47.0, 23.0, 16.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6298675537109375, -0.604461669921875, -0.5790557861328125, -0.55364990234375, -0.5282440185546875, -0.502838134765625, -0.4774322509765625, -0.4520263671875, -0.4266204833984375, -0.401214599609375, -0.3758087158203125, -0.35040283203125, -0.3249969482421875, -0.299591064453125, -0.2741851806640625, -0.248779296875, -0.2233734130859375, -0.197967529296875, -0.1725616455078125, -0.14715576171875, -0.1217498779296875, -0.096343994140625, -0.0709381103515625, -0.0455322265625, -0.0201263427734375, 0.005279541015625, 0.0306854248046875, 0.05609130859375, 0.0814971923828125, 0.106903076171875, 0.1323089599609375, 0.15771484375, 0.1831207275390625, 0.208526611328125, 0.2339324951171875, 0.25933837890625, 0.2847442626953125, 0.310150146484375, 0.3355560302734375, 0.3609619140625, 0.3863677978515625, 0.411773681640625, 0.4371795654296875, 0.46258544921875, 0.4879913330078125, 0.513397216796875, 0.5388031005859375, 0.564208984375, 0.5896148681640625, 0.615020751953125, 0.6404266357421875, 0.66583251953125, 0.6912384033203125, 0.716644287109375, 0.7420501708984375, 0.7674560546875, 0.7928619384765625, 0.818267822265625, 0.8436737060546875, 0.86907958984375, 0.8944854736328125, 0.919891357421875, 0.9452972412109375, 0.970703125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 12.0, 12.0, 16.0, 23.0, 21.0, 23.0, 35.0, 23.0, 48.0, 34.0, 54.0, 43.0, 53.0, 57.0, 55.0, 52.0, 51.0, 56.0, 52.0, 54.0, 33.0, 36.0, 29.0, 31.0, 20.0, 18.0, 7.0, 11.0, 3.0, 3.0, 8.0, 3.0, 10.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.80615234375, -0.7820358276367188, -0.7579193115234375, -0.7338027954101562, -0.709686279296875, -0.6855697631835938, -0.6614532470703125, -0.6373367309570312, -0.61322021484375, -0.5891036987304688, -0.5649871826171875, -0.5408706665039062, -0.516754150390625, -0.49263763427734375, -0.4685211181640625, -0.44440460205078125, -0.4202880859375, -0.39617156982421875, -0.3720550537109375, -0.34793853759765625, -0.323822021484375, -0.29970550537109375, -0.2755889892578125, -0.25147247314453125, -0.22735595703125, -0.20323944091796875, -0.1791229248046875, -0.15500640869140625, -0.130889892578125, -0.10677337646484375, -0.0826568603515625, -0.05854034423828125, -0.034423828125, -0.01030731201171875, 0.0138092041015625, 0.03792572021484375, 0.062042236328125, 0.08615875244140625, 0.1102752685546875, 0.13439178466796875, 0.15850830078125, 0.18262481689453125, 0.2067413330078125, 0.23085784912109375, 0.254974365234375, 0.27909088134765625, 0.3032073974609375, 0.32732391357421875, 0.3514404296875, 0.37555694580078125, 0.3996734619140625, 0.42378997802734375, 0.447906494140625, 0.47202301025390625, 0.4961395263671875, 0.5202560424804688, 0.54437255859375, 0.5684890747070312, 0.5926055908203125, 0.6167221069335938, 0.640838623046875, 0.6649551391601562, 0.6890716552734375, 0.7131881713867188, 0.7373046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 16.0, 36.0, 66.0, 140.0, 275.0, 1044.0, 9957.0, 3665750.0, 511316.0, 4554.0, 692.0, 223.0, 96.0, 54.0, 26.0, 16.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.812530517578125, -2.68951416015625, -2.566497802734375, -2.4434814453125, -2.320465087890625, -2.19744873046875, -2.074432373046875, -1.951416015625, -1.828399658203125, -1.70538330078125, -1.582366943359375, -1.4593505859375, -1.336334228515625, -1.21331787109375, -1.090301513671875, -0.96728515625, -0.844268798828125, -0.72125244140625, -0.598236083984375, -0.4752197265625, -0.352203369140625, -0.22918701171875, -0.106170654296875, 0.016845703125, 0.139862060546875, 0.26287841796875, 0.385894775390625, 0.5089111328125, 0.631927490234375, 0.75494384765625, 0.877960205078125, 1.0009765625, 1.123992919921875, 1.24700927734375, 1.370025634765625, 1.4930419921875, 1.616058349609375, 1.73907470703125, 1.862091064453125, 1.985107421875, 2.108123779296875, 2.23114013671875, 2.354156494140625, 2.4771728515625, 2.600189208984375, 2.72320556640625, 2.846221923828125, 2.96923828125, 3.092254638671875, 3.21527099609375, 3.338287353515625, 3.4613037109375, 3.584320068359375, 3.70733642578125, 3.830352783203125, 3.953369140625, 4.076385498046875, 4.19940185546875, 4.322418212890625, 4.4454345703125, 4.568450927734375, 4.69146728515625, 4.814483642578125, 4.9375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 12.0, 16.0, 28.0, 49.0, 113.0, 218.0, 457.0, 840.0, 1058.0, 650.0, 322.0, 130.0, 64.0, 50.0, 27.0, 13.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.166015625, -3.0944976806640625, -3.022979736328125, -2.9514617919921875, -2.87994384765625, -2.8084259033203125, -2.736907958984375, -2.6653900146484375, -2.5938720703125, -2.5223541259765625, -2.450836181640625, -2.3793182373046875, -2.30780029296875, -2.2362823486328125, -2.164764404296875, -2.0932464599609375, -2.021728515625, -1.9502105712890625, -1.878692626953125, -1.8071746826171875, -1.73565673828125, -1.6641387939453125, -1.592620849609375, -1.5211029052734375, -1.4495849609375, -1.3780670166015625, -1.306549072265625, -1.2350311279296875, -1.16351318359375, -1.0919952392578125, -1.020477294921875, -0.9489593505859375, -0.87744140625, -0.8059234619140625, -0.734405517578125, -0.6628875732421875, -0.59136962890625, -0.5198516845703125, -0.448333740234375, -0.3768157958984375, -0.3052978515625, -0.2337799072265625, -0.162261962890625, -0.0907440185546875, -0.01922607421875, 0.0522918701171875, 0.123809814453125, 0.1953277587890625, 0.266845703125, 0.3383636474609375, 0.409881591796875, 0.4813995361328125, 0.55291748046875, 0.6244354248046875, 0.695953369140625, 0.7674713134765625, 0.8389892578125, 0.9105072021484375, 0.982025146484375, 1.0535430908203125, 1.12506103515625, 1.1965789794921875, 1.268096923828125, 1.3396148681640625, 1.4111328125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 5.0, 9.0, 18.0, 43.0, 54.0, 86.0, 148.0, 177.0, 153.0, 129.0, 82.0, 42.0, 23.0, 10.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-17.182254791259766, -16.81801986694336, -16.453784942626953, -16.089548110961914, -15.725313186645508, -15.361078262329102, -14.996842384338379, -14.632607460021973, -14.26837158203125, -13.904136657714844, -13.539900779724121, -13.175665855407715, -12.811429977416992, -12.447195053100586, -12.082959175109863, -11.718724250793457, -11.354488372802734, -10.990253448486328, -10.626017570495605, -10.2617826461792, -9.897546768188477, -9.53331184387207, -9.169075965881348, -8.804841041564941, -8.440606117248535, -8.076371192932129, -7.712135314941406, -7.347899913787842, -6.983664512634277, -6.619429111480713, -6.255193710327148, -5.890958786010742, -5.5267229080200195, -5.162487506866455, -4.798252105712891, -4.434016704559326, -4.069781303405762, -3.7055459022521973, -3.341310739517212, -2.9770753383636475, -2.612839937210083, -2.2486045360565186, -1.884369134902954, -1.5201338529586792, -1.1558984518051147, -0.7916630506515503, -0.4274277687072754, -0.06319236755371094, 0.3010430335998535, 0.665278434753418, 1.0295138359069824, 1.3937491178512573, 1.7579845190048218, 2.122220039367676, 2.486455202102661, 2.8506906032562256, 3.21492600440979, 3.5791614055633545, 3.943396806716919, 4.307631969451904, 4.671867370605469, 5.036102771759033, 5.400338172912598, 5.764573574066162, 6.128808975219727]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 9.0, 10.0, 10.0, 12.0, 14.0, 12.0, 19.0, 18.0, 34.0, 30.0, 32.0, 47.0, 41.0, 39.0, 40.0, 50.0, 43.0, 70.0, 62.0, 47.0, 51.0, 33.0, 41.0, 32.0, 30.0, 19.0, 23.0, 34.0, 14.0, 22.0, 12.0, 9.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8313493728637695, -6.631371974945068, -6.431395053863525, -6.231417655944824, -6.031440258026123, -5.83146333694458, -5.631485939025879, -5.431509017944336, -5.231531620025635, -5.031554222106934, -4.831577301025391, -4.6315999031066895, -4.431622505187988, -4.231645584106445, -4.031668186187744, -3.831691026687622, -3.631713628768921, -3.431736469268799, -3.2317590713500977, -3.0317819118499756, -2.8318047523498535, -2.6318273544311523, -2.4318501949310303, -2.231873035430908, -2.031895637512207, -1.8319183588027954, -1.6319411993026733, -1.4319639205932617, -1.2319867610931396, -1.032009482383728, -0.8320322036743164, -0.6320550441741943, -0.43207788467407227, -0.23210065066814423, -0.032123416662216187, 0.16785383224487305, 0.3678310513496399, 0.5678082704544067, 0.7677855491638184, 0.9677627086639404, 1.167739987373352, 1.3677172660827637, 1.5676944255828857, 1.7676717042922974, 1.967648983001709, 2.167626142501831, 2.367603302001953, 2.5675806999206543, 2.7675578594207764, 2.9675350189208984, 3.1675124168395996, 3.3674895763397217, 3.5674667358398438, 3.767444133758545, 3.967421293258667, 4.167398452758789, 4.36737585067749, 4.567353248596191, 4.767330169677734, 4.9673075675964355, 5.167284965515137, 5.36726188659668, 5.567239284515381, 5.767216682434082, 5.967193603515625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 15.0, 20.0, 23.0, 54.0, 76.0, 108.0, 173.0, 263.0, 458.0, 827.0, 1549.0, 2933.0, 6072.0, 14055.0, 35797.0, 108530.0, 338458.0, 356106.0, 116177.0, 38667.0, 14982.0, 6513.0, 2987.0, 1592.0, 823.0, 510.0, 309.0, 175.0, 99.0, 75.0, 39.0, 22.0, 12.0, 14.0, 15.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.23858642578125, -1.1959228515625, -1.15325927734375, -1.110595703125, -1.06793212890625, -1.0252685546875, -0.98260498046875, -0.93994140625, -0.89727783203125, -0.8546142578125, -0.81195068359375, -0.769287109375, -0.72662353515625, -0.6839599609375, -0.64129638671875, -0.5986328125, -0.55596923828125, -0.5133056640625, -0.47064208984375, -0.427978515625, -0.38531494140625, -0.3426513671875, -0.29998779296875, -0.25732421875, -0.21466064453125, -0.1719970703125, -0.12933349609375, -0.086669921875, -0.04400634765625, -0.0013427734375, 0.04132080078125, 0.083984375, 0.12664794921875, 0.1693115234375, 0.21197509765625, 0.254638671875, 0.29730224609375, 0.3399658203125, 0.38262939453125, 0.42529296875, 0.46795654296875, 0.5106201171875, 0.55328369140625, 0.595947265625, 0.63861083984375, 0.6812744140625, 0.72393798828125, 0.7666015625, 0.80926513671875, 0.8519287109375, 0.89459228515625, 0.937255859375, 0.97991943359375, 1.0225830078125, 1.06524658203125, 1.10791015625, 1.15057373046875, 1.1932373046875, 1.23590087890625, 1.278564453125, 1.32122802734375, 1.3638916015625, 1.40655517578125, 1.44921875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 18.0, 13.0, 20.0, 17.0, 21.0, 30.0, 29.0, 32.0, 29.0, 48.0, 47.0, 55.0, 53.0, 55.0, 48.0, 38.0, 58.0, 55.0, 52.0, 36.0, 38.0, 33.0, 27.0, 31.0, 18.0, 15.0, 14.0, 9.0, 10.0, 12.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80224609375, -0.7787551879882812, -0.7552642822265625, -0.7317733764648438, -0.708282470703125, -0.6847915649414062, -0.6613006591796875, -0.6378097534179688, -0.61431884765625, -0.5908279418945312, -0.5673370361328125, -0.5438461303710938, -0.520355224609375, -0.49686431884765625, -0.4733734130859375, -0.44988250732421875, -0.4263916015625, -0.40290069580078125, -0.3794097900390625, -0.35591888427734375, -0.332427978515625, -0.30893707275390625, -0.2854461669921875, -0.26195526123046875, -0.23846435546875, -0.21497344970703125, -0.1914825439453125, -0.16799163818359375, -0.144500732421875, -0.12100982666015625, -0.0975189208984375, -0.07402801513671875, -0.050537109375, -0.02704620361328125, -0.0035552978515625, 0.01993560791015625, 0.043426513671875, 0.06691741943359375, 0.0904083251953125, 0.11389923095703125, 0.13739013671875, 0.16088104248046875, 0.1843719482421875, 0.20786285400390625, 0.231353759765625, 0.25484466552734375, 0.2783355712890625, 0.30182647705078125, 0.3253173828125, 0.34880828857421875, 0.3722991943359375, 0.39579010009765625, 0.419281005859375, 0.44277191162109375, 0.4662628173828125, 0.48975372314453125, 0.51324462890625, 0.5367355346679688, 0.5602264404296875, 0.5837173461914062, 0.607208251953125, 0.6306991577148438, 0.6541900634765625, 0.6776809692382812, 0.701171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 8.0, 5.0, 10.0, 10.0, 12.0, 15.0, 27.0, 30.0, 59.0, 78.0, 111.0, 160.0, 257.0, 384.0, 661.0, 1185.0, 2601.0, 7810.0, 39769.0, 624168.0, 324625.0, 34200.0, 7123.0, 2334.0, 1094.0, 603.0, 396.0, 251.0, 181.0, 104.0, 85.0, 52.0, 42.0, 26.0, 27.0, 15.0, 11.0, 6.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.458984375, -2.3924560546875, -2.325927734375, -2.2593994140625, -2.19287109375, -2.1263427734375, -2.059814453125, -1.9932861328125, -1.9267578125, -1.8602294921875, -1.793701171875, -1.7271728515625, -1.66064453125, -1.5941162109375, -1.527587890625, -1.4610595703125, -1.39453125, -1.3280029296875, -1.261474609375, -1.1949462890625, -1.12841796875, -1.0618896484375, -0.995361328125, -0.9288330078125, -0.8623046875, -0.7957763671875, -0.729248046875, -0.6627197265625, -0.59619140625, -0.5296630859375, -0.463134765625, -0.3966064453125, -0.330078125, -0.2635498046875, -0.197021484375, -0.1304931640625, -0.06396484375, 0.0025634765625, 0.069091796875, 0.1356201171875, 0.2021484375, 0.2686767578125, 0.335205078125, 0.4017333984375, 0.46826171875, 0.5347900390625, 0.601318359375, 0.6678466796875, 0.734375, 0.8009033203125, 0.867431640625, 0.9339599609375, 1.00048828125, 1.0670166015625, 1.133544921875, 1.2000732421875, 1.2666015625, 1.3331298828125, 1.399658203125, 1.4661865234375, 1.53271484375, 1.5992431640625, 1.665771484375, 1.7322998046875, 1.798828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 11.0, 16.0, 5.0, 22.0, 18.0, 34.0, 26.0, 41.0, 50.0, 39.0, 33.0, 45.0, 51.0, 65.0, 59.0, 47.0, 57.0, 56.0, 47.0, 32.0, 37.0, 25.0, 24.0, 19.0, 28.0, 16.0, 15.0, 16.0, 8.0, 10.0, 8.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.938934326171875, -1.85833740234375, -1.777740478515625, -1.6971435546875, -1.616546630859375, -1.53594970703125, -1.455352783203125, -1.374755859375, -1.294158935546875, -1.21356201171875, -1.132965087890625, -1.0523681640625, -0.971771240234375, -0.89117431640625, -0.810577392578125, -0.72998046875, -0.649383544921875, -0.56878662109375, -0.488189697265625, -0.4075927734375, -0.326995849609375, -0.24639892578125, -0.165802001953125, -0.085205078125, -0.004608154296875, 0.07598876953125, 0.156585693359375, 0.2371826171875, 0.317779541015625, 0.39837646484375, 0.478973388671875, 0.5595703125, 0.640167236328125, 0.72076416015625, 0.801361083984375, 0.8819580078125, 0.962554931640625, 1.04315185546875, 1.123748779296875, 1.204345703125, 1.284942626953125, 1.36553955078125, 1.446136474609375, 1.5267333984375, 1.607330322265625, 1.68792724609375, 1.768524169921875, 1.84912109375, 1.929718017578125, 2.01031494140625, 2.090911865234375, 2.1715087890625, 2.252105712890625, 2.33270263671875, 2.413299560546875, 2.493896484375, 2.574493408203125, 2.65509033203125, 2.735687255859375, 2.8162841796875, 2.896881103515625, 2.97747802734375, 3.058074951171875, 3.138671875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 6.0, 2.0, 5.0, 5.0, 12.0, 15.0, 15.0, 19.0, 20.0, 32.0, 57.0, 49.0, 92.0, 144.0, 238.0, 378.0, 754.0, 1676.0, 4286.0, 13468.0, 56647.0, 607607.0, 295138.0, 48852.0, 11878.0, 3906.0, 1506.0, 741.0, 370.0, 201.0, 132.0, 83.0, 49.0, 48.0, 29.0, 21.0, 14.0, 16.0, 9.0, 5.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.454345703125, -0.4409637451171875, -0.427581787109375, -0.4141998291015625, -0.40081787109375, -0.3874359130859375, -0.374053955078125, -0.3606719970703125, -0.3472900390625, -0.3339080810546875, -0.320526123046875, -0.3071441650390625, -0.29376220703125, -0.2803802490234375, -0.266998291015625, -0.2536163330078125, -0.240234375, -0.2268524169921875, -0.213470458984375, -0.2000885009765625, -0.18670654296875, -0.1733245849609375, -0.159942626953125, -0.1465606689453125, -0.1331787109375, -0.1197967529296875, -0.106414794921875, -0.0930328369140625, -0.07965087890625, -0.0662689208984375, -0.052886962890625, -0.0395050048828125, -0.026123046875, -0.0127410888671875, 0.000640869140625, 0.0140228271484375, 0.02740478515625, 0.0407867431640625, 0.054168701171875, 0.0675506591796875, 0.0809326171875, 0.0943145751953125, 0.107696533203125, 0.1210784912109375, 0.13446044921875, 0.1478424072265625, 0.161224365234375, 0.1746063232421875, 0.18798828125, 0.2013702392578125, 0.214752197265625, 0.2281341552734375, 0.24151611328125, 0.2548980712890625, 0.268280029296875, 0.2816619873046875, 0.2950439453125, 0.3084259033203125, 0.321807861328125, 0.3351898193359375, 0.34857177734375, 0.3619537353515625, 0.375335693359375, 0.3887176513671875, 0.402099609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 5.0, 14.0, 18.0, 16.0, 23.0, 26.0, 33.0, 36.0, 50.0, 88.0, 97.0, 138.0, 108.0, 76.0, 42.0, 42.0, 39.0, 31.0, 21.0, 15.0, 11.0, 11.0, 8.0, 6.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015938282012939453, -0.00015443749725818634, -0.00014949217438697815, -0.00014454685151576996, -0.00013960152864456177, -0.00013465620577335358, -0.00012971088290214539, -0.0001247655600309372, -0.000119820237159729, -0.00011487491428852081, -0.00010992959141731262, -0.00010498426854610443, -0.00010003894567489624, -9.509362280368805e-05, -9.014829993247986e-05, -8.520297706127167e-05, -8.025765419006348e-05, -7.531233131885529e-05, -7.03670084476471e-05, -6.54216855764389e-05, -6.047636270523071e-05, -5.553103983402252e-05, -5.058571696281433e-05, -4.564039409160614e-05, -4.069507122039795e-05, -3.574974834918976e-05, -3.080442547798157e-05, -2.5859102606773376e-05, -2.0913779735565186e-05, -1.5968456864356995e-05, -1.1023133993148804e-05, -6.077811121940613e-06, -1.1324882507324219e-06, 3.812834620475769e-06, 8.75815749168396e-06, 1.3703480362892151e-05, 1.8648803234100342e-05, 2.3594126105308533e-05, 2.8539448976516724e-05, 3.3484771847724915e-05, 3.8430094718933105e-05, 4.3375417590141296e-05, 4.832074046134949e-05, 5.326606333255768e-05, 5.821138620376587e-05, 6.315670907497406e-05, 6.810203194618225e-05, 7.304735481739044e-05, 7.799267768859863e-05, 8.293800055980682e-05, 8.788332343101501e-05, 9.28286463022232e-05, 9.77739691734314e-05, 0.00010271929204463959, 0.00010766461491584778, 0.00011260993778705597, 0.00011755526065826416, 0.00012250058352947235, 0.00012744590640068054, 0.00013239122927188873, 0.00013733655214309692, 0.00014228187501430511, 0.0001472271978855133, 0.0001521725207567215, 0.0001571178436279297]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 6.0, 4.0, 4.0, 11.0, 9.0, 17.0, 27.0, 31.0, 46.0, 83.0, 124.0, 240.0, 388.0, 743.0, 1673.0, 4634.0, 19159.0, 123588.0, 775429.0, 99061.0, 15856.0, 4200.0, 1582.0, 734.0, 359.0, 233.0, 103.0, 64.0, 56.0, 25.0, 18.0, 7.0, 13.0, 9.0, 6.0, 3.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.4225921630859375, -0.407196044921875, -0.3917999267578125, -0.37640380859375, -0.3610076904296875, -0.345611572265625, -0.3302154541015625, -0.3148193359375, -0.2994232177734375, -0.284027099609375, -0.2686309814453125, -0.25323486328125, -0.2378387451171875, -0.222442626953125, -0.2070465087890625, -0.191650390625, -0.1762542724609375, -0.160858154296875, -0.1454620361328125, -0.13006591796875, -0.1146697998046875, -0.099273681640625, -0.0838775634765625, -0.0684814453125, -0.0530853271484375, -0.037689208984375, -0.0222930908203125, -0.00689697265625, 0.0084991455078125, 0.023895263671875, 0.0392913818359375, 0.0546875, 0.0700836181640625, 0.085479736328125, 0.1008758544921875, 0.11627197265625, 0.1316680908203125, 0.147064208984375, 0.1624603271484375, 0.1778564453125, 0.1932525634765625, 0.208648681640625, 0.2240447998046875, 0.23944091796875, 0.2548370361328125, 0.270233154296875, 0.2856292724609375, 0.301025390625, 0.3164215087890625, 0.331817626953125, 0.3472137451171875, 0.36260986328125, 0.3780059814453125, 0.393402099609375, 0.4087982177734375, 0.4241943359375, 0.4395904541015625, 0.454986572265625, 0.4703826904296875, 0.48577880859375, 0.5011749267578125, 0.516571044921875, 0.5319671630859375, 0.54736328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 12.0, 4.0, 8.0, 7.0, 20.0, 13.0, 28.0, 35.0, 46.0, 54.0, 77.0, 111.0, 106.0, 116.0, 90.0, 70.0, 50.0, 43.0, 36.0, 27.0, 16.0, 11.0, 10.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42724609375, -0.40856170654296875, -0.3898773193359375, -0.37119293212890625, -0.352508544921875, -0.33382415771484375, -0.3151397705078125, -0.29645538330078125, -0.27777099609375, -0.25908660888671875, -0.2404022216796875, -0.22171783447265625, -0.203033447265625, -0.18434906005859375, -0.1656646728515625, -0.14698028564453125, -0.1282958984375, -0.10961151123046875, -0.0909271240234375, -0.07224273681640625, -0.053558349609375, -0.03487396240234375, -0.0161895751953125, 0.00249481201171875, 0.02117919921875, 0.03986358642578125, 0.0585479736328125, 0.07723236083984375, 0.095916748046875, 0.11460113525390625, 0.1332855224609375, 0.15196990966796875, 0.170654296875, 0.18933868408203125, 0.2080230712890625, 0.22670745849609375, 0.245391845703125, 0.26407623291015625, 0.2827606201171875, 0.30144500732421875, 0.32012939453125, 0.33881378173828125, 0.3574981689453125, 0.37618255615234375, 0.394866943359375, 0.41355133056640625, 0.4322357177734375, 0.45092010498046875, 0.4696044921875, 0.48828887939453125, 0.5069732666015625, 0.5256576538085938, 0.544342041015625, 0.5630264282226562, 0.5817108154296875, 0.6003952026367188, 0.61907958984375, 0.6377639770507812, 0.6564483642578125, 0.6751327514648438, 0.693817138671875, 0.7125015258789062, 0.7311859130859375, 0.7498703002929688, 0.7685546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 15.0, 31.0, 78.0, 175.0, 397.0, 163.0, 81.0, 31.0, 14.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.51604461669922, -25.905879974365234, -25.295713424682617, -24.685548782348633, -24.075382232666016, -23.46521759033203, -22.855052947998047, -22.244888305664062, -21.634721755981445, -21.02455711364746, -20.414390563964844, -19.80422592163086, -19.194061279296875, -18.583894729614258, -17.973730087280273, -17.363563537597656, -16.753398895263672, -16.143234252929688, -15.53306770324707, -14.922903060913086, -14.312737464904785, -13.702571868896484, -13.0924072265625, -12.4822416305542, -11.872076034545898, -11.261910438537598, -10.651744842529297, -10.041580200195312, -9.431414604187012, -8.821249008178711, -8.211084365844727, -7.600918769836426, -6.990755081176758, -6.380589485168457, -5.7704243659973145, -5.160259246826172, -4.550093650817871, -3.9399282932281494, -3.3297629356384277, -2.719597816467285, -2.1094322204589844, -1.4992668628692627, -0.889101505279541, -0.27893614768981934, 0.33122920989990234, 0.941394567489624, 1.5515599250793457, 2.1617250442504883, 2.771890640258789, 3.3820559978485107, 3.9922213554382324, 4.602386474609375, 5.212552070617676, 5.822717666625977, 6.432882785797119, 7.043047904968262, 7.6532135009765625, 8.263379096984863, 8.873544692993164, 9.483709335327148, 10.09387493133545, 10.70404052734375, 11.314205169677734, 11.924370765686035, 12.534536361694336]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 9.0, 12.0, 15.0, 17.0, 17.0, 31.0, 27.0, 43.0, 20.0, 31.0, 55.0, 69.0, 134.0, 136.0, 62.0, 41.0, 35.0, 32.0, 28.0, 30.0, 25.0, 22.0, 19.0, 13.0, 11.0, 14.0, 7.0, 5.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.461490631103516, -12.114842414855957, -11.768194198608398, -11.421546936035156, -11.074898719787598, -10.728250503540039, -10.38160228729248, -10.034954071044922, -9.688305854797363, -9.341657638549805, -8.995009422302246, -8.648361206054688, -8.301713943481445, -7.955065727233887, -7.608417510986328, -7.2617692947387695, -6.915121555328369, -6.5684733390808105, -6.22182559967041, -5.875177383422852, -5.528529167175293, -5.181880950927734, -4.835233211517334, -4.488584995269775, -4.141937255859375, -3.7952892780303955, -3.448641061782837, -3.1019930839538574, -2.755344867706299, -2.4086968898773193, -2.06204891204834, -1.7154006958007812, -1.3687524795532227, -1.0221043825149536, -0.6754563450813293, -0.3288083076477051, 0.017839789390563965, 0.364487886428833, 0.7111358642578125, 1.057784080505371, 1.4044320583343506, 1.7510801553726196, 2.0977282524108887, 2.444376230239868, 2.7910242080688477, 3.1376724243164062, 3.4843204021453857, 3.8309686183929443, 4.177616596221924, 4.524264812469482, 4.870912551879883, 5.217560768127441, 5.564208984375, 5.910857200622559, 6.257504940032959, 6.604153156280518, 6.950800895690918, 7.297449111938477, 7.644096851348877, 7.9907450675964355, 8.337392807006836, 8.684041023254395, 9.030689239501953, 9.377337455749512, 9.72398567199707]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 8.0, 21.0, 30.0, 38.0, 58.0, 89.0, 147.0, 217.0, 316.0, 558.0, 1054.0, 2027.0, 4548.0, 11522.0, 39833.0, 202242.0, 1118345.0, 2064728.0, 605147.0, 104551.0, 24263.0, 7821.0, 3213.0, 1498.0, 775.0, 453.0, 289.0, 181.0, 103.0, 67.0, 47.0, 31.0, 23.0, 18.0, 4.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.0054931640625, -0.969970703125, -0.9344482421875, -0.89892578125, -0.8634033203125, -0.827880859375, -0.7923583984375, -0.7568359375, -0.7213134765625, -0.685791015625, -0.6502685546875, -0.61474609375, -0.5792236328125, -0.543701171875, -0.5081787109375, -0.47265625, -0.4371337890625, -0.401611328125, -0.3660888671875, -0.33056640625, -0.2950439453125, -0.259521484375, -0.2239990234375, -0.1884765625, -0.1529541015625, -0.117431640625, -0.0819091796875, -0.04638671875, -0.0108642578125, 0.024658203125, 0.0601806640625, 0.095703125, 0.1312255859375, 0.166748046875, 0.2022705078125, 0.23779296875, 0.2733154296875, 0.308837890625, 0.3443603515625, 0.3798828125, 0.4154052734375, 0.450927734375, 0.4864501953125, 0.52197265625, 0.5574951171875, 0.593017578125, 0.6285400390625, 0.6640625, 0.6995849609375, 0.735107421875, 0.7706298828125, 0.80615234375, 0.8416748046875, 0.877197265625, 0.9127197265625, 0.9482421875, 0.9837646484375, 1.019287109375, 1.0548095703125, 1.09033203125, 1.1258544921875, 1.161376953125, 1.1968994140625, 1.232421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 7.0, 11.0, 15.0, 15.0, 20.0, 18.0, 14.0, 29.0, 28.0, 41.0, 39.0, 40.0, 43.0, 52.0, 51.0, 47.0, 49.0, 60.0, 48.0, 63.0, 48.0, 40.0, 27.0, 39.0, 24.0, 28.0, 21.0, 18.0, 14.0, 9.0, 9.0, 17.0, 4.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80322265625, -0.77972412109375, -0.7562255859375, -0.73272705078125, -0.709228515625, -0.68572998046875, -0.6622314453125, -0.63873291015625, -0.615234375, -0.59173583984375, -0.5682373046875, -0.54473876953125, -0.521240234375, -0.49774169921875, -0.4742431640625, -0.45074462890625, -0.42724609375, -0.40374755859375, -0.3802490234375, -0.35675048828125, -0.333251953125, -0.30975341796875, -0.2862548828125, -0.26275634765625, -0.2392578125, -0.21575927734375, -0.1922607421875, -0.16876220703125, -0.145263671875, -0.12176513671875, -0.0982666015625, -0.07476806640625, -0.05126953125, -0.02777099609375, -0.0042724609375, 0.01922607421875, 0.042724609375, 0.06622314453125, 0.0897216796875, 0.11322021484375, 0.13671875, 0.16021728515625, 0.1837158203125, 0.20721435546875, 0.230712890625, 0.25421142578125, 0.2777099609375, 0.30120849609375, 0.32470703125, 0.34820556640625, 0.3717041015625, 0.39520263671875, 0.418701171875, 0.44219970703125, 0.4656982421875, 0.48919677734375, 0.5126953125, 0.53619384765625, 0.5596923828125, 0.58319091796875, 0.606689453125, 0.63018798828125, 0.6536865234375, 0.67718505859375, 0.70068359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 7.0, 10.0, 15.0, 31.0, 60.0, 131.0, 271.0, 718.0, 3120.0, 209019.0, 3971676.0, 7484.0, 1125.0, 348.0, 146.0, 70.0, 27.0, 18.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2265625, -5.9974365234375, -5.768310546875, -5.5391845703125, -5.31005859375, -5.0809326171875, -4.851806640625, -4.6226806640625, -4.3935546875, -4.1644287109375, -3.935302734375, -3.7061767578125, -3.47705078125, -3.2479248046875, -3.018798828125, -2.7896728515625, -2.560546875, -2.3314208984375, -2.102294921875, -1.8731689453125, -1.64404296875, -1.4149169921875, -1.185791015625, -0.9566650390625, -0.7275390625, -0.4984130859375, -0.269287109375, -0.0401611328125, 0.18896484375, 0.4180908203125, 0.647216796875, 0.8763427734375, 1.10546875, 1.3345947265625, 1.563720703125, 1.7928466796875, 2.02197265625, 2.2510986328125, 2.480224609375, 2.7093505859375, 2.9384765625, 3.1676025390625, 3.396728515625, 3.6258544921875, 3.85498046875, 4.0841064453125, 4.313232421875, 4.5423583984375, 4.771484375, 5.0006103515625, 5.229736328125, 5.4588623046875, 5.68798828125, 5.9171142578125, 6.146240234375, 6.3753662109375, 6.6044921875, 6.8336181640625, 7.062744140625, 7.2918701171875, 7.52099609375, 7.7501220703125, 7.979248046875, 8.2083740234375, 8.4375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 12.0, 17.0, 38.0, 67.0, 144.0, 248.0, 458.0, 834.0, 918.0, 607.0, 321.0, 187.0, 100.0, 48.0, 35.0, 14.0, 10.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.390625, -5.2786712646484375, -5.166717529296875, -5.0547637939453125, -4.94281005859375, -4.8308563232421875, -4.718902587890625, -4.6069488525390625, -4.4949951171875, -4.3830413818359375, -4.271087646484375, -4.1591339111328125, -4.04718017578125, -3.9352264404296875, -3.823272705078125, -3.7113189697265625, -3.599365234375, -3.4874114990234375, -3.375457763671875, -3.2635040283203125, -3.15155029296875, -3.0395965576171875, -2.927642822265625, -2.8156890869140625, -2.7037353515625, -2.5917816162109375, -2.479827880859375, -2.3678741455078125, -2.25592041015625, -2.1439666748046875, -2.032012939453125, -1.9200592041015625, -1.80810546875, -1.6961517333984375, -1.584197998046875, -1.4722442626953125, -1.36029052734375, -1.2483367919921875, -1.136383056640625, -1.0244293212890625, -0.9124755859375, -0.8005218505859375, -0.688568115234375, -0.5766143798828125, -0.46466064453125, -0.3527069091796875, -0.240753173828125, -0.1287994384765625, -0.016845703125, 0.0951080322265625, 0.207061767578125, 0.3190155029296875, 0.43096923828125, 0.5429229736328125, 0.654876708984375, 0.7668304443359375, 0.8787841796875, 0.9907379150390625, 1.102691650390625, 1.2146453857421875, 1.32659912109375, 1.4385528564453125, 1.550506591796875, 1.6624603271484375, 1.7744140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 10.0, 7.0, 11.0, 45.0, 90.0, 203.0, 275.0, 173.0, 99.0, 45.0, 12.0, 12.0, 12.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.668264389038086, -29.586027145385742, -28.5037899017334, -27.421550750732422, -26.339313507080078, -25.257076263427734, -24.17483901977539, -23.092601776123047, -22.010364532470703, -20.92812728881836, -19.845890045166016, -18.763652801513672, -17.681413650512695, -16.59917640686035, -15.516939163208008, -14.434701919555664, -13.352462768554688, -12.270225524902344, -11.187987327575684, -10.10575008392334, -9.02351188659668, -7.941274642944336, -6.859037399291992, -5.77679967880249, -4.694561958312988, -3.6123242378234863, -2.5300867557525635, -1.4478492736816406, -0.36561155319213867, 0.7166261672973633, 1.798863410949707, 2.881101131439209, 3.9633407592773438, 5.045578479766846, 6.127816200256348, 7.210053443908691, 8.292291641235352, 9.374528884887695, 10.456766128540039, 11.539003372192383, 12.621241569519043, 13.703478813171387, 14.785717010498047, 15.86795425415039, 16.950191497802734, 18.032428741455078, 19.114665985107422, 20.1969051361084, 21.279142379760742, 22.361379623413086, 23.44361686706543, 24.525856018066406, 25.60809326171875, 26.690330505371094, 27.772567749023438, 28.85480499267578, 29.937042236328125, 31.01927947998047, 32.10151672363281, 33.183753967285156, 34.2659912109375, 35.348228454589844, 36.43046569824219, 37.5127067565918, 38.59494400024414]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 8.0, 17.0, 16.0, 33.0, 46.0, 45.0, 52.0, 71.0, 78.0, 91.0, 120.0, 83.0, 94.0, 64.0, 46.0, 41.0, 28.0, 28.0, 15.0, 10.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.39293670654297, -26.723655700683594, -26.05437660217285, -25.385095596313477, -24.7158145904541, -24.04653549194336, -23.377254486083984, -22.70797348022461, -22.038692474365234, -21.36941146850586, -20.700132369995117, -20.030851364135742, -19.361570358276367, -18.692291259765625, -18.02301025390625, -17.353729248046875, -16.684450149536133, -16.015169143676758, -15.3458890914917, -14.67660903930664, -14.007328033447266, -13.338047981262207, -12.668767929077148, -11.999486923217773, -11.330206871032715, -10.660926818847656, -9.991645812988281, -9.322365760803223, -8.653085708618164, -7.983804702758789, -7.3145246505737305, -6.645244121551514, -5.975963592529297, -5.30668306350708, -4.637402534484863, -3.9681224822998047, -3.298841953277588, -2.629561424255371, -1.9602813720703125, -1.2910008430480957, -0.6217203140258789, 0.04756009578704834, 0.7168405055999756, 1.3861207962036133, 2.05540132522583, 2.724681854248047, 3.3939619064331055, 4.063242435455322, 4.732522964477539, 5.401803493499756, 6.071084022521973, 6.740364074707031, 7.409644603729248, 8.078925132751465, 8.748205184936523, 9.417486190795898, 10.086766242980957, 10.756046295166016, 11.42532730102539, 12.09460735321045, 12.763887405395508, 13.433168411254883, 14.102448463439941, 14.771728515625, 15.441009521484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 14.0, 11.0, 20.0, 37.0, 66.0, 137.0, 269.0, 556.0, 1354.0, 3695.0, 12503.0, 57500.0, 522163.0, 386250.0, 47414.0, 10852.0, 3387.0, 1249.0, 524.0, 244.0, 125.0, 78.0, 35.0, 22.0, 16.0, 9.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.2501220703125, -2.183837890625, -2.1175537109375, -2.05126953125, -1.9849853515625, -1.918701171875, -1.8524169921875, -1.7861328125, -1.7198486328125, -1.653564453125, -1.5872802734375, -1.52099609375, -1.4547119140625, -1.388427734375, -1.3221435546875, -1.255859375, -1.1895751953125, -1.123291015625, -1.0570068359375, -0.99072265625, -0.9244384765625, -0.858154296875, -0.7918701171875, -0.7255859375, -0.6593017578125, -0.593017578125, -0.5267333984375, -0.46044921875, -0.3941650390625, -0.327880859375, -0.2615966796875, -0.1953125, -0.1290283203125, -0.062744140625, 0.0035400390625, 0.06982421875, 0.1361083984375, 0.202392578125, 0.2686767578125, 0.3349609375, 0.4012451171875, 0.467529296875, 0.5338134765625, 0.60009765625, 0.6663818359375, 0.732666015625, 0.7989501953125, 0.865234375, 0.9315185546875, 0.997802734375, 1.0640869140625, 1.13037109375, 1.1966552734375, 1.262939453125, 1.3292236328125, 1.3955078125, 1.4617919921875, 1.528076171875, 1.5943603515625, 1.66064453125, 1.7269287109375, 1.793212890625, 1.8594970703125, 1.92578125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 19.0, 31.0, 32.0, 46.0, 43.0, 85.0, 84.0, 91.0, 81.0, 104.0, 100.0, 70.0, 62.0, 42.0, 33.0, 28.0, 16.0, 6.0, 5.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0], "bins": [-2.29296875, -2.2446746826171875, -2.196380615234375, -2.1480865478515625, -2.09979248046875, -2.0514984130859375, -2.003204345703125, -1.9549102783203125, -1.9066162109375, -1.8583221435546875, -1.810028076171875, -1.7617340087890625, -1.71343994140625, -1.6651458740234375, -1.616851806640625, -1.5685577392578125, -1.520263671875, -1.4719696044921875, -1.423675537109375, -1.3753814697265625, -1.32708740234375, -1.2787933349609375, -1.230499267578125, -1.1822052001953125, -1.1339111328125, -1.0856170654296875, -1.037322998046875, -0.9890289306640625, -0.94073486328125, -0.8924407958984375, -0.844146728515625, -0.7958526611328125, -0.74755859375, -0.6992645263671875, -0.650970458984375, -0.6026763916015625, -0.55438232421875, -0.5060882568359375, -0.457794189453125, -0.4095001220703125, -0.3612060546875, -0.3129119873046875, -0.264617919921875, -0.2163238525390625, -0.16802978515625, -0.1197357177734375, -0.071441650390625, -0.0231475830078125, 0.025146484375, 0.0734405517578125, 0.121734619140625, 0.1700286865234375, 0.21832275390625, 0.2666168212890625, 0.314910888671875, 0.3632049560546875, 0.4114990234375, 0.4597930908203125, 0.508087158203125, 0.5563812255859375, 0.60467529296875, 0.6529693603515625, 0.701263427734375, 0.7495574951171875, 0.7978515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 7.0, 9.0, 17.0, 15.0, 30.0, 33.0, 48.0, 88.0, 158.0, 272.0, 505.0, 1237.0, 3836.0, 18316.0, 216124.0, 776640.0, 23898.0, 4516.0, 1415.0, 591.0, 320.0, 147.0, 111.0, 54.0, 49.0, 36.0, 15.0, 9.0, 11.0, 9.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.066986083984375, -1.99334716796875, -1.919708251953125, -1.8460693359375, -1.772430419921875, -1.69879150390625, -1.625152587890625, -1.551513671875, -1.477874755859375, -1.40423583984375, -1.330596923828125, -1.2569580078125, -1.183319091796875, -1.10968017578125, -1.036041259765625, -0.96240234375, -0.888763427734375, -0.81512451171875, -0.741485595703125, -0.6678466796875, -0.594207763671875, -0.52056884765625, -0.446929931640625, -0.373291015625, -0.299652099609375, -0.22601318359375, -0.152374267578125, -0.0787353515625, -0.005096435546875, 0.06854248046875, 0.142181396484375, 0.2158203125, 0.289459228515625, 0.36309814453125, 0.436737060546875, 0.5103759765625, 0.584014892578125, 0.65765380859375, 0.731292724609375, 0.804931640625, 0.878570556640625, 0.95220947265625, 1.025848388671875, 1.0994873046875, 1.173126220703125, 1.24676513671875, 1.320404052734375, 1.39404296875, 1.467681884765625, 1.54132080078125, 1.614959716796875, 1.6885986328125, 1.762237548828125, 1.83587646484375, 1.909515380859375, 1.983154296875, 2.056793212890625, 2.13043212890625, 2.204071044921875, 2.2777099609375, 2.351348876953125, 2.42498779296875, 2.498626708984375, 2.572265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 6.0, 8.0, 8.0, 8.0, 11.0, 8.0, 16.0, 13.0, 30.0, 32.0, 45.0, 50.0, 83.0, 85.0, 102.0, 84.0, 76.0, 84.0, 56.0, 36.0, 31.0, 20.0, 25.0, 15.0, 15.0, 23.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.38177490234375, -3.2401123046875, -3.09844970703125, -2.956787109375, -2.81512451171875, -2.6734619140625, -2.53179931640625, -2.39013671875, -2.24847412109375, -2.1068115234375, -1.96514892578125, -1.823486328125, -1.68182373046875, -1.5401611328125, -1.39849853515625, -1.2568359375, -1.11517333984375, -0.9735107421875, -0.83184814453125, -0.690185546875, -0.54852294921875, -0.4068603515625, -0.26519775390625, -0.12353515625, 0.01812744140625, 0.1597900390625, 0.30145263671875, 0.443115234375, 0.58477783203125, 0.7264404296875, 0.86810302734375, 1.009765625, 1.15142822265625, 1.2930908203125, 1.43475341796875, 1.576416015625, 1.71807861328125, 1.8597412109375, 2.00140380859375, 2.14306640625, 2.28472900390625, 2.4263916015625, 2.56805419921875, 2.709716796875, 2.85137939453125, 2.9930419921875, 3.13470458984375, 3.2763671875, 3.41802978515625, 3.5596923828125, 3.70135498046875, 3.843017578125, 3.98468017578125, 4.1263427734375, 4.26800537109375, 4.40966796875, 4.55133056640625, 4.6929931640625, 4.83465576171875, 4.976318359375, 5.11798095703125, 5.2596435546875, 5.40130615234375, 5.54296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 2.0, 6.0, 14.0, 13.0, 16.0, 16.0, 16.0, 23.0, 45.0, 64.0, 74.0, 153.0, 336.0, 708.0, 1673.0, 5508.0, 22965.0, 278047.0, 705378.0, 24581.0, 5498.0, 1806.0, 764.0, 345.0, 167.0, 109.0, 53.0, 47.0, 27.0, 18.0, 10.0, 14.0, 16.0, 6.0, 4.0, 6.0, 6.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452392578125, -0.438690185546875, -0.42498779296875, -0.411285400390625, -0.3975830078125, -0.383880615234375, -0.37017822265625, -0.356475830078125, -0.3427734375, -0.329071044921875, -0.31536865234375, -0.301666259765625, -0.2879638671875, -0.274261474609375, -0.26055908203125, -0.246856689453125, -0.233154296875, -0.219451904296875, -0.20574951171875, -0.192047119140625, -0.1783447265625, -0.164642333984375, -0.15093994140625, -0.137237548828125, -0.12353515625, -0.109832763671875, -0.09613037109375, -0.082427978515625, -0.0687255859375, -0.055023193359375, -0.04132080078125, -0.027618408203125, -0.013916015625, -0.000213623046875, 0.01348876953125, 0.027191162109375, 0.0408935546875, 0.054595947265625, 0.06829833984375, 0.082000732421875, 0.095703125, 0.109405517578125, 0.12310791015625, 0.136810302734375, 0.1505126953125, 0.164215087890625, 0.17791748046875, 0.191619873046875, 0.205322265625, 0.219024658203125, 0.23272705078125, 0.246429443359375, 0.2601318359375, 0.273834228515625, 0.28753662109375, 0.301239013671875, 0.31494140625, 0.328643798828125, 0.34234619140625, 0.356048583984375, 0.3697509765625, 0.383453369140625, 0.39715576171875, 0.410858154296875, 0.424560546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 5.0, 14.0, 12.0, 20.0, 25.0, 33.0, 41.0, 74.0, 107.0, 118.0, 115.0, 122.0, 86.0, 50.0, 36.0, 34.0, 19.0, 15.0, 13.0, 11.0, 10.0, 10.0, 7.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00015151500701904297, -0.00014719553291797638, -0.0001428760588169098, -0.0001385565847158432, -0.0001342371106147766, -0.00012991763651371002, -0.00012559816241264343, -0.00012127868831157684, -0.00011695921421051025, -0.00011263974010944366, -0.00010832026600837708, -0.00010400079190731049, -9.96813178062439e-05, -9.536184370517731e-05, -9.104236960411072e-05, -8.672289550304413e-05, -8.240342140197754e-05, -7.808394730091095e-05, -7.376447319984436e-05, -6.944499909877777e-05, -6.512552499771118e-05, -6.080605089664459e-05, -5.6486576795578e-05, -5.2167102694511414e-05, -4.7847628593444824e-05, -4.3528154492378235e-05, -3.9208680391311646e-05, -3.4889206290245056e-05, -3.056973218917847e-05, -2.6250258088111877e-05, -2.1930783987045288e-05, -1.76113098859787e-05, -1.329183578491211e-05, -8.97236168384552e-06, -4.652887582778931e-06, -3.334134817123413e-07, 3.986060619354248e-06, 8.305534720420837e-06, 1.2625008821487427e-05, 1.6944482922554016e-05, 2.1263957023620605e-05, 2.5583431124687195e-05, 2.9902905225753784e-05, 3.4222379326820374e-05, 3.854185342788696e-05, 4.286132752895355e-05, 4.718080163002014e-05, 5.150027573108673e-05, 5.581974983215332e-05, 6.013922393321991e-05, 6.44586980342865e-05, 6.877817213535309e-05, 7.309764623641968e-05, 7.741712033748627e-05, 8.173659443855286e-05, 8.605606853961945e-05, 9.037554264068604e-05, 9.469501674175262e-05, 9.901449084281921e-05, 0.0001033339649438858, 0.00010765343904495239, 0.00011197291314601898, 0.00011629238724708557, 0.00012061186134815216, 0.00012493133544921875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 10.0, 5.0, 15.0, 16.0, 14.0, 9.0, 16.0, 24.0, 37.0, 37.0, 90.0, 120.0, 167.0, 277.0, 477.0, 766.0, 1465.0, 3154.0, 7183.0, 19269.0, 67481.0, 755160.0, 140389.0, 32404.0, 11013.0, 4370.0, 2043.0, 969.0, 594.0, 316.0, 202.0, 140.0, 85.0, 56.0, 51.0, 33.0, 29.0, 17.0, 10.0, 7.0, 9.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 3.0, 4.0], "bins": [-0.255859375, -0.24889183044433594, -0.24192428588867188, -0.2349567413330078, -0.22798919677734375, -0.2210216522216797, -0.21405410766601562, -0.20708656311035156, -0.2001190185546875, -0.19315147399902344, -0.18618392944335938, -0.1792163848876953, -0.17224884033203125, -0.1652812957763672, -0.15831375122070312, -0.15134620666503906, -0.144378662109375, -0.13741111755371094, -0.13044357299804688, -0.12347602844238281, -0.11650848388671875, -0.10954093933105469, -0.10257339477539062, -0.09560585021972656, -0.0886383056640625, -0.08167076110839844, -0.07470321655273438, -0.06773567199707031, -0.06076812744140625, -0.05380058288574219, -0.046833038330078125, -0.03986549377441406, -0.03289794921875, -0.025930404663085938, -0.018962860107421875, -0.011995315551757812, -0.00502777099609375, 0.0019397735595703125, 0.008907318115234375, 0.015874862670898438, 0.0228424072265625, 0.029809951782226562, 0.036777496337890625, 0.04374504089355469, 0.05071258544921875, 0.05768013000488281, 0.06464767456054688, 0.07161521911621094, 0.078582763671875, 0.08555030822753906, 0.09251785278320312, 0.09948539733886719, 0.10645294189453125, 0.11342048645019531, 0.12038803100585938, 0.12735557556152344, 0.1343231201171875, 0.14129066467285156, 0.14825820922851562, 0.1552257537841797, 0.16219329833984375, 0.1691608428955078, 0.17612838745117188, 0.18309593200683594, 0.1900634765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 7.0, 5.0, 5.0, 0.0, 6.0, 7.0, 8.0, 7.0, 9.0, 24.0, 20.0, 17.0, 24.0, 36.0, 50.0, 73.0, 107.0, 92.0, 104.0, 122.0, 65.0, 51.0, 35.0, 34.0, 28.0, 12.0, 7.0, 9.0, 4.0, 7.0, 7.0, 8.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32275390625, -0.3111572265625, -0.299560546875, -0.2879638671875, -0.2763671875, -0.2647705078125, -0.253173828125, -0.2415771484375, -0.22998046875, -0.2183837890625, -0.206787109375, -0.1951904296875, -0.18359375, -0.1719970703125, -0.160400390625, -0.1488037109375, -0.13720703125, -0.1256103515625, -0.114013671875, -0.1024169921875, -0.0908203125, -0.0792236328125, -0.067626953125, -0.0560302734375, -0.04443359375, -0.0328369140625, -0.021240234375, -0.0096435546875, 0.001953125, 0.0135498046875, 0.025146484375, 0.0367431640625, 0.04833984375, 0.0599365234375, 0.071533203125, 0.0831298828125, 0.0947265625, 0.1063232421875, 0.117919921875, 0.1295166015625, 0.14111328125, 0.1527099609375, 0.164306640625, 0.1759033203125, 0.1875, 0.1990966796875, 0.210693359375, 0.2222900390625, 0.23388671875, 0.2454833984375, 0.257080078125, 0.2686767578125, 0.2802734375, 0.2918701171875, 0.303466796875, 0.3150634765625, 0.32666015625, 0.3382568359375, 0.349853515625, 0.3614501953125, 0.373046875, 0.3846435546875, 0.396240234375, 0.4078369140625, 0.41943359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 9.0, 29.0, 26.0, 54.0, 122.0, 535.0, 108.0, 55.0, 28.0, 16.0, 9.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.833745956420898, -14.199544906616211, -13.565343856811523, -12.931142807006836, -12.296941757202148, -11.662740707397461, -11.02854061126709, -10.394339561462402, -9.760138511657715, -9.125937461853027, -8.49173641204834, -7.8575358390808105, -7.223334789276123, -6.5891337394714355, -5.954933166503906, -5.320732116699219, -4.686531066894531, -4.052330017089844, -3.4181292057037354, -2.783928394317627, -2.1497273445129395, -1.515526294708252, -0.8813254833221436, -0.24712467193603516, 0.38707637786865234, 1.0212773084640503, 1.6554782390594482, 2.2896790504455566, 2.923880100250244, 3.5580811500549316, 4.192281723022461, 4.826482772827148, 5.460683822631836, 6.094884872436523, 6.729085922241211, 7.36328649520874, 7.997487545013428, 8.631689071655273, 9.265889167785645, 9.900090217590332, 10.53429126739502, 11.168492317199707, 11.802693367004395, 12.436894416809082, 13.071094512939453, 13.70529556274414, 14.339496612548828, 14.973697662353516, 15.607898712158203, 16.24209976196289, 16.876300811767578, 17.510501861572266, 18.144702911376953, 18.77890396118164, 19.413105010986328, 20.047306060791016, 20.681507110595703, 21.31570816040039, 21.949909210205078, 22.584110260009766, 23.218311309814453, 23.85251235961914, 24.486713409423828, 25.120914459228516, 25.75511360168457]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 7.0, 8.0, 7.0, 12.0, 19.0, 15.0, 18.0, 29.0, 29.0, 25.0, 27.0, 51.0, 154.0, 255.0, 107.0, 30.0, 23.0, 21.0, 19.0, 19.0, 21.0, 14.0, 18.0, 15.0, 12.0, 8.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.662029266357422, -10.321331024169922, -9.980632781982422, -9.639934539794922, -9.299236297607422, -8.958538055419922, -8.617839813232422, -8.277141571044922, -7.93644380569458, -7.59574556350708, -7.25504732131958, -6.914349555969238, -6.573651313781738, -6.232953071594238, -5.892254829406738, -5.551556587219238, -5.210858345031738, -4.870160102844238, -4.529461860656738, -4.188763618469238, -3.8480656147003174, -3.5073673725128174, -3.1666693687438965, -2.8259711265563965, -2.4852728843688965, -2.1445746421813965, -1.803876519203186, -1.4631783962249756, -1.1224801540374756, -0.7817819118499756, -0.4410839080810547, -0.10038566589355469, 0.2403116226196289, 0.5810098052024841, 0.9217079877853394, 1.2624061107635498, 1.6031043529510498, 1.9438025951385498, 2.2845005989074707, 2.6251988410949707, 2.9658970832824707, 3.3065953254699707, 3.6472935676574707, 3.9879915714263916, 4.3286895751953125, 4.6693878173828125, 5.0100860595703125, 5.3507843017578125, 5.6914825439453125, 6.0321807861328125, 6.3728790283203125, 6.7135772705078125, 7.0542755126953125, 7.3949737548828125, 7.735671520233154, 8.076370239257812, 8.417068481445312, 8.757766723632812, 9.098464965820312, 9.439163208007812, 9.779861450195312, 10.120559692382812, 10.461257934570312, 10.801956176757812, 11.142653465270996]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 6.0, 10.0, 8.0, 13.0, 8.0, 5.0, 18.0, 13.0, 22.0, 25.0, 37.0, 39.0, 50.0, 94.0, 265.0, 92.0, 56.0, 35.0, 22.0, 28.0, 32.0, 21.0, 18.0, 15.0, 16.0, 9.0, 7.0, 9.0, 12.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7928237915039062, -0.7667999267578125, -0.7407760620117188, -0.714752197265625, -0.6887283325195312, -0.6627044677734375, -0.6366806030273438, -0.61065673828125, -0.5846328735351562, -0.5586090087890625, -0.5325851440429688, -0.506561279296875, -0.48053741455078125, -0.4545135498046875, -0.42848968505859375, -0.4024658203125, -0.37644195556640625, -0.3504180908203125, -0.32439422607421875, -0.298370361328125, -0.27234649658203125, -0.2463226318359375, -0.22029876708984375, -0.19427490234375, -0.16825103759765625, -0.1422271728515625, -0.11620330810546875, -0.090179443359375, -0.06415557861328125, -0.0381317138671875, -0.01210784912109375, 0.013916015625, 0.03993988037109375, 0.0659637451171875, 0.09198760986328125, 0.118011474609375, 0.14403533935546875, 0.1700592041015625, 0.19608306884765625, 0.22210693359375, 0.24813079833984375, 0.2741546630859375, 0.30017852783203125, 0.326202392578125, 0.35222625732421875, 0.3782501220703125, 0.40427398681640625, 0.4302978515625, 0.45632171630859375, 0.4823455810546875, 0.5083694458007812, 0.534393310546875, 0.5604171752929688, 0.5864410400390625, 0.6124649047851562, 0.63848876953125, 0.6645126342773438, 0.6905364990234375, 0.7165603637695312, 0.742584228515625, 0.7686080932617188, 0.7946319580078125, 0.8206558227539062, 0.8466796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 8.0, 8.0, 12.0, 8.0, 14.0, 18.0, 37.0, 65.0, 141.0, 373.0, 1599.0, 18244.0, 8360083.0, 6565.0, 900.0, 234.0, 117.0, 51.0, 29.0, 14.0, 20.0, 8.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-11.275091171264648, -10.890626907348633, -10.5061616897583, -10.121697425842285, -9.737232208251953, -9.352767944335938, -8.968303680419922, -8.58383846282959, -8.199374198913574, -7.8149094581604, -7.430444717407227, -7.045980453491211, -6.661515712738037, -6.277050971984863, -5.8925862312316895, -5.508121490478516, -5.123656749725342, -4.739192008972168, -4.354727268218994, -3.9702627658843994, -3.5857982635498047, -3.201333522796631, -2.816868782043457, -2.4324042797088623, -2.0479395389556885, -1.6634749174118042, -1.27901029586792, -0.8945455551147461, -0.5100809335708618, -0.12561631202697754, 0.2588484287261963, 0.643312931060791, 1.0277776718139648, 1.4122422933578491, 1.7967069149017334, 2.1811716556549072, 2.565636157989502, 2.950100898742676, 3.3345656394958496, 3.7190301418304443, 4.103494644165039, 4.487959384918213, 4.872424125671387, 5.256888389587402, 5.641353130340576, 6.02581787109375, 6.410282611846924, 6.794747352600098, 7.1792120933532715, 7.563676834106445, 7.948141574859619, 8.332606315612793, 8.717070579528809, 9.10153579711914, 9.486000061035156, 9.870464324951172, 10.254929542541504, 10.63939380645752, 11.023859024047852, 11.408323287963867, 11.7927885055542, 12.177252769470215, 12.561717987060547, 12.946182250976562, 13.330646514892578]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 5.0, 5.0, 1.0, 6.0, 7.0, 2.0, 8.0, 3.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.4850492477417, -8.188342094421387, -7.891635417938232, -7.594928741455078, -7.298221588134766, -7.001514911651611, -6.704808235168457, -6.4081010818481445, -6.11139440536499, -5.814687728881836, -5.517980575561523, -5.221273899078369, -4.924567222595215, -4.627860069274902, -4.331153392791748, -4.034446716308594, -3.7377395629882812, -3.441032648086548, -3.1443257331848145, -2.84761905670166, -2.5509121417999268, -2.2542052268981934, -1.9574984312057495, -1.6607916355133057, -1.3640847206115723, -1.0673778057098389, -0.770671010017395, -0.4739641547203064, -0.17725729942321777, 0.11944961547851562, 0.4161564111709595, 0.7128632068634033, 1.0095701217651367, 1.3062770366668701, 1.602983832359314, 1.8996906280517578, 2.196397542953491, 2.4931044578552246, 2.789811134338379, 3.0865180492401123, 3.3832249641418457, 3.679931879043579, 3.9766387939453125, 4.273345470428467, 4.570052146911621, 4.866759300231934, 5.163465976715088, 5.460172653198242, 5.756879806518555, 6.053586483001709, 6.3502936363220215, 6.647000312805176, 6.943707466125488, 7.240414142608643, 7.537120819091797, 7.833827972412109, 8.130535125732422, 8.427242279052734, 8.72394847869873, 9.020655632019043, 9.317362785339355, 9.614068984985352, 9.910776138305664, 10.207483291625977, 10.504189491271973]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 7.0, 15.0, 21.0, 30.0, 29.0, 54.0, 96.0, 141.0, 249.0, 514.0, 1446.0, 4823.0, 16533.0, 65241.0, 226302.0, 155829.0, 38390.0, 9853.0, 2838.0, 906.0, 386.0, 192.0, 132.0, 64.0, 54.0, 35.0, 25.0, 16.0, 6.0, 7.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.078125, -8.84423828125, -8.6103515625, -8.37646484375, -8.142578125, -7.90869140625, -7.6748046875, -7.44091796875, -7.20703125, -6.97314453125, -6.7392578125, -6.50537109375, -6.271484375, -6.03759765625, -5.8037109375, -5.56982421875, -5.3359375, -5.10205078125, -4.8681640625, -4.63427734375, -4.400390625, -4.16650390625, -3.9326171875, -3.69873046875, -3.46484375, -3.23095703125, -2.9970703125, -2.76318359375, -2.529296875, -2.29541015625, -2.0615234375, -1.82763671875, -1.59375, -1.35986328125, -1.1259765625, -0.89208984375, -0.658203125, -0.42431640625, -0.1904296875, 0.04345703125, 0.27734375, 0.51123046875, 0.7451171875, 0.97900390625, 1.212890625, 1.44677734375, 1.6806640625, 1.91455078125, 2.1484375, 2.38232421875, 2.6162109375, 2.85009765625, 3.083984375, 3.31787109375, 3.5517578125, 3.78564453125, 4.01953125, 4.25341796875, 4.4873046875, 4.72119140625, 4.955078125, 5.18896484375, 5.4228515625, 5.65673828125, 5.890625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 6.0, 17.0, 15.0, 21.0, 36.0, 53.0, 72.0, 70.0, 117.0, 109.0, 125.0, 92.0, 92.0, 50.0, 42.0, 37.0, 15.0, 7.0, 12.0, 3.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.224609375, -2.1771011352539062, -2.1295928955078125, -2.0820846557617188, -2.034576416015625, -1.9870681762695312, -1.9395599365234375, -1.8920516967773438, -1.84454345703125, -1.7970352172851562, -1.7495269775390625, -1.7020187377929688, -1.654510498046875, -1.6070022583007812, -1.5594940185546875, -1.5119857788085938, -1.4644775390625, -1.4169692993164062, -1.3694610595703125, -1.3219528198242188, -1.274444580078125, -1.2269363403320312, -1.1794281005859375, -1.1319198608398438, -1.08441162109375, -1.0369033813476562, -0.9893951416015625, -0.9418869018554688, -0.894378662109375, -0.8468704223632812, -0.7993621826171875, -0.7518539428710938, -0.704345703125, -0.6568374633789062, -0.6093292236328125, -0.5618209838867188, -0.514312744140625, -0.46680450439453125, -0.4192962646484375, -0.37178802490234375, -0.32427978515625, -0.27677154541015625, -0.2292633056640625, -0.18175506591796875, -0.134246826171875, -0.08673858642578125, -0.0392303466796875, 0.00827789306640625, 0.0557861328125, 0.10329437255859375, 0.1508026123046875, 0.19831085205078125, 0.245819091796875, 0.29332733154296875, 0.3408355712890625, 0.38834381103515625, 0.43585205078125, 0.48336029052734375, 0.5308685302734375, 0.5783767700195312, 0.625885009765625, 0.6733932495117188, 0.7209014892578125, 0.7684097290039062, 0.81591796875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 9.0, 10.0, 7.0, 18.0, 49.0, 86.0, 124.0, 103.0, 45.0, 11.0, 8.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.007118225097656, -7.69016170501709, -7.373204708099365, -7.056247711181641, -6.739291191101074, -6.422334671020508, -6.105377674102783, -5.788420677185059, -5.471464157104492, -5.154507637023926, -4.837550640106201, -4.520593643188477, -4.20363712310791, -3.8866803646087646, -3.569723606109619, -3.2527668476104736, -2.935810089111328, -2.6188533306121826, -2.301896572113037, -1.9849398136138916, -1.667983055114746, -1.3510262966156006, -1.034069538116455, -0.7171127796173096, -0.40015602111816406, -0.08319926261901855, 0.23375749588012695, 0.5507142543792725, 0.867671012878418, 1.1846277713775635, 1.501584529876709, 1.8185412883758545, 2.1354970932006836, 2.452453851699829, 2.7694106101989746, 3.08636736869812, 3.4033241271972656, 3.720280885696411, 4.037237644195557, 4.354194641113281, 4.671151161193848, 4.988107681274414, 5.305064678192139, 5.622021675109863, 5.93897819519043, 6.255934715270996, 6.572891712188721, 6.889848709106445, 7.206805229187012, 7.523761749267578, 7.840718746185303, 8.157675743103027, 8.474632263183594, 8.79158878326416, 9.108545303344727, 9.42550277709961, 9.742459297180176, 10.059415817260742, 10.376373291015625, 10.693329811096191, 11.010286331176758, 11.327242851257324, 11.64419937133789, 11.961156845092773, 12.27811336517334]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 8.0, 11.0, 13.0, 25.0, 67.0, 123.0, 136.0, 53.0, 11.0, 9.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.562443733215332, -12.272331237792969, -11.982219696044922, -11.692107200622559, -11.401995658874512, -11.111883163452148, -10.821771621704102, -10.531659126281738, -10.241546630859375, -9.951434135437012, -9.661322593688965, -9.371210098266602, -9.081098556518555, -8.790986061096191, -8.500873565673828, -8.210762023925781, -7.920650005340576, -7.630537986755371, -7.340425968170166, -7.050313949584961, -6.760201454162598, -6.470089435577393, -6.1799774169921875, -5.889864921569824, -5.599753379821777, -5.309641361236572, -5.019529342651367, -4.729416847229004, -4.439304828643799, -4.149192810058594, -3.8590807914733887, -3.5689685344696045, -3.2788567543029785, -2.9887447357177734, -2.6986324787139893, -2.408520460128784, -2.118408203125, -1.828296184539795, -1.5381841659545898, -1.2480719089508057, -0.9579598903656006, -0.667847752571106, -0.3777356743812561, -0.08762359619140625, 0.20248854160308838, 0.492600679397583, 0.7827126979827881, 1.0728249549865723, 1.3629369735717773, 1.653049111366272, 1.9431612491607666, 2.2332732677459717, 2.523385524749756, 2.813497543334961, 3.103609561920166, 3.39372181892395, 3.6838338375091553, 3.9739458560943604, 4.2640581130981445, 4.55417013168335, 4.844282150268555, 5.134394645690918, 5.424506187438965, 5.714618682861328, 6.004730701446533]}, "eval/loss": 4.330733299255371, "eval/wer": 1.92959143197144, "eval/runtime": 943.0842, "eval/samples_per_second": 2.801, "eval/steps_per_second": 0.351} \ No newline at end of file +{"train/loss": 3.4805, "train/learning_rate": 3.1152647975077885e-07, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 8506, "_timestamp": 1646163402, "_step": 1787, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 17.0, 19.0, 52.0, 108.0, 280.0, 250.0, 111.0, 44.0, 41.0, 26.0, 16.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.1670684814453, -248.654052734375, -243.14105224609375, -237.62803649902344, -232.1150360107422, -226.60202026367188, -221.08901977539062, -215.5760040283203, -210.06298828125, -204.5499725341797, -199.03697204589844, -193.52395629882812, -188.01095581054688, -182.49794006347656, -176.98492431640625, -171.471923828125, -165.95892333984375, -160.44590759277344, -154.9329071044922, -149.41989135742188, -143.90689086914062, -138.3938751220703, -132.880859375, -127.36785888671875, -121.85485076904297, -116.34184265136719, -110.8288345336914, -105.31582641601562, -99.80281066894531, -94.28981018066406, -88.77679443359375, -83.26378631591797, -77.75078582763672, -72.23777770996094, -66.72476959228516, -61.21175765991211, -55.69874954223633, -50.18574142456055, -44.6727294921875, -39.15972137451172, -33.64671325683594, -28.133705139160156, -22.620695114135742, -17.107685089111328, -11.594676971435547, -6.081668853759766, -0.5686569213867188, 4.9443511962890625, 10.457359313964844, 15.970368385314941, 21.48337745666504, 26.996387481689453, 32.509395599365234, 38.022403717041016, 43.53541564941406, 49.048423767089844, 54.561431884765625, 60.074440002441406, 65.58744812011719, 71.1004638671875, 76.61346435546875, 82.12648010253906, 87.63948822021484, 93.15249633789062, 98.6655044555664]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 6.0, 3.0, 9.0, 11.0, 8.0, 13.0, 8.0, 13.0, 12.0, 23.0, 17.0, 23.0, 24.0, 26.0, 21.0, 23.0, 43.0, 67.0, 77.0, 103.0, 92.0, 79.0, 66.0, 38.0, 29.0, 19.0, 15.0, 20.0, 20.0, 13.0, 11.0, 11.0, 10.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-328.735595703125, -319.05816650390625, -309.3807373046875, -299.70330810546875, -290.02587890625, -280.34844970703125, -270.6710205078125, -260.9935607910156, -251.31613159179688, -241.63870239257812, -231.96127319335938, -222.28384399414062, -212.6063995361328, -202.92897033691406, -193.2515411376953, -183.5740966796875, -173.8966827392578, -164.21925354003906, -154.5418243408203, -144.8643798828125, -135.18695068359375, -125.509521484375, -115.83209228515625, -106.15465545654297, -96.47722625732422, -86.79979705810547, -77.12236022949219, -67.44493103027344, -57.76749801635742, -48.090065002441406, -38.412635803222656, -28.735198974609375, -19.057769775390625, -9.380337715148926, 0.29709434509277344, 9.974525451660156, 19.651958465576172, 29.329391479492188, 39.00682067871094, 48.68425750732422, 58.36168670654297, 68.03911590576172, 77.716552734375, 87.39398193359375, 97.0714111328125, 106.74884796142578, 116.42627716064453, 126.10371398925781, 135.78114318847656, 145.4585723876953, 155.13600158691406, 164.81344604492188, 174.49087524414062, 184.16830444335938, 193.84573364257812, 203.52316284179688, 213.20059204101562, 222.87802124023438, 232.55545043945312, 242.23287963867188, 251.9103240966797, 261.5877685546875, 271.26519775390625, 280.942626953125, 290.62005615234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 12.0, 11.0, 11.0, 8.0, 17.0, 19.0, 18.0, 19.0, 30.0, 16.0, 30.0, 29.0, 35.0, 72.0, 65.0, 79.0, 86.0, 75.0, 73.0, 55.0, 36.0, 33.0, 18.0, 19.0, 20.0, 18.0, 14.0, 10.0, 6.0, 11.0, 10.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.234375, -9.9219970703125, -9.609619140625, -9.2972412109375, -8.98486328125, -8.6724853515625, -8.360107421875, -8.0477294921875, -7.7353515625, -7.4229736328125, -7.110595703125, -6.7982177734375, -6.48583984375, -6.1734619140625, -5.861083984375, -5.5487060546875, -5.236328125, -4.9239501953125, -4.611572265625, -4.2991943359375, -3.98681640625, -3.6744384765625, -3.362060546875, -3.0496826171875, -2.7373046875, -2.4249267578125, -2.112548828125, -1.8001708984375, -1.48779296875, -1.1754150390625, -0.863037109375, -0.5506591796875, -0.23828125, 0.0740966796875, 0.386474609375, 0.6988525390625, 1.01123046875, 1.3236083984375, 1.635986328125, 1.9483642578125, 2.2607421875, 2.5731201171875, 2.885498046875, 3.1978759765625, 3.51025390625, 3.8226318359375, 4.135009765625, 4.4473876953125, 4.759765625, 5.0721435546875, 5.384521484375, 5.6968994140625, 6.00927734375, 6.3216552734375, 6.634033203125, 6.9464111328125, 7.2587890625, 7.5711669921875, 7.883544921875, 8.1959228515625, 8.50830078125, 8.8206787109375, 9.133056640625, 9.4454345703125, 9.7578125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 8.0, 7.0, 11.0, 15.0, 17.0, 28.0, 26.0, 45.0, 56.0, 58.0, 123.0, 160.0, 206.0, 339.0, 539.0, 915.0, 1751.0, 3869.0, 9968.0, 40686.0, 3829855.0, 278658.0, 16287.0, 5380.0, 2248.0, 1170.0, 611.0, 389.0, 238.0, 173.0, 111.0, 90.0, 63.0, 41.0, 33.0, 29.0, 13.0, 14.0, 14.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-73.9375, -71.6787109375, -69.419921875, -67.1611328125, -64.90234375, -62.6435546875, -60.384765625, -58.1259765625, -55.8671875, -53.6083984375, -51.349609375, -49.0908203125, -46.83203125, -44.5732421875, -42.314453125, -40.0556640625, -37.796875, -35.5380859375, -33.279296875, -31.0205078125, -28.76171875, -26.5029296875, -24.244140625, -21.9853515625, -19.7265625, -17.4677734375, -15.208984375, -12.9501953125, -10.69140625, -8.4326171875, -6.173828125, -3.9150390625, -1.65625, 0.6025390625, 2.861328125, 5.1201171875, 7.37890625, 9.6376953125, 11.896484375, 14.1552734375, 16.4140625, 18.6728515625, 20.931640625, 23.1904296875, 25.44921875, 27.7080078125, 29.966796875, 32.2255859375, 34.484375, 36.7431640625, 39.001953125, 41.2607421875, 43.51953125, 45.7783203125, 48.037109375, 50.2958984375, 52.5546875, 54.8134765625, 57.072265625, 59.3310546875, 61.58984375, 63.8486328125, 66.107421875, 68.3662109375, 70.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 11.0, 9.0, 13.0, 16.0, 20.0, 27.0, 32.0, 38.0, 65.0, 83.0, 129.0, 271.0, 571.0, 910.0, 781.0, 413.0, 233.0, 125.0, 82.0, 50.0, 38.0, 30.0, 21.0, 19.0, 10.0, 9.0, 13.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.8125, -38.70068359375, -37.5888671875, -36.47705078125, -35.365234375, -34.25341796875, -33.1416015625, -32.02978515625, -30.91796875, -29.80615234375, -28.6943359375, -27.58251953125, -26.470703125, -25.35888671875, -24.2470703125, -23.13525390625, -22.0234375, -20.91162109375, -19.7998046875, -18.68798828125, -17.576171875, -16.46435546875, -15.3525390625, -14.24072265625, -13.12890625, -12.01708984375, -10.9052734375, -9.79345703125, -8.681640625, -7.56982421875, -6.4580078125, -5.34619140625, -4.234375, -3.12255859375, -2.0107421875, -0.89892578125, 0.212890625, 1.32470703125, 2.4365234375, 3.54833984375, 4.66015625, 5.77197265625, 6.8837890625, 7.99560546875, 9.107421875, 10.21923828125, 11.3310546875, 12.44287109375, 13.5546875, 14.66650390625, 15.7783203125, 16.89013671875, 18.001953125, 19.11376953125, 20.2255859375, 21.33740234375, 22.44921875, 23.56103515625, 24.6728515625, 25.78466796875, 26.896484375, 28.00830078125, 29.1201171875, 30.23193359375, 31.34375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 18.0, 15.0, 21.0, 29.0, 42.0, 41.0, 63.0, 83.0, 113.0, 168.0, 251.0, 484.0, 1171.0, 5046.0, 40401.0, 3845028.0, 283300.0, 13704.0, 2394.0, 745.0, 391.0, 188.0, 138.0, 86.0, 79.0, 55.0, 38.0, 36.0, 26.0, 20.0, 14.0, 15.0, 11.0, 13.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.4375, -106.9609375, -103.484375, -100.0078125, -96.53125, -93.0546875, -89.578125, -86.1015625, -82.625, -79.1484375, -75.671875, -72.1953125, -68.71875, -65.2421875, -61.765625, -58.2890625, -54.8125, -51.3359375, -47.859375, -44.3828125, -40.90625, -37.4296875, -33.953125, -30.4765625, -27.0, -23.5234375, -20.046875, -16.5703125, -13.09375, -9.6171875, -6.140625, -2.6640625, 0.8125, 4.2890625, 7.765625, 11.2421875, 14.71875, 18.1953125, 21.671875, 25.1484375, 28.625, 32.1015625, 35.578125, 39.0546875, 42.53125, 46.0078125, 49.484375, 52.9609375, 56.4375, 59.9140625, 63.390625, 66.8671875, 70.34375, 73.8203125, 77.296875, 80.7734375, 84.25, 87.7265625, 91.203125, 94.6796875, 98.15625, 101.6328125, 105.109375, 108.5859375, 112.0625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 5.0, 12.0, 8.0, 11.0, 11.0, 27.0, 35.0, 58.0, 88.0, 100.0, 134.0, 157.0, 120.0, 83.0, 48.0, 30.0, 25.0, 22.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.20794677734375, -48.859764099121094, -46.51158142089844, -44.16339874267578, -41.815216064453125, -39.46703338623047, -37.11885070800781, -34.770668029785156, -32.4224853515625, -30.074302673339844, -27.726119995117188, -25.37793731689453, -23.029754638671875, -20.68157196044922, -18.333389282226562, -15.985206604003906, -13.63702392578125, -11.288841247558594, -8.940658569335938, -6.592475891113281, -4.244293212890625, -1.8961105346679688, 0.4520721435546875, 2.8002548217773438, 5.1484375, 7.496620178222656, 9.844802856445312, 12.192985534667969, 14.541168212890625, 16.88935089111328, 19.237533569335938, 21.585716247558594, 23.93390655517578, 26.282089233398438, 28.630271911621094, 30.97845458984375, 33.326637268066406, 35.67481994628906, 38.02300262451172, 40.371185302734375, 42.71936798095703, 45.06755065917969, 47.415733337402344, 49.763916015625, 52.112098693847656, 54.46028137207031, 56.80846405029297, 59.156646728515625, 61.50482940673828, 63.85301208496094, 66.2011947631836, 68.54937744140625, 70.8975601196289, 73.24574279785156, 75.59392547607422, 77.94210815429688, 80.29029083251953, 82.63847351074219, 84.98665618896484, 87.3348388671875, 89.68302154541016, 92.03120422363281, 94.37938690185547, 96.72756958007812, 99.07575225830078]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 6.0, 2.0, 8.0, 5.0, 10.0, 9.0, 9.0, 12.0, 19.0, 23.0, 22.0, 25.0, 28.0, 28.0, 26.0, 35.0, 34.0, 35.0, 29.0, 35.0, 33.0, 40.0, 47.0, 40.0, 39.0, 31.0, 37.0, 35.0, 33.0, 33.0, 33.0, 24.0, 27.0, 24.0, 23.0, 15.0, 17.0, 17.0, 9.0, 6.0, 5.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-96.27719116210938, -93.53274536132812, -90.78829956054688, -88.04385375976562, -85.29940795898438, -82.55496215820312, -79.81051635742188, -77.06607055664062, -74.32162475585938, -71.57717895507812, -68.83273315429688, -66.08828735351562, -63.343841552734375, -60.599395751953125, -57.85495376586914, -55.11050796508789, -52.366065979003906, -49.621620178222656, -46.877174377441406, -44.132728576660156, -41.388282775878906, -38.643836975097656, -35.89939498901367, -33.15494918823242, -30.410503387451172, -27.666057586669922, -24.921611785888672, -22.177167892456055, -19.432722091674805, -16.688276290893555, -13.943832397460938, -11.199386596679688, -8.454940795898438, -5.710495471954346, -2.966050148010254, -0.2216053009033203, 2.5228404998779297, 5.26728630065918, 8.011730194091797, 10.756175994873047, 13.500621795654297, 16.245067596435547, 18.989513397216797, 21.733957290649414, 24.478403091430664, 27.222848892211914, 29.96729278564453, 32.71173858642578, 35.45618438720703, 38.20063018798828, 40.94507598876953, 43.68952178955078, 46.43396759033203, 49.17841339111328, 51.922855377197266, 54.667301177978516, 57.411746978759766, 60.156192779541016, 62.900638580322266, 65.64508056640625, 68.3895263671875, 71.13397216796875, 73.87841796875, 76.62286376953125, 79.3673095703125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 10.0, 20.0, 15.0, 18.0, 16.0, 26.0, 24.0, 27.0, 37.0, 44.0, 49.0, 54.0, 84.0, 64.0, 72.0, 65.0, 67.0, 59.0, 31.0, 34.0, 14.0, 16.0, 13.0, 18.0, 17.0, 14.0, 6.0, 5.0, 0.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-10.2734375, -9.971923828125, -9.67041015625, -9.368896484375, -9.0673828125, -8.765869140625, -8.46435546875, -8.162841796875, -7.861328125, -7.559814453125, -7.25830078125, -6.956787109375, -6.6552734375, -6.353759765625, -6.05224609375, -5.750732421875, -5.44921875, -5.147705078125, -4.84619140625, -4.544677734375, -4.2431640625, -3.941650390625, -3.64013671875, -3.338623046875, -3.037109375, -2.735595703125, -2.43408203125, -2.132568359375, -1.8310546875, -1.529541015625, -1.22802734375, -0.926513671875, -0.625, -0.323486328125, -0.02197265625, 0.279541015625, 0.5810546875, 0.882568359375, 1.18408203125, 1.485595703125, 1.787109375, 2.088623046875, 2.39013671875, 2.691650390625, 2.9931640625, 3.294677734375, 3.59619140625, 3.897705078125, 4.19921875, 4.500732421875, 4.80224609375, 5.103759765625, 5.4052734375, 5.706787109375, 6.00830078125, 6.309814453125, 6.611328125, 6.912841796875, 7.21435546875, 7.515869140625, 7.8173828125, 8.118896484375, 8.42041015625, 8.721923828125, 9.0234375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 18.0, 16.0, 26.0, 38.0, 44.0, 60.0, 84.0, 124.0, 188.0, 239.0, 340.0, 540.0, 723.0, 1042.0, 1484.0, 2157.0, 3172.0, 4801.0, 7321.0, 11238.0, 18346.0, 31834.0, 60447.0, 130418.0, 262386.0, 252306.0, 120841.0, 57405.0, 30192.0, 17940.0, 11047.0, 7083.0, 4607.0, 3076.0, 2217.0, 1391.0, 947.0, 732.0, 483.0, 326.0, 251.0, 174.0, 134.0, 95.0, 62.0, 45.0, 34.0, 19.0, 19.0, 15.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.185546875, -1.1484527587890625, -1.111358642578125, -1.0742645263671875, -1.03717041015625, -1.0000762939453125, -0.962982177734375, -0.9258880615234375, -0.8887939453125, -0.8516998291015625, -0.814605712890625, -0.7775115966796875, -0.74041748046875, -0.7033233642578125, -0.666229248046875, -0.6291351318359375, -0.592041015625, -0.5549468994140625, -0.517852783203125, -0.4807586669921875, -0.44366455078125, -0.4065704345703125, -0.369476318359375, -0.3323822021484375, -0.2952880859375, -0.2581939697265625, -0.221099853515625, -0.1840057373046875, -0.14691162109375, -0.1098175048828125, -0.072723388671875, -0.0356292724609375, 0.00146484375, 0.0385589599609375, 0.075653076171875, 0.1127471923828125, 0.14984130859375, 0.1869354248046875, 0.224029541015625, 0.2611236572265625, 0.2982177734375, 0.3353118896484375, 0.372406005859375, 0.4095001220703125, 0.44659423828125, 0.4836883544921875, 0.520782470703125, 0.5578765869140625, 0.594970703125, 0.6320648193359375, 0.669158935546875, 0.7062530517578125, 0.74334716796875, 0.7804412841796875, 0.817535400390625, 0.8546295166015625, 0.8917236328125, 0.9288177490234375, 0.965911865234375, 1.0030059814453125, 1.04010009765625, 1.0771942138671875, 1.114288330078125, 1.1513824462890625, 1.1884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 12.0, 11.0, 10.0, 15.0, 15.0, 16.0, 22.0, 28.0, 26.0, 29.0, 29.0, 35.0, 30.0, 36.0, 45.0, 40.0, 38.0, 40.0, 1071.0, 34.0, 32.0, 39.0, 25.0, 42.0, 26.0, 24.0, 32.0, 29.0, 28.0, 19.0, 25.0, 23.0, 13.0, 15.0, 12.0, 8.0, 12.0, 5.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.56640625, -4.422607421875, -4.27880859375, -4.135009765625, -3.9912109375, -3.847412109375, -3.70361328125, -3.559814453125, -3.416015625, -3.272216796875, -3.12841796875, -2.984619140625, -2.8408203125, -2.697021484375, -2.55322265625, -2.409423828125, -2.265625, -2.121826171875, -1.97802734375, -1.834228515625, -1.6904296875, -1.546630859375, -1.40283203125, -1.259033203125, -1.115234375, -0.971435546875, -0.82763671875, -0.683837890625, -0.5400390625, -0.396240234375, -0.25244140625, -0.108642578125, 0.03515625, 0.178955078125, 0.32275390625, 0.466552734375, 0.6103515625, 0.754150390625, 0.89794921875, 1.041748046875, 1.185546875, 1.329345703125, 1.47314453125, 1.616943359375, 1.7607421875, 1.904541015625, 2.04833984375, 2.192138671875, 2.3359375, 2.479736328125, 2.62353515625, 2.767333984375, 2.9111328125, 3.054931640625, 3.19873046875, 3.342529296875, 3.486328125, 3.630126953125, 3.77392578125, 3.917724609375, 4.0615234375, 4.205322265625, 4.34912109375, 4.492919921875, 4.63671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 7.0, 8.0, 24.0, 30.0, 45.0, 79.0, 81.0, 120.0, 170.0, 240.0, 363.0, 568.0, 816.0, 1206.0, 1775.0, 2704.0, 4202.0, 6254.0, 10045.0, 15284.0, 24306.0, 39418.0, 65242.0, 108011.0, 172210.0, 1251262.0, 150025.0, 93137.0, 55945.0, 34130.0, 21241.0, 13224.0, 8507.0, 5678.0, 3608.0, 2371.0, 1565.0, 1042.0, 684.0, 459.0, 355.0, 211.0, 128.0, 115.0, 70.0, 46.0, 35.0, 24.0, 18.0, 16.0, 11.0, 5.0, 8.0, 0.0, 1.0, 3.0], "bins": [-0.6181640625, -0.5996246337890625, -0.581085205078125, -0.5625457763671875, -0.54400634765625, -0.5254669189453125, -0.506927490234375, -0.4883880615234375, -0.4698486328125, -0.4513092041015625, -0.432769775390625, -0.4142303466796875, -0.39569091796875, -0.3771514892578125, -0.358612060546875, -0.3400726318359375, -0.321533203125, -0.3029937744140625, -0.284454345703125, -0.2659149169921875, -0.24737548828125, -0.2288360595703125, -0.210296630859375, -0.1917572021484375, -0.1732177734375, -0.1546783447265625, -0.136138916015625, -0.1175994873046875, -0.09906005859375, -0.0805206298828125, -0.061981201171875, -0.0434417724609375, -0.02490234375, -0.0063629150390625, 0.012176513671875, 0.0307159423828125, 0.04925537109375, 0.0677947998046875, 0.086334228515625, 0.1048736572265625, 0.1234130859375, 0.1419525146484375, 0.160491943359375, 0.1790313720703125, 0.19757080078125, 0.2161102294921875, 0.234649658203125, 0.2531890869140625, 0.271728515625, 0.2902679443359375, 0.308807373046875, 0.3273468017578125, 0.34588623046875, 0.3644256591796875, 0.382965087890625, 0.4015045166015625, 0.4200439453125, 0.4385833740234375, 0.457122802734375, 0.4756622314453125, 0.49420166015625, 0.5127410888671875, 0.531280517578125, 0.5498199462890625, 0.568359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 11.0, 16.0, 15.0, 15.0, 27.0, 44.0, 41.0, 57.0, 70.0, 80.0, 87.0, 71.0, 73.0, 69.0, 58.0, 45.0, 39.0, 28.0, 28.0, 21.0, 19.0, 15.0, 9.0, 10.0, 4.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0063323974609375, -0.0061487555503845215, -0.005965113639831543, -0.0057814717292785645, -0.005597829818725586, -0.005414187908172607, -0.005230545997619629, -0.00504690408706665, -0.004863262176513672, -0.004679620265960693, -0.004495978355407715, -0.004312336444854736, -0.004128694534301758, -0.003945052623748779, -0.0037614107131958008, -0.0035777688026428223, -0.0033941268920898438, -0.0032104849815368652, -0.0030268430709838867, -0.002843201160430908, -0.0026595592498779297, -0.002475917339324951, -0.0022922754287719727, -0.002108633518218994, -0.0019249916076660156, -0.0017413496971130371, -0.0015577077865600586, -0.00137406587600708, -0.0011904239654541016, -0.001006782054901123, -0.0008231401443481445, -0.000639498233795166, -0.0004558563232421875, -0.000272214412689209, -8.857250213623047e-05, 9.506940841674805e-05, 0.00027871131896972656, 0.0004623532295227051, 0.0006459951400756836, 0.0008296370506286621, 0.0010132789611816406, 0.0011969208717346191, 0.0013805627822875977, 0.0015642046928405762, 0.0017478466033935547, 0.0019314885139465332, 0.0021151304244995117, 0.0022987723350524902, 0.0024824142456054688, 0.0026660561561584473, 0.0028496980667114258, 0.0030333399772644043, 0.003216981887817383, 0.0034006237983703613, 0.00358426570892334, 0.0037679076194763184, 0.003951549530029297, 0.004135191440582275, 0.004318833351135254, 0.004502475261688232, 0.004686117172241211, 0.0048697590827941895, 0.005053400993347168, 0.0052370429039001465, 0.005420684814453125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 8.0, 5.0, 3.0, 10.0, 12.0, 15.0, 25.0, 19.0, 35.0, 43.0, 42.0, 83.0, 111.0, 112.0, 205.0, 284.0, 534.0, 1481.0, 1022864.0, 20674.0, 798.0, 323.0, 225.0, 154.0, 110.0, 88.0, 68.0, 44.0, 41.0, 29.0, 28.0, 19.0, 9.0, 4.0, 8.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10167598724365234, -0.09837150573730469, -0.09506702423095703, -0.09176254272460938, -0.08845806121826172, -0.08515357971191406, -0.0818490982055664, -0.07854461669921875, -0.0752401351928711, -0.07193565368652344, -0.06863117218017578, -0.06532669067382812, -0.06202220916748047, -0.05871772766113281, -0.055413246154785156, -0.0521087646484375, -0.048804283142089844, -0.04549980163574219, -0.04219532012939453, -0.038890838623046875, -0.03558635711669922, -0.03228187561035156, -0.028977394104003906, -0.02567291259765625, -0.022368431091308594, -0.019063949584960938, -0.01575946807861328, -0.012454986572265625, -0.009150505065917969, -0.0058460235595703125, -0.0025415420532226562, 0.000762939453125, 0.004067420959472656, 0.0073719024658203125, 0.010676383972167969, 0.013980865478515625, 0.01728534698486328, 0.020589828491210938, 0.023894309997558594, 0.02719879150390625, 0.030503273010253906, 0.03380775451660156, 0.03711223602294922, 0.040416717529296875, 0.04372119903564453, 0.04702568054199219, 0.050330162048339844, 0.0536346435546875, 0.056939125061035156, 0.06024360656738281, 0.06354808807373047, 0.06685256958007812, 0.07015705108642578, 0.07346153259277344, 0.0767660140991211, 0.08007049560546875, 0.0833749771118164, 0.08667945861816406, 0.08998394012451172, 0.09328842163085938, 0.09659290313720703, 0.09989738464355469, 0.10320186614990234, 0.10650634765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 33.0, 981.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06518911570310593, -0.0632871463894844, -0.061385173350572586, -0.05948320031166077, -0.05758122727274895, -0.05567925423383713, -0.05377728492021561, -0.05187531188130379, -0.04997333884239197, -0.04807136580348015, -0.04616939648985863, -0.04426742345094681, -0.04236545041203499, -0.04046347737312317, -0.03856150805950165, -0.03665953502058983, -0.03475756198167801, -0.03285558894276619, -0.03095361776649952, -0.02905164659023285, -0.02714967355132103, -0.02524770237505436, -0.02334573119878769, -0.02144375815987587, -0.01954178884625435, -0.01763981766998768, -0.01573784463107586, -0.013835873454809189, -0.01193390041589737, -0.0100319292396307, -0.008129957132041454, -0.0062279850244522095, -0.00432601198554039, -0.002424039877951145, -0.000522068003192544, 0.0013799038715660572, 0.003281875979155302, 0.00518384762108326, 0.007085819728672504, 0.00898779183626175, 0.010889763943850994, 0.012791736051440239, 0.014693708159029484, 0.01659568026661873, 0.0184976514428854, 0.02039962261915207, 0.02230159565806389, 0.024203568696975708, 0.026105539873242378, 0.02800751104950905, 0.029909484088420868, 0.03181145712733269, 0.03371342644095421, 0.03561539947986603, 0.03751737251877785, 0.03941934555768967, 0.04132131487131119, 0.04322328791022301, 0.04512525722384453, 0.04702723026275635, 0.04892920330166817, 0.05083117634057999, 0.05273314565420151, 0.05463511869311333, 0.056537091732025146]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 7.0, 10.0, 11.0, 13.0, 20.0, 27.0, 33.0, 54.0, 44.0, 57.0, 58.0, 48.0, 77.0, 65.0, 81.0, 66.0, 59.0, 54.0, 47.0, 35.0, 25.0, 22.0, 23.0, 18.0, 10.0, 12.0, 10.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004211902618408203, -0.004020778462290764, -0.0038296543061733246, -0.0036385301500558853, -0.003447405993938446, -0.0032562818378210068, -0.0030651576817035675, -0.0028740335255861282, -0.002682909369468689, -0.0024917852133512497, -0.0023006610572338104, -0.002109536901116371, -0.0019184127449989319, -0.0017272885888814926, -0.0015361644327640533, -0.001345040276646614, -0.0011539161205291748, -0.0009627919644117355, -0.0007716678082942963, -0.000580543652176857, -0.0003894194960594177, -0.00019829533994197845, -7.1711838245391846e-06, 0.00018395297229290009, 0.00037507712841033936, 0.0005662012845277786, 0.0007573254406452179, 0.0009484495967626572, 0.0011395737528800964, 0.0013306979089975357, 0.001521822065114975, 0.0017129462212324142, 0.0019040703773498535, 0.002095194533467293, 0.002286318689584732, 0.0024774428457021713, 0.0026685670018196106, 0.00285969115793705, 0.003050815314054489, 0.0032419394701719284, 0.0034330636262893677, 0.003624187782406807, 0.003815311938524246, 0.0040064360946416855, 0.004197560250759125, 0.004388684406876564, 0.004579808562994003, 0.0047709327191114426, 0.004962056875228882, 0.005153181031346321, 0.00534430518746376, 0.0055354293435812, 0.005726553499698639, 0.005917677655816078, 0.0061088018119335175, 0.006299925968050957, 0.006491050124168396, 0.006682174280285835, 0.0068732984364032745, 0.007064422592520714, 0.007255546748638153, 0.007446670904755592, 0.007637795060873032, 0.007828919216990471, 0.00802004337310791]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 10.0, 20.0, 15.0, 18.0, 16.0, 26.0, 24.0, 27.0, 37.0, 44.0, 49.0, 54.0, 84.0, 64.0, 72.0, 65.0, 67.0, 59.0, 31.0, 34.0, 14.0, 16.0, 13.0, 18.0, 17.0, 14.0, 6.0, 5.0, 0.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-10.2734375, -9.971923828125, -9.67041015625, -9.368896484375, -9.0673828125, -8.765869140625, -8.46435546875, -8.162841796875, -7.861328125, -7.559814453125, -7.25830078125, -6.956787109375, -6.6552734375, -6.353759765625, -6.05224609375, -5.750732421875, -5.44921875, -5.147705078125, -4.84619140625, -4.544677734375, -4.2431640625, -3.941650390625, -3.64013671875, -3.338623046875, -3.037109375, -2.735595703125, -2.43408203125, -2.132568359375, -1.8310546875, -1.529541015625, -1.22802734375, -0.926513671875, -0.625, -0.323486328125, -0.02197265625, 0.279541015625, 0.5810546875, 0.882568359375, 1.18408203125, 1.485595703125, 1.787109375, 2.088623046875, 2.39013671875, 2.691650390625, 2.9931640625, 3.294677734375, 3.59619140625, 3.897705078125, 4.19921875, 4.500732421875, 4.80224609375, 5.103759765625, 5.4052734375, 5.706787109375, 6.00830078125, 6.309814453125, 6.611328125, 6.912841796875, 7.21435546875, 7.515869140625, 7.8173828125, 8.118896484375, 8.42041015625, 8.721923828125, 9.0234375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 7.0, 10.0, 13.0, 12.0, 21.0, 43.0, 57.0, 84.0, 106.0, 123.0, 151.0, 239.0, 390.0, 525.0, 715.0, 1089.0, 1541.0, 2357.0, 3712.0, 5885.0, 10908.0, 22385.0, 56508.0, 270048.0, 528212.0, 81037.0, 28779.0, 13629.0, 7365.0, 4239.0, 2621.0, 1770.0, 1249.0, 814.0, 535.0, 384.0, 273.0, 193.0, 143.0, 115.0, 72.0, 56.0, 30.0, 32.0, 23.0, 23.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-27.8125, -26.9736328125, -26.134765625, -25.2958984375, -24.45703125, -23.6181640625, -22.779296875, -21.9404296875, -21.1015625, -20.2626953125, -19.423828125, -18.5849609375, -17.74609375, -16.9072265625, -16.068359375, -15.2294921875, -14.390625, -13.5517578125, -12.712890625, -11.8740234375, -11.03515625, -10.1962890625, -9.357421875, -8.5185546875, -7.6796875, -6.8408203125, -6.001953125, -5.1630859375, -4.32421875, -3.4853515625, -2.646484375, -1.8076171875, -0.96875, -0.1298828125, 0.708984375, 1.5478515625, 2.38671875, 3.2255859375, 4.064453125, 4.9033203125, 5.7421875, 6.5810546875, 7.419921875, 8.2587890625, 9.09765625, 9.9365234375, 10.775390625, 11.6142578125, 12.453125, 13.2919921875, 14.130859375, 14.9697265625, 15.80859375, 16.6474609375, 17.486328125, 18.3251953125, 19.1640625, 20.0029296875, 20.841796875, 21.6806640625, 22.51953125, 23.3583984375, 24.197265625, 25.0361328125, 25.875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 10.0, 6.0, 9.0, 10.0, 19.0, 19.0, 16.0, 23.0, 29.0, 26.0, 34.0, 46.0, 36.0, 41.0, 64.0, 62.0, 113.0, 162.0, 1397.0, 239.0, 124.0, 85.0, 68.0, 54.0, 48.0, 36.0, 40.0, 25.0, 15.0, 30.0, 14.0, 22.0, 18.0, 13.0, 7.0, 13.0, 16.0, 10.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-25.6875, -24.880126953125, -24.07275390625, -23.265380859375, -22.4580078125, -21.650634765625, -20.84326171875, -20.035888671875, -19.228515625, -18.421142578125, -17.61376953125, -16.806396484375, -15.9990234375, -15.191650390625, -14.38427734375, -13.576904296875, -12.76953125, -11.962158203125, -11.15478515625, -10.347412109375, -9.5400390625, -8.732666015625, -7.92529296875, -7.117919921875, -6.310546875, -5.503173828125, -4.69580078125, -3.888427734375, -3.0810546875, -2.273681640625, -1.46630859375, -0.658935546875, 0.1484375, 0.955810546875, 1.76318359375, 2.570556640625, 3.3779296875, 4.185302734375, 4.99267578125, 5.800048828125, 6.607421875, 7.414794921875, 8.22216796875, 9.029541015625, 9.8369140625, 10.644287109375, 11.45166015625, 12.259033203125, 13.06640625, 13.873779296875, 14.68115234375, 15.488525390625, 16.2958984375, 17.103271484375, 17.91064453125, 18.718017578125, 19.525390625, 20.332763671875, 21.14013671875, 21.947509765625, 22.7548828125, 23.562255859375, 24.36962890625, 25.177001953125, 25.984375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 4.0, 2.0, 7.0, 8.0, 10.0, 18.0, 16.0, 11.0, 18.0, 22.0, 22.0, 26.0, 36.0, 47.0, 82.0, 140.0, 278.0, 1068.0, 16341.0, 3030881.0, 93448.0, 2232.0, 417.0, 180.0, 79.0, 66.0, 40.0, 35.0, 25.0, 22.0, 20.0, 13.0, 14.0, 18.0, 4.0, 10.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.3125, -108.767578125, -105.22265625, -101.677734375, -98.1328125, -94.587890625, -91.04296875, -87.498046875, -83.953125, -80.408203125, -76.86328125, -73.318359375, -69.7734375, -66.228515625, -62.68359375, -59.138671875, -55.59375, -52.048828125, -48.50390625, -44.958984375, -41.4140625, -37.869140625, -34.32421875, -30.779296875, -27.234375, -23.689453125, -20.14453125, -16.599609375, -13.0546875, -9.509765625, -5.96484375, -2.419921875, 1.125, 4.669921875, 8.21484375, 11.759765625, 15.3046875, 18.849609375, 22.39453125, 25.939453125, 29.484375, 33.029296875, 36.57421875, 40.119140625, 43.6640625, 47.208984375, 50.75390625, 54.298828125, 57.84375, 61.388671875, 64.93359375, 68.478515625, 72.0234375, 75.568359375, 79.11328125, 82.658203125, 86.203125, 89.748046875, 93.29296875, 96.837890625, 100.3828125, 103.927734375, 107.47265625, 111.017578125, 114.5625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 42.0, 868.0, 105.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.68983840942383, -23.963428497314453, -9.237020492553711, 5.489387512207031, 20.215797424316406, 34.942203521728516, 49.66861343383789, 64.39501953125, 79.12142944335938, 93.84783935546875, 108.57424926757812, 123.3006591796875, 138.02706909179688, 152.75347900390625, 167.47988891601562, 182.206298828125, 196.93270874023438, 211.65911865234375, 226.38552856445312, 241.1119384765625, 255.83834838867188, 270.56475830078125, 285.2911682128906, 300.017578125, 314.7439880371094, 329.47039794921875, 344.1968078613281, 358.9232177734375, 373.6496276855469, 388.37603759765625, 403.1024475097656, 417.828857421875, 432.5552673339844, 447.28167724609375, 462.0080871582031, 476.7344970703125, 491.4609069824219, 506.18731689453125, 520.9136962890625, 535.64013671875, 550.3665161132812, 565.0928955078125, 579.8193359375, 594.5457153320312, 609.2721557617188, 623.99853515625, 638.7249755859375, 653.4513549804688, 668.1777954101562, 682.9041748046875, 697.630615234375, 712.3569946289062, 727.0834350585938, 741.809814453125, 756.5362548828125, 771.2626342773438, 785.9890747070312, 800.7154541015625, 815.44189453125, 830.1682739257812, 844.8947143554688, 859.62109375, 874.3475341796875, 889.0739135742188, 903.8003540039062]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 2.0, 9.0, 11.0, 5.0, 17.0, 16.0, 18.0, 23.0, 26.0, 26.0, 33.0, 29.0, 50.0, 28.0, 34.0, 34.0, 32.0, 34.0, 43.0, 45.0, 50.0, 45.0, 40.0, 31.0, 45.0, 33.0, 28.0, 28.0, 29.0, 26.0, 20.0, 26.0, 14.0, 13.0, 12.0, 3.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-88.4848861694336, -85.51607513427734, -82.54727172851562, -79.57846069335938, -76.60964965820312, -73.6408462524414, -70.67203521728516, -67.70323181152344, -64.73442077636719, -61.7656135559082, -58.79680633544922, -55.82799530029297, -52.859188079833984, -49.890380859375, -46.92156982421875, -43.952762603759766, -40.98395538330078, -38.0151481628418, -35.04634094238281, -32.07752990722656, -29.108722686767578, -26.139915466308594, -23.171106338500977, -20.20229721069336, -17.233489990234375, -14.264681816101074, -11.295873641967773, -8.327065467834473, -5.358257293701172, -2.389449119567871, 0.5793590545654297, 3.548168182373047, 6.516975402832031, 9.485783576965332, 12.454591751098633, 15.423399925231934, 18.392208099365234, 21.36101531982422, 24.329824447631836, 27.298633575439453, 30.267440795898438, 33.23624801635742, 36.205055236816406, 39.173866271972656, 42.14267349243164, 45.111480712890625, 48.080291748046875, 51.04909896850586, 54.017906188964844, 56.98671340942383, 59.95552062988281, 62.92433166503906, 65.89314270019531, 68.86194610595703, 71.83075714111328, 74.799560546875, 77.76837158203125, 80.7371826171875, 83.70598602294922, 86.67479705810547, 89.64360046386719, 92.61241149902344, 95.58122253417969, 98.55003356933594, 101.51883697509766]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 7.0, 15.0, 11.0, 15.0, 15.0, 20.0, 17.0, 19.0, 21.0, 25.0, 39.0, 45.0, 50.0, 54.0, 57.0, 71.0, 77.0, 74.0, 58.0, 62.0, 51.0, 32.0, 20.0, 21.0, 22.0, 16.0, 17.0, 13.0, 5.0, 5.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.4375, -11.096923828125, -10.75634765625, -10.415771484375, -10.0751953125, -9.734619140625, -9.39404296875, -9.053466796875, -8.712890625, -8.372314453125, -8.03173828125, -7.691162109375, -7.3505859375, -7.010009765625, -6.66943359375, -6.328857421875, -5.98828125, -5.647705078125, -5.30712890625, -4.966552734375, -4.6259765625, -4.285400390625, -3.94482421875, -3.604248046875, -3.263671875, -2.923095703125, -2.58251953125, -2.241943359375, -1.9013671875, -1.560791015625, -1.22021484375, -0.879638671875, -0.5390625, -0.198486328125, 0.14208984375, 0.482666015625, 0.8232421875, 1.163818359375, 1.50439453125, 1.844970703125, 2.185546875, 2.526123046875, 2.86669921875, 3.207275390625, 3.5478515625, 3.888427734375, 4.22900390625, 4.569580078125, 4.91015625, 5.250732421875, 5.59130859375, 5.931884765625, 6.2724609375, 6.613037109375, 6.95361328125, 7.294189453125, 7.634765625, 7.975341796875, 8.31591796875, 8.656494140625, 8.9970703125, 9.337646484375, 9.67822265625, 10.018798828125, 10.359375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 7.0, 8.0, 13.0, 15.0, 15.0, 27.0, 30.0, 42.0, 53.0, 76.0, 111.0, 245.0, 438.0, 1046.0, 2529.0, 7849.0, 44036.0, 3920242.0, 200139.0, 11441.0, 3314.0, 1281.0, 567.0, 275.0, 170.0, 87.0, 55.0, 35.0, 28.0, 21.0, 15.0, 8.0, 12.0, 7.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-76.0625, -73.8037109375, -71.544921875, -69.2861328125, -67.02734375, -64.7685546875, -62.509765625, -60.2509765625, -57.9921875, -55.7333984375, -53.474609375, -51.2158203125, -48.95703125, -46.6982421875, -44.439453125, -42.1806640625, -39.921875, -37.6630859375, -35.404296875, -33.1455078125, -30.88671875, -28.6279296875, -26.369140625, -24.1103515625, -21.8515625, -19.5927734375, -17.333984375, -15.0751953125, -12.81640625, -10.5576171875, -8.298828125, -6.0400390625, -3.78125, -1.5224609375, 0.736328125, 2.9951171875, 5.25390625, 7.5126953125, 9.771484375, 12.0302734375, 14.2890625, 16.5478515625, 18.806640625, 21.0654296875, 23.32421875, 25.5830078125, 27.841796875, 30.1005859375, 32.359375, 34.6181640625, 36.876953125, 39.1357421875, 41.39453125, 43.6533203125, 45.912109375, 48.1708984375, 50.4296875, 52.6884765625, 54.947265625, 57.2060546875, 59.46484375, 61.7236328125, 63.982421875, 66.2412109375, 68.5]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 11.0, 16.0, 14.0, 20.0, 49.0, 46.0, 78.0, 156.0, 308.0, 652.0, 1034.0, 751.0, 397.0, 162.0, 87.0, 76.0, 46.0, 27.0, 21.0, 13.0, 20.0, 14.0, 13.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -37.41650390625, -36.2705078125, -35.12451171875, -33.978515625, -32.83251953125, -31.6865234375, -30.54052734375, -29.39453125, -28.24853515625, -27.1025390625, -25.95654296875, -24.810546875, -23.66455078125, -22.5185546875, -21.37255859375, -20.2265625, -19.08056640625, -17.9345703125, -16.78857421875, -15.642578125, -14.49658203125, -13.3505859375, -12.20458984375, -11.05859375, -9.91259765625, -8.7666015625, -7.62060546875, -6.474609375, -5.32861328125, -4.1826171875, -3.03662109375, -1.890625, -0.74462890625, 0.4013671875, 1.54736328125, 2.693359375, 3.83935546875, 4.9853515625, 6.13134765625, 7.27734375, 8.42333984375, 9.5693359375, 10.71533203125, 11.861328125, 13.00732421875, 14.1533203125, 15.29931640625, 16.4453125, 17.59130859375, 18.7373046875, 19.88330078125, 21.029296875, 22.17529296875, 23.3212890625, 24.46728515625, 25.61328125, 26.75927734375, 27.9052734375, 29.05126953125, 30.197265625, 31.34326171875, 32.4892578125, 33.63525390625, 34.78125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 8.0, 11.0, 19.0, 23.0, 25.0, 66.0, 131.0, 278.0, 511.0, 1422.0, 4692.0, 22261.0, 362192.0, 3720072.0, 68306.0, 9988.0, 2600.0, 876.0, 364.0, 163.0, 105.0, 44.0, 29.0, 29.0, 19.0, 12.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.3125, -84.6875, -82.0625, -79.4375, -76.8125, -74.1875, -71.5625, -68.9375, -66.3125, -63.6875, -61.0625, -58.4375, -55.8125, -53.1875, -50.5625, -47.9375, -45.3125, -42.6875, -40.0625, -37.4375, -34.8125, -32.1875, -29.5625, -26.9375, -24.3125, -21.6875, -19.0625, -16.4375, -13.8125, -11.1875, -8.5625, -5.9375, -3.3125, -0.6875, 1.9375, 4.5625, 7.1875, 9.8125, 12.4375, 15.0625, 17.6875, 20.3125, 22.9375, 25.5625, 28.1875, 30.8125, 33.4375, 36.0625, 38.6875, 41.3125, 43.9375, 46.5625, 49.1875, 51.8125, 54.4375, 57.0625, 59.6875, 62.3125, 64.9375, 67.5625, 70.1875, 72.8125, 75.4375, 78.0625, 80.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 38.0, 63.0, 186.0, 318.0, 227.0, 95.0, 31.0, 15.0, 10.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.1020050048828, -245.06678771972656, -239.03158569335938, -232.99636840820312, -226.96115112304688, -220.92593383789062, -214.89073181152344, -208.8555145263672, -202.8203125, -196.78509521484375, -190.74989318847656, -184.7146759033203, -178.67945861816406, -172.64425659179688, -166.60903930664062, -160.57382202148438, -154.53860473632812, -148.50338745117188, -142.4681854248047, -136.43296813964844, -130.3977508544922, -124.36254119873047, -118.32733154296875, -112.2921142578125, -106.25690460205078, -100.22169494628906, -94.18647766113281, -88.1512680053711, -82.11605834960938, -76.08084106445312, -70.0456314086914, -64.01042175292969, -57.9752197265625, -51.940006256103516, -45.90479278564453, -39.86958312988281, -33.83436965942383, -27.799156188964844, -21.763946533203125, -15.72873306274414, -9.693519592285156, -3.6583070755004883, 2.3769054412841797, 8.412117004394531, 14.447330474853516, 20.4825439453125, 26.51775360107422, 32.5529670715332, 38.58818054199219, 44.62339401245117, 50.658607482910156, 56.693817138671875, 62.72903060913086, 68.76424407958984, 74.79945373535156, 80.83467102050781, 86.86988067626953, 92.90509033203125, 98.9403076171875, 104.97551727294922, 111.01072692871094, 117.04594421386719, 123.0811538696289, 129.11636352539062, 135.15158081054688]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 9.0, 14.0, 12.0, 24.0, 16.0, 20.0, 16.0, 26.0, 25.0, 32.0, 29.0, 29.0, 35.0, 28.0, 35.0, 40.0, 43.0, 39.0, 46.0, 34.0, 40.0, 40.0, 31.0, 37.0, 33.0, 35.0, 25.0, 29.0, 19.0, 21.0, 16.0, 17.0, 11.0, 10.0, 10.0, 9.0, 6.0, 5.0, 8.0, 6.0, 0.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.43560791015625, -80.85160827636719, -78.26760864257812, -75.68360900878906, -73.099609375, -70.51560974121094, -67.93161010742188, -65.34761047363281, -62.763607025146484, -60.17960739135742, -57.59560775756836, -55.0116081237793, -52.42760467529297, -49.843605041503906, -47.259605407714844, -44.67560577392578, -42.09160614013672, -39.507606506347656, -36.923606872558594, -34.33960723876953, -31.755605697631836, -29.171606063842773, -26.587604522705078, -24.003604888916016, -21.419605255126953, -18.83560562133789, -16.251605987548828, -13.667604446411133, -11.08360481262207, -8.499605178833008, -5.915604591369629, -3.33160400390625, -0.7476043701171875, 1.8363957405090332, 4.420395851135254, 7.004395961761475, 9.588396072387695, 12.172395706176758, 14.756396293640137, 17.340396881103516, 19.924396514892578, 22.50839614868164, 25.092395782470703, 27.6763973236084, 30.26039695739746, 32.844398498535156, 35.42839813232422, 38.01239776611328, 40.596397399902344, 43.180397033691406, 45.76439666748047, 48.34839630126953, 50.932395935058594, 53.516395568847656, 56.100399017333984, 58.68439865112305, 61.26839828491211, 63.85239791870117, 66.4364013671875, 69.02040100097656, 71.60440063476562, 74.18840026855469, 76.77239990234375, 79.35639953613281, 81.94039916992188]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 12.0, 17.0, 16.0, 12.0, 22.0, 20.0, 29.0, 43.0, 48.0, 42.0, 43.0, 51.0, 70.0, 63.0, 73.0, 82.0, 56.0, 42.0, 32.0, 29.0, 27.0, 25.0, 18.0, 16.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.7454833984375, -10.420654296875, -10.0958251953125, -9.77099609375, -9.4461669921875, -9.121337890625, -8.7965087890625, -8.4716796875, -8.1468505859375, -7.822021484375, -7.4971923828125, -7.17236328125, -6.8475341796875, -6.522705078125, -6.1978759765625, -5.873046875, -5.5482177734375, -5.223388671875, -4.8985595703125, -4.57373046875, -4.2489013671875, -3.924072265625, -3.5992431640625, -3.2744140625, -2.9495849609375, -2.624755859375, -2.2999267578125, -1.97509765625, -1.6502685546875, -1.325439453125, -1.0006103515625, -0.67578125, -0.3509521484375, -0.026123046875, 0.2987060546875, 0.62353515625, 0.9483642578125, 1.273193359375, 1.5980224609375, 1.9228515625, 2.2476806640625, 2.572509765625, 2.8973388671875, 3.22216796875, 3.5469970703125, 3.871826171875, 4.1966552734375, 4.521484375, 4.8463134765625, 5.171142578125, 5.4959716796875, 5.82080078125, 6.1456298828125, 6.470458984375, 6.7952880859375, 7.1201171875, 7.4449462890625, 7.769775390625, 8.0946044921875, 8.41943359375, 8.7442626953125, 9.069091796875, 9.3939208984375, 9.71875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 20.0, 23.0, 27.0, 58.0, 72.0, 122.0, 167.0, 250.0, 354.0, 530.0, 767.0, 1170.0, 1826.0, 2850.0, 4442.0, 7092.0, 12205.0, 22085.0, 42091.0, 90378.0, 212546.0, 321599.0, 171651.0, 73756.0, 35133.0, 18943.0, 10773.0, 6255.0, 3942.0, 2469.0, 1674.0, 1069.0, 684.0, 476.0, 327.0, 232.0, 151.0, 86.0, 87.0, 37.0, 41.0, 18.0, 20.0, 13.0, 7.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.4951171875, -1.4503173828125, -1.405517578125, -1.3607177734375, -1.31591796875, -1.2711181640625, -1.226318359375, -1.1815185546875, -1.13671875, -1.0919189453125, -1.047119140625, -1.0023193359375, -0.95751953125, -0.9127197265625, -0.867919921875, -0.8231201171875, -0.7783203125, -0.7335205078125, -0.688720703125, -0.6439208984375, -0.59912109375, -0.5543212890625, -0.509521484375, -0.4647216796875, -0.419921875, -0.3751220703125, -0.330322265625, -0.2855224609375, -0.24072265625, -0.1959228515625, -0.151123046875, -0.1063232421875, -0.0615234375, -0.0167236328125, 0.028076171875, 0.0728759765625, 0.11767578125, 0.1624755859375, 0.207275390625, 0.2520751953125, 0.296875, 0.3416748046875, 0.386474609375, 0.4312744140625, 0.47607421875, 0.5208740234375, 0.565673828125, 0.6104736328125, 0.6552734375, 0.7000732421875, 0.744873046875, 0.7896728515625, 0.83447265625, 0.8792724609375, 0.924072265625, 0.9688720703125, 1.013671875, 1.0584716796875, 1.103271484375, 1.1480712890625, 1.19287109375, 1.2376708984375, 1.282470703125, 1.3272705078125, 1.3720703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 15.0, 16.0, 17.0, 17.0, 23.0, 26.0, 18.0, 37.0, 40.0, 29.0, 31.0, 41.0, 25.0, 33.0, 64.0, 36.0, 1055.0, 40.0, 37.0, 36.0, 32.0, 41.0, 31.0, 24.0, 25.0, 22.0, 31.0, 26.0, 16.0, 13.0, 10.0, 13.0, 10.0, 8.0, 8.0, 6.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.05859375, -4.9053955078125, -4.752197265625, -4.5989990234375, -4.44580078125, -4.2926025390625, -4.139404296875, -3.9862060546875, -3.8330078125, -3.6798095703125, -3.526611328125, -3.3734130859375, -3.22021484375, -3.0670166015625, -2.913818359375, -2.7606201171875, -2.607421875, -2.4542236328125, -2.301025390625, -2.1478271484375, -1.99462890625, -1.8414306640625, -1.688232421875, -1.5350341796875, -1.3818359375, -1.2286376953125, -1.075439453125, -0.9222412109375, -0.76904296875, -0.6158447265625, -0.462646484375, -0.3094482421875, -0.15625, -0.0030517578125, 0.150146484375, 0.3033447265625, 0.45654296875, 0.6097412109375, 0.762939453125, 0.9161376953125, 1.0693359375, 1.2225341796875, 1.375732421875, 1.5289306640625, 1.68212890625, 1.8353271484375, 1.988525390625, 2.1417236328125, 2.294921875, 2.4481201171875, 2.601318359375, 2.7545166015625, 2.90771484375, 3.0609130859375, 3.214111328125, 3.3673095703125, 3.5205078125, 3.6737060546875, 3.826904296875, 3.9801025390625, 4.13330078125, 4.2864990234375, 4.439697265625, 4.5928955078125, 4.74609375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 9.0, 19.0, 20.0, 22.0, 32.0, 49.0, 72.0, 100.0, 123.0, 240.0, 279.0, 442.0, 596.0, 875.0, 1305.0, 1752.0, 2631.0, 3893.0, 5702.0, 8242.0, 12401.0, 19155.0, 29883.0, 47558.0, 77440.0, 125213.0, 482230.0, 933916.0, 127114.0, 78151.0, 48267.0, 30164.0, 19622.0, 12749.0, 8451.0, 5783.0, 3843.0, 2696.0, 1869.0, 1297.0, 857.0, 624.0, 421.0, 315.0, 218.0, 142.0, 111.0, 80.0, 54.0, 34.0, 25.0, 19.0, 11.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0], "bins": [-0.6259765625, -0.6064224243164062, -0.5868682861328125, -0.5673141479492188, -0.547760009765625, -0.5282058715820312, -0.5086517333984375, -0.48909759521484375, -0.46954345703125, -0.44998931884765625, -0.4304351806640625, -0.41088104248046875, -0.391326904296875, -0.37177276611328125, -0.3522186279296875, -0.33266448974609375, -0.3131103515625, -0.29355621337890625, -0.2740020751953125, -0.25444793701171875, -0.234893798828125, -0.21533966064453125, -0.1957855224609375, -0.17623138427734375, -0.15667724609375, -0.13712310791015625, -0.1175689697265625, -0.09801483154296875, -0.078460693359375, -0.05890655517578125, -0.0393524169921875, -0.01979827880859375, -0.000244140625, 0.01930999755859375, 0.0388641357421875, 0.05841827392578125, 0.077972412109375, 0.09752655029296875, 0.1170806884765625, 0.13663482666015625, 0.15618896484375, 0.17574310302734375, 0.1952972412109375, 0.21485137939453125, 0.234405517578125, 0.25395965576171875, 0.2735137939453125, 0.29306793212890625, 0.3126220703125, 0.33217620849609375, 0.3517303466796875, 0.37128448486328125, 0.390838623046875, 0.41039276123046875, 0.4299468994140625, 0.44950103759765625, 0.46905517578125, 0.48860931396484375, 0.5081634521484375, 0.5277175903320312, 0.547271728515625, 0.5668258666992188, 0.5863800048828125, 0.6059341430664062, 0.62548828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 13.0, 14.0, 14.0, 13.0, 25.0, 26.0, 34.0, 46.0, 64.0, 73.0, 88.0, 93.0, 87.0, 95.0, 65.0, 49.0, 48.0, 43.0, 14.0, 19.0, 16.0, 16.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074462890625, -0.00719761848449707, -0.006948947906494141, -0.006700277328491211, -0.006451606750488281, -0.0062029361724853516, -0.005954265594482422, -0.005705595016479492, -0.0054569244384765625, -0.005208253860473633, -0.004959583282470703, -0.0047109127044677734, -0.004462242126464844, -0.004213571548461914, -0.003964900970458984, -0.0037162303924560547, -0.003467559814453125, -0.0032188892364501953, -0.0029702186584472656, -0.002721548080444336, -0.0024728775024414062, -0.0022242069244384766, -0.001975536346435547, -0.0017268657684326172, -0.0014781951904296875, -0.0012295246124267578, -0.0009808540344238281, -0.0007321834564208984, -0.00048351287841796875, -0.00023484230041503906, 1.3828277587890625e-05, 0.0002624988555908203, 0.00051116943359375, 0.0007598400115966797, 0.0010085105895996094, 0.001257181167602539, 0.0015058517456054688, 0.0017545223236083984, 0.002003192901611328, 0.002251863479614258, 0.0025005340576171875, 0.002749204635620117, 0.002997875213623047, 0.0032465457916259766, 0.0034952163696289062, 0.003743886947631836, 0.003992557525634766, 0.004241228103637695, 0.004489898681640625, 0.004738569259643555, 0.004987239837646484, 0.005235910415649414, 0.005484580993652344, 0.0057332515716552734, 0.005981922149658203, 0.006230592727661133, 0.0064792633056640625, 0.006727933883666992, 0.006976604461669922, 0.0072252750396728516, 0.007473945617675781, 0.007722616195678711, 0.00797128677368164, 0.00821995735168457, 0.0084686279296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 7.0, 11.0, 5.0, 8.0, 15.0, 23.0, 26.0, 27.0, 27.0, 47.0, 60.0, 92.0, 127.0, 199.0, 328.0, 803.0, 11635.0, 1024063.0, 9304.0, 767.0, 312.0, 176.0, 124.0, 103.0, 47.0, 44.0, 35.0, 31.0, 11.0, 13.0, 15.0, 12.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.158447265625, -0.15385055541992188, -0.14925384521484375, -0.14465713500976562, -0.1400604248046875, -0.13546371459960938, -0.13086700439453125, -0.12627029418945312, -0.121673583984375, -0.11707687377929688, -0.11248016357421875, -0.10788345336914062, -0.1032867431640625, -0.09869003295898438, -0.09409332275390625, -0.08949661254882812, -0.08489990234375, -0.08030319213867188, -0.07570648193359375, -0.07110977172851562, -0.0665130615234375, -0.061916351318359375, -0.05731964111328125, -0.052722930908203125, -0.048126220703125, -0.043529510498046875, -0.03893280029296875, -0.034336090087890625, -0.0297393798828125, -0.025142669677734375, -0.02054595947265625, -0.015949249267578125, -0.0113525390625, -0.006755828857421875, -0.00215911865234375, 0.002437591552734375, 0.0070343017578125, 0.011631011962890625, 0.01622772216796875, 0.020824432373046875, 0.025421142578125, 0.030017852783203125, 0.03461456298828125, 0.039211273193359375, 0.0438079833984375, 0.048404693603515625, 0.05300140380859375, 0.057598114013671875, 0.06219482421875, 0.06679153442382812, 0.07138824462890625, 0.07598495483398438, 0.0805816650390625, 0.08517837524414062, 0.08977508544921875, 0.09437179565429688, 0.098968505859375, 0.10356521606445312, 0.10816192626953125, 0.11275863647460938, 0.1173553466796875, 0.12195205688476562, 0.12654876708984375, 0.13114547729492188, 0.1357421875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 15.0, 815.0, 181.0, 7.0], "bins": [-0.1300075352191925, -0.12790335714817047, -0.12579917907714844, -0.1236949935555458, -0.12159080803394318, -0.11948662996292114, -0.11738245189189911, -0.11527826637029648, -0.11317408829927444, -0.11106991022825241, -0.10896572470664978, -0.10686154663562775, -0.10475736111402512, -0.10265318304300308, -0.10054899752140045, -0.09844481945037842, -0.09634064137935638, -0.09423646330833435, -0.09213227778673172, -0.09002809971570969, -0.08792391419410706, -0.08581973612308502, -0.08371555805206299, -0.08161137253046036, -0.07950718700885773, -0.0774030089378357, -0.07529882341623306, -0.07319464534521103, -0.0710904598236084, -0.06898628175258636, -0.06688210368156433, -0.0647779181599617, -0.06267374008893967, -0.060569558292627335, -0.058465376496315, -0.05636119842529297, -0.05425701662898064, -0.052152834832668304, -0.05004865303635597, -0.04794447124004364, -0.04584028944373131, -0.043736107647418976, -0.041631925851106644, -0.03952774405479431, -0.03742356598377228, -0.035319384187459946, -0.033215202391147614, -0.03111102059483528, -0.029006842523813248, -0.026902660727500916, -0.024798480793833733, -0.0226942989975214, -0.020590119063854218, -0.018485937267541885, -0.016381755471229553, -0.014277574606239796, -0.012173393741250038, -0.01006921287626028, -0.007965032011270523, -0.005860850214958191, -0.0037566693499684334, -0.0016524884849786758, 0.0004516933113336563, 0.002555874176323414, 0.004660055506974459]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 13.0, 10.0, 4.0, 12.0, 18.0, 23.0, 21.0, 18.0, 25.0, 28.0, 34.0, 24.0, 29.0, 28.0, 32.0, 45.0, 44.0, 32.0, 51.0, 27.0, 49.0, 43.0, 43.0, 37.0, 36.0, 27.0, 27.0, 23.0, 29.0, 25.0, 27.0, 16.0, 17.0, 21.0, 8.0, 7.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.003438889980316162, -0.0033280132338404655, -0.003217136487364769, -0.0031062597408890724, -0.002995382994413376, -0.0028845062479376793, -0.0027736295014619827, -0.002662752754986286, -0.0025518760085105896, -0.002440999262034893, -0.0023301225155591965, -0.0022192457690835, -0.0021083690226078033, -0.0019974922761321068, -0.0018866155296564102, -0.0017757387831807137, -0.001664862036705017, -0.0015539852902293205, -0.001443108543753624, -0.0013322317972779274, -0.0012213550508022308, -0.0011104783043265343, -0.0009996015578508377, -0.0008887248113751411, -0.0007778480648994446, -0.000666971318423748, -0.0005560945719480515, -0.0004452178254723549, -0.0003343410789966583, -0.00022346433252096176, -0.0001125875860452652, -1.710839569568634e-06, 0.00010916590690612793, 0.0002200426533818245, 0.00033091939985752106, 0.0004417961463332176, 0.0005526728928089142, 0.0006635496392846107, 0.0007744263857603073, 0.0008853031322360039, 0.0009961798787117004, 0.001107056625187397, 0.0012179333716630936, 0.0013288101181387901, 0.0014396868646144867, 0.0015505636110901833, 0.0016614403575658798, 0.0017723171040415764, 0.001883193850517273, 0.0019940705969929695, 0.002104947343468666, 0.0022158240899443626, 0.002326700836420059, 0.0024375775828957558, 0.0025484543293714523, 0.002659331075847149, 0.0027702078223228455, 0.002881084568798542, 0.0029919613152742386, 0.003102838061749935, 0.0032137148082256317, 0.0033245915547013283, 0.003435468301177025, 0.0035463450476527214, 0.003657221794128418]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 12.0, 17.0, 16.0, 12.0, 22.0, 20.0, 29.0, 43.0, 48.0, 42.0, 42.0, 52.0, 70.0, 63.0, 73.0, 82.0, 56.0, 42.0, 32.0, 29.0, 27.0, 25.0, 18.0, 16.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.7454833984375, -10.420654296875, -10.0958251953125, -9.77099609375, -9.4461669921875, -9.121337890625, -8.7965087890625, -8.4716796875, -8.1468505859375, -7.822021484375, -7.4971923828125, -7.17236328125, -6.8475341796875, -6.522705078125, -6.1978759765625, -5.873046875, -5.5482177734375, -5.223388671875, -4.8985595703125, -4.57373046875, -4.2489013671875, -3.924072265625, -3.5992431640625, -3.2744140625, -2.9495849609375, -2.624755859375, -2.2999267578125, -1.97509765625, -1.6502685546875, -1.325439453125, -1.0006103515625, -0.67578125, -0.3509521484375, -0.026123046875, 0.2987060546875, 0.62353515625, 0.9483642578125, 1.273193359375, 1.5980224609375, 1.9228515625, 2.2476806640625, 2.572509765625, 2.8973388671875, 3.22216796875, 3.5469970703125, 3.871826171875, 4.1966552734375, 4.521484375, 4.8463134765625, 5.171142578125, 5.4959716796875, 5.82080078125, 6.1456298828125, 6.470458984375, 6.7952880859375, 7.1201171875, 7.4449462890625, 7.769775390625, 8.0946044921875, 8.41943359375, 8.7442626953125, 9.069091796875, 9.3939208984375, 9.71875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 10.0, 14.0, 19.0, 28.0, 47.0, 58.0, 86.0, 100.0, 155.0, 191.0, 259.0, 408.0, 592.0, 794.0, 1351.0, 2153.0, 3904.0, 7965.0, 23276.0, 126887.0, 767699.0, 78603.0, 17875.0, 6872.0, 3338.0, 1985.0, 1249.0, 810.0, 530.0, 382.0, 249.0, 184.0, 113.0, 95.0, 66.0, 56.0, 28.0, 24.0, 20.0, 14.0, 12.0, 11.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0], "bins": [-20.65625, -20.0556640625, -19.455078125, -18.8544921875, -18.25390625, -17.6533203125, -17.052734375, -16.4521484375, -15.8515625, -15.2509765625, -14.650390625, -14.0498046875, -13.44921875, -12.8486328125, -12.248046875, -11.6474609375, -11.046875, -10.4462890625, -9.845703125, -9.2451171875, -8.64453125, -8.0439453125, -7.443359375, -6.8427734375, -6.2421875, -5.6416015625, -5.041015625, -4.4404296875, -3.83984375, -3.2392578125, -2.638671875, -2.0380859375, -1.4375, -0.8369140625, -0.236328125, 0.3642578125, 0.96484375, 1.5654296875, 2.166015625, 2.7666015625, 3.3671875, 3.9677734375, 4.568359375, 5.1689453125, 5.76953125, 6.3701171875, 6.970703125, 7.5712890625, 8.171875, 8.7724609375, 9.373046875, 9.9736328125, 10.57421875, 11.1748046875, 11.775390625, 12.3759765625, 12.9765625, 13.5771484375, 14.177734375, 14.7783203125, 15.37890625, 15.9794921875, 16.580078125, 17.1806640625, 17.78125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 17.0, 9.0, 7.0, 22.0, 25.0, 19.0, 22.0, 32.0, 31.0, 24.0, 46.0, 34.0, 43.0, 42.0, 54.0, 88.0, 355.0, 1591.0, 123.0, 51.0, 40.0, 44.0, 45.0, 27.0, 31.0, 26.0, 44.0, 25.0, 19.0, 17.0, 13.0, 14.0, 13.0, 7.0, 5.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.96875, -34.8818359375, -33.794921875, -32.7080078125, -31.62109375, -30.5341796875, -29.447265625, -28.3603515625, -27.2734375, -26.1865234375, -25.099609375, -24.0126953125, -22.92578125, -21.8388671875, -20.751953125, -19.6650390625, -18.578125, -17.4912109375, -16.404296875, -15.3173828125, -14.23046875, -13.1435546875, -12.056640625, -10.9697265625, -9.8828125, -8.7958984375, -7.708984375, -6.6220703125, -5.53515625, -4.4482421875, -3.361328125, -2.2744140625, -1.1875, -0.1005859375, 0.986328125, 2.0732421875, 3.16015625, 4.2470703125, 5.333984375, 6.4208984375, 7.5078125, 8.5947265625, 9.681640625, 10.7685546875, 11.85546875, 12.9423828125, 14.029296875, 15.1162109375, 16.203125, 17.2900390625, 18.376953125, 19.4638671875, 20.55078125, 21.6376953125, 22.724609375, 23.8115234375, 24.8984375, 25.9853515625, 27.072265625, 28.1591796875, 29.24609375, 30.3330078125, 31.419921875, 32.5068359375, 33.59375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 4.0, 6.0, 12.0, 9.0, 17.0, 19.0, 16.0, 24.0, 37.0, 63.0, 64.0, 61.0, 106.0, 163.0, 325.0, 843.0, 2232.0, 8037.0, 61823.0, 3028387.0, 33913.0, 6129.0, 1832.0, 706.0, 284.0, 148.0, 99.0, 71.0, 50.0, 44.0, 33.0, 25.0, 21.0, 17.0, 13.0, 18.0, 13.0, 11.0, 2.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.8310546875, -65.599609375, -63.3681640625, -61.13671875, -58.9052734375, -56.673828125, -54.4423828125, -52.2109375, -49.9794921875, -47.748046875, -45.5166015625, -43.28515625, -41.0537109375, -38.822265625, -36.5908203125, -34.359375, -32.1279296875, -29.896484375, -27.6650390625, -25.43359375, -23.2021484375, -20.970703125, -18.7392578125, -16.5078125, -14.2763671875, -12.044921875, -9.8134765625, -7.58203125, -5.3505859375, -3.119140625, -0.8876953125, 1.34375, 3.5751953125, 5.806640625, 8.0380859375, 10.26953125, 12.5009765625, 14.732421875, 16.9638671875, 19.1953125, 21.4267578125, 23.658203125, 25.8896484375, 28.12109375, 30.3525390625, 32.583984375, 34.8154296875, 37.046875, 39.2783203125, 41.509765625, 43.7412109375, 45.97265625, 48.2041015625, 50.435546875, 52.6669921875, 54.8984375, 57.1298828125, 59.361328125, 61.5927734375, 63.82421875, 66.0556640625, 68.287109375, 70.5185546875, 72.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [11.0, 973.0, 34.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40872573852539, -14.626548767089844, 9.155628204345703, 32.937801361083984, 56.7199821472168, 80.50216674804688, 104.28433227539062, 128.06651306152344, 151.84869384765625, 175.63087463378906, 199.41305541992188, 223.19522094726562, 246.97740173339844, 270.75958251953125, 294.541748046875, 318.32391357421875, 342.1061096191406, 365.8882751464844, 389.67047119140625, 413.45263671875, 437.23480224609375, 461.0169982910156, 484.7991638183594, 508.58135986328125, 532.363525390625, 556.1456909179688, 579.9278564453125, 603.7100830078125, 627.4922485351562, 651.2744140625, 675.0565795898438, 698.8387451171875, 722.6209716796875, 746.4031372070312, 770.185302734375, 793.967529296875, 817.7496948242188, 841.5318603515625, 865.3140258789062, 889.09619140625, 912.87841796875, 936.6605834960938, 960.4427490234375, 984.2249755859375, 1008.0071411132812, 1031.789306640625, 1055.571533203125, 1079.3536376953125, 1103.1357421875, 1126.91796875, 1150.7000732421875, 1174.4822998046875, 1198.264404296875, 1222.046630859375, 1245.828857421875, 1269.6109619140625, 1293.3931884765625, 1317.1754150390625, 1340.95751953125, 1364.73974609375, 1388.5218505859375, 1412.3040771484375, 1436.086181640625, 1459.868408203125, 1483.650634765625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 17.0, 16.0, 6.0, 8.0, 14.0, 16.0, 19.0, 22.0, 20.0, 30.0, 30.0, 37.0, 27.0, 37.0, 44.0, 35.0, 40.0, 25.0, 38.0, 45.0, 34.0, 34.0, 33.0, 28.0, 38.0, 38.0, 26.0, 33.0, 25.0, 25.0, 20.0, 17.0, 11.0, 25.0, 15.0, 12.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-100.50743103027344, -97.37393951416016, -94.2404556274414, -91.10696411132812, -87.97348022460938, -84.8399887084961, -81.70649719238281, -78.57301330566406, -75.43952178955078, -72.3060302734375, -69.17254638671875, -66.03905487060547, -62.90556716918945, -59.77207946777344, -56.63859176635742, -53.505104064941406, -50.37161636352539, -47.238128662109375, -44.10464096069336, -40.971153259277344, -37.83766174316406, -34.70417404174805, -31.57068634033203, -28.437196731567383, -25.303709030151367, -22.17022132873535, -19.036731719970703, -15.903244018554688, -12.769755363464355, -9.636266708374023, -6.502779006958008, -3.3692893981933594, -0.23580169677734375, 2.897686719894409, 6.031175136566162, 9.164663314819336, 12.298151969909668, 15.431640625, 18.565128326416016, 21.698617935180664, 24.83210563659668, 27.965593338012695, 31.099082946777344, 34.23257064819336, 37.366058349609375, 40.499549865722656, 43.633033752441406, 46.76652526855469, 49.9000129699707, 53.03350067138672, 56.166988372802734, 59.30047607421875, 62.43396759033203, 65.56745910644531, 68.70094299316406, 71.83443450927734, 74.9679183959961, 78.10140991210938, 81.23489379882812, 84.3683853149414, 87.50186920166016, 90.63536071777344, 93.76884460449219, 96.90233612060547, 100.03582763671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 6.0, 8.0, 7.0, 16.0, 19.0, 16.0, 16.0, 19.0, 30.0, 24.0, 42.0, 37.0, 40.0, 44.0, 59.0, 59.0, 71.0, 66.0, 63.0, 55.0, 57.0, 36.0, 33.0, 26.0, 22.0, 21.0, 12.0, 16.0, 7.0, 7.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.3671875, -11.03369140625, -10.7001953125, -10.36669921875, -10.033203125, -9.69970703125, -9.3662109375, -9.03271484375, -8.69921875, -8.36572265625, -8.0322265625, -7.69873046875, -7.365234375, -7.03173828125, -6.6982421875, -6.36474609375, -6.03125, -5.69775390625, -5.3642578125, -5.03076171875, -4.697265625, -4.36376953125, -4.0302734375, -3.69677734375, -3.36328125, -3.02978515625, -2.6962890625, -2.36279296875, -2.029296875, -1.69580078125, -1.3623046875, -1.02880859375, -0.6953125, -0.36181640625, -0.0283203125, 0.30517578125, 0.638671875, 0.97216796875, 1.3056640625, 1.63916015625, 1.97265625, 2.30615234375, 2.6396484375, 2.97314453125, 3.306640625, 3.64013671875, 3.9736328125, 4.30712890625, 4.640625, 4.97412109375, 5.3076171875, 5.64111328125, 5.974609375, 6.30810546875, 6.6416015625, 6.97509765625, 7.30859375, 7.64208984375, 7.9755859375, 8.30908203125, 8.642578125, 8.97607421875, 9.3095703125, 9.64306640625, 9.9765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 8.0, 11.0, 19.0, 23.0, 30.0, 54.0, 58.0, 108.0, 147.0, 228.0, 386.0, 624.0, 1138.0, 2163.0, 4442.0, 10333.0, 31791.0, 774644.0, 3251072.0, 91259.0, 14207.0, 5710.0, 2607.0, 1298.0, 720.0, 422.0, 258.0, 165.0, 79.0, 77.0, 52.0, 36.0, 26.0, 11.0, 21.0, 10.0, 9.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.947265625, -38.70703125, -37.466796875, -36.2265625, -34.986328125, -33.74609375, -32.505859375, -31.265625, -30.025390625, -28.78515625, -27.544921875, -26.3046875, -25.064453125, -23.82421875, -22.583984375, -21.34375, -20.103515625, -18.86328125, -17.623046875, -16.3828125, -15.142578125, -13.90234375, -12.662109375, -11.421875, -10.181640625, -8.94140625, -7.701171875, -6.4609375, -5.220703125, -3.98046875, -2.740234375, -1.5, -0.259765625, 0.98046875, 2.220703125, 3.4609375, 4.701171875, 5.94140625, 7.181640625, 8.421875, 9.662109375, 10.90234375, 12.142578125, 13.3828125, 14.623046875, 15.86328125, 17.103515625, 18.34375, 19.583984375, 20.82421875, 22.064453125, 23.3046875, 24.544921875, 25.78515625, 27.025390625, 28.265625, 29.505859375, 30.74609375, 31.986328125, 33.2265625, 34.466796875, 35.70703125, 36.947265625, 38.1875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 19.0, 16.0, 21.0, 21.0, 33.0, 30.0, 43.0, 75.0, 118.0, 180.0, 413.0, 591.0, 758.0, 630.0, 379.0, 226.0, 124.0, 81.0, 56.0, 40.0, 28.0, 26.0, 22.0, 10.0, 22.0, 8.0, 12.0, 8.0, 10.0, 6.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.6796875, -21.828125, -20.9765625, -20.125, -19.2734375, -18.421875, -17.5703125, -16.71875, -15.8671875, -15.015625, -14.1640625, -13.3125, -12.4609375, -11.609375, -10.7578125, -9.90625, -9.0546875, -8.203125, -7.3515625, -6.5, -5.6484375, -4.796875, -3.9453125, -3.09375, -2.2421875, -1.390625, -0.5390625, 0.3125, 1.1640625, 2.015625, 2.8671875, 3.71875, 4.5703125, 5.421875, 6.2734375, 7.125, 7.9765625, 8.828125, 9.6796875, 10.53125, 11.3828125, 12.234375, 13.0859375, 13.9375, 14.7890625, 15.640625, 16.4921875, 17.34375, 18.1953125, 19.046875, 19.8984375, 20.75, 21.6015625, 22.453125, 23.3046875, 24.15625, 25.0078125, 25.859375, 26.7109375, 27.5625, 28.4140625, 29.265625, 30.1171875, 30.96875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 11.0, 4.0, 10.0, 13.0, 22.0, 29.0, 57.0, 49.0, 99.0, 163.0, 247.0, 399.0, 817.0, 1568.0, 3360.0, 7678.0, 20301.0, 69365.0, 660917.0, 3173090.0, 194305.0, 38642.0, 12887.0, 5284.0, 2359.0, 1135.0, 579.0, 299.0, 192.0, 120.0, 97.0, 65.0, 37.0, 24.0, 12.0, 12.0, 7.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.96875, -34.650390625, -33.33203125, -32.013671875, -30.6953125, -29.376953125, -28.05859375, -26.740234375, -25.421875, -24.103515625, -22.78515625, -21.466796875, -20.1484375, -18.830078125, -17.51171875, -16.193359375, -14.875, -13.556640625, -12.23828125, -10.919921875, -9.6015625, -8.283203125, -6.96484375, -5.646484375, -4.328125, -3.009765625, -1.69140625, -0.373046875, 0.9453125, 2.263671875, 3.58203125, 4.900390625, 6.21875, 7.537109375, 8.85546875, 10.173828125, 11.4921875, 12.810546875, 14.12890625, 15.447265625, 16.765625, 18.083984375, 19.40234375, 20.720703125, 22.0390625, 23.357421875, 24.67578125, 25.994140625, 27.3125, 28.630859375, 29.94921875, 31.267578125, 32.5859375, 33.904296875, 35.22265625, 36.541015625, 37.859375, 39.177734375, 40.49609375, 41.814453125, 43.1328125, 44.451171875, 45.76953125, 47.087890625, 48.40625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 27.0, 81.0, 275.0, 378.0, 152.0, 57.0, 20.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.1268310546875, -237.38064575195312, -228.6344451904297, -219.8882598876953, -211.14205932617188, -202.3958740234375, -193.64968872070312, -184.90350341796875, -176.1573028564453, -167.41111755371094, -158.6649169921875, -149.91873168945312, -141.17254638671875, -132.4263458251953, -123.68016052246094, -114.93396759033203, -106.18777465820312, -97.44158172607422, -88.69538879394531, -79.94920349121094, -71.20301055908203, -62.456817626953125, -53.710628509521484, -44.964439392089844, -36.21824645996094, -27.472055435180664, -18.72586441040039, -9.979673385620117, -1.2334823608398438, 7.5127105712890625, 16.258899688720703, 25.005088806152344, 33.751251220703125, 42.49744415283203, 51.24363327026367, 59.98982238769531, 68.73601531982422, 77.48220825195312, 86.2283935546875, 94.9745864868164, 103.72077941894531, 112.46697235107422, 121.21316528320312, 129.9593505859375, 138.70553588867188, 147.4517364501953, 156.1979217529297, 164.94412231445312, 173.6903076171875, 182.43649291992188, 191.1826934814453, 199.9288787841797, 208.67507934570312, 217.4212646484375, 226.16744995117188, 234.91363525390625, 243.6598358154297, 252.40602111816406, 261.1522216796875, 269.8984069824219, 278.64459228515625, 287.39080810546875, 296.1369934082031, 304.8831787109375, 313.6293640136719]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 5.0, 9.0, 5.0, 10.0, 13.0, 16.0, 19.0, 23.0, 24.0, 24.0, 22.0, 34.0, 37.0, 33.0, 43.0, 47.0, 36.0, 49.0, 33.0, 38.0, 39.0, 44.0, 41.0, 21.0, 32.0, 34.0, 29.0, 30.0, 26.0, 21.0, 25.0, 15.0, 19.0, 14.0, 9.0, 19.0, 16.0, 5.0, 7.0, 10.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-88.31908416748047, -85.6746826171875, -83.03028869628906, -80.38589477539062, -77.74149322509766, -75.09709167480469, -72.45269775390625, -69.80830383300781, -67.16390228271484, -64.51950073242188, -61.87510681152344, -59.230709075927734, -56.58631134033203, -53.94191360473633, -51.297515869140625, -48.65311813354492, -46.00872039794922, -43.364322662353516, -40.71992492675781, -38.07552719116211, -35.431129455566406, -32.7867317199707, -30.142333984375, -27.497936248779297, -24.853538513183594, -22.20914077758789, -19.564743041992188, -16.920345306396484, -14.275947570800781, -11.631549835205078, -8.987152099609375, -6.342754364013672, -3.6983489990234375, -1.0539512634277344, 1.5904464721679688, 4.234844207763672, 6.879241943359375, 9.523639678955078, 12.168037414550781, 14.812435150146484, 17.456832885742188, 20.10123062133789, 22.745628356933594, 25.390026092529297, 28.034423828125, 30.678821563720703, 33.323219299316406, 35.96761703491211, 38.61201477050781, 41.256412506103516, 43.90081024169922, 46.54520797729492, 49.189605712890625, 51.83400344848633, 54.47840118408203, 57.122798919677734, 59.76719665527344, 62.41159439086914, 65.05599212646484, 67.70039367675781, 70.34478759765625, 72.98918151855469, 75.63358306884766, 78.27798461914062, 80.92237854003906]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 8.0, 7.0, 13.0, 17.0, 22.0, 20.0, 17.0, 26.0, 34.0, 33.0, 39.0, 44.0, 60.0, 45.0, 64.0, 57.0, 69.0, 53.0, 45.0, 45.0, 35.0, 47.0, 35.0, 29.0, 21.0, 14.0, 10.0, 6.0, 5.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8984375, -10.570068359375, -10.24169921875, -9.913330078125, -9.5849609375, -9.256591796875, -8.92822265625, -8.599853515625, -8.271484375, -7.943115234375, -7.61474609375, -7.286376953125, -6.9580078125, -6.629638671875, -6.30126953125, -5.972900390625, -5.64453125, -5.316162109375, -4.98779296875, -4.659423828125, -4.3310546875, -4.002685546875, -3.67431640625, -3.345947265625, -3.017578125, -2.689208984375, -2.36083984375, -2.032470703125, -1.7041015625, -1.375732421875, -1.04736328125, -0.718994140625, -0.390625, -0.062255859375, 0.26611328125, 0.594482421875, 0.9228515625, 1.251220703125, 1.57958984375, 1.907958984375, 2.236328125, 2.564697265625, 2.89306640625, 3.221435546875, 3.5498046875, 3.878173828125, 4.20654296875, 4.534912109375, 4.86328125, 5.191650390625, 5.52001953125, 5.848388671875, 6.1767578125, 6.505126953125, 6.83349609375, 7.161865234375, 7.490234375, 7.818603515625, 8.14697265625, 8.475341796875, 8.8037109375, 9.132080078125, 9.46044921875, 9.788818359375, 10.1171875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 12.0, 22.0, 18.0, 33.0, 52.0, 80.0, 97.0, 138.0, 186.0, 260.0, 361.0, 528.0, 742.0, 1032.0, 1428.0, 2045.0, 3067.0, 4300.0, 6546.0, 10278.0, 15941.0, 26144.0, 43446.0, 74776.0, 134874.0, 221942.0, 207578.0, 119500.0, 67131.0, 38980.0, 23328.0, 14451.0, 9469.0, 6055.0, 4149.0, 2820.0, 1943.0, 1429.0, 971.0, 667.0, 500.0, 364.0, 232.0, 186.0, 117.0, 95.0, 66.0, 59.0, 40.0, 22.0, 25.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.1103515625, -1.0755462646484375, -1.040740966796875, -1.0059356689453125, -0.97113037109375, -0.9363250732421875, -0.901519775390625, -0.8667144775390625, -0.8319091796875, -0.7971038818359375, -0.762298583984375, -0.7274932861328125, -0.69268798828125, -0.6578826904296875, -0.623077392578125, -0.5882720947265625, -0.553466796875, -0.5186614990234375, -0.483856201171875, -0.4490509033203125, -0.41424560546875, -0.3794403076171875, -0.344635009765625, -0.3098297119140625, -0.2750244140625, -0.2402191162109375, -0.205413818359375, -0.1706085205078125, -0.13580322265625, -0.1009979248046875, -0.066192626953125, -0.0313873291015625, 0.00341796875, 0.0382232666015625, 0.073028564453125, 0.1078338623046875, 0.14263916015625, 0.1774444580078125, 0.212249755859375, 0.2470550537109375, 0.2818603515625, 0.3166656494140625, 0.351470947265625, 0.3862762451171875, 0.42108154296875, 0.4558868408203125, 0.490692138671875, 0.5254974365234375, 0.560302734375, 0.5951080322265625, 0.629913330078125, 0.6647186279296875, 0.69952392578125, 0.7343292236328125, 0.769134521484375, 0.8039398193359375, 0.8387451171875, 0.8735504150390625, 0.908355712890625, 0.9431610107421875, 0.97796630859375, 1.0127716064453125, 1.047576904296875, 1.0823822021484375, 1.1171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 5.0, 8.0, 12.0, 15.0, 21.0, 16.0, 19.0, 29.0, 27.0, 29.0, 30.0, 32.0, 36.0, 33.0, 42.0, 33.0, 30.0, 1074.0, 34.0, 44.0, 39.0, 49.0, 34.0, 32.0, 24.0, 30.0, 33.0, 32.0, 18.0, 20.0, 18.0, 15.0, 12.0, 13.0, 9.0, 11.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.09661865234375, -4.9315185546875, -4.76641845703125, -4.601318359375, -4.43621826171875, -4.2711181640625, -4.10601806640625, -3.94091796875, -3.77581787109375, -3.6107177734375, -3.44561767578125, -3.280517578125, -3.11541748046875, -2.9503173828125, -2.78521728515625, -2.6201171875, -2.45501708984375, -2.2899169921875, -2.12481689453125, -1.959716796875, -1.79461669921875, -1.6295166015625, -1.46441650390625, -1.29931640625, -1.13421630859375, -0.9691162109375, -0.80401611328125, -0.638916015625, -0.47381591796875, -0.3087158203125, -0.14361572265625, 0.021484375, 0.18658447265625, 0.3516845703125, 0.51678466796875, 0.681884765625, 0.84698486328125, 1.0120849609375, 1.17718505859375, 1.34228515625, 1.50738525390625, 1.6724853515625, 1.83758544921875, 2.002685546875, 2.16778564453125, 2.3328857421875, 2.49798583984375, 2.6630859375, 2.82818603515625, 2.9932861328125, 3.15838623046875, 3.323486328125, 3.48858642578125, 3.6536865234375, 3.81878662109375, 3.98388671875, 4.14898681640625, 4.3140869140625, 4.47918701171875, 4.644287109375, 4.80938720703125, 4.9744873046875, 5.13958740234375, 5.3046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 17.0, 20.0, 32.0, 51.0, 66.0, 126.0, 158.0, 247.0, 381.0, 591.0, 899.0, 1429.0, 2114.0, 3394.0, 5392.0, 8580.0, 14164.0, 24307.0, 42070.0, 74483.0, 131884.0, 478216.0, 994125.0, 133425.0, 75433.0, 42635.0, 24482.0, 14548.0, 8734.0, 5471.0, 3481.0, 2131.0, 1403.0, 887.0, 628.0, 333.0, 262.0, 178.0, 111.0, 65.0, 67.0, 31.0, 26.0, 19.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.82861328125, -0.8035125732421875, -0.778411865234375, -0.7533111572265625, -0.72821044921875, -0.7031097412109375, -0.678009033203125, -0.6529083251953125, -0.6278076171875, -0.6027069091796875, -0.577606201171875, -0.5525054931640625, -0.52740478515625, -0.5023040771484375, -0.477203369140625, -0.4521026611328125, -0.427001953125, -0.4019012451171875, -0.376800537109375, -0.3516998291015625, -0.32659912109375, -0.3014984130859375, -0.276397705078125, -0.2512969970703125, -0.2261962890625, -0.2010955810546875, -0.175994873046875, -0.1508941650390625, -0.12579345703125, -0.1006927490234375, -0.075592041015625, -0.0504913330078125, -0.025390625, -0.0002899169921875, 0.024810791015625, 0.0499114990234375, 0.07501220703125, 0.1001129150390625, 0.125213623046875, 0.1503143310546875, 0.1754150390625, 0.2005157470703125, 0.225616455078125, 0.2507171630859375, 0.27581787109375, 0.3009185791015625, 0.326019287109375, 0.3511199951171875, 0.376220703125, 0.4013214111328125, 0.426422119140625, 0.4515228271484375, 0.47662353515625, 0.5017242431640625, 0.526824951171875, 0.5519256591796875, 0.5770263671875, 0.6021270751953125, 0.627227783203125, 0.6523284912109375, 0.67742919921875, 0.7025299072265625, 0.727630615234375, 0.7527313232421875, 0.77783203125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 6.0, 13.0, 10.0, 13.0, 16.0, 24.0, 27.0, 38.0, 45.0, 47.0, 71.0, 90.0, 112.0, 95.0, 82.0, 57.0, 48.0, 41.0, 16.0, 18.0, 24.0, 18.0, 16.0, 11.0, 14.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00861358642578125, -0.00835716724395752, -0.008100748062133789, -0.007844328880310059, -0.007587909698486328, -0.007331490516662598, -0.007075071334838867, -0.006818652153015137, -0.006562232971191406, -0.006305813789367676, -0.006049394607543945, -0.005792975425720215, -0.005536556243896484, -0.005280137062072754, -0.0050237178802490234, -0.004767298698425293, -0.0045108795166015625, -0.004254460334777832, -0.0039980411529541016, -0.003741621971130371, -0.0034852027893066406, -0.00322878360748291, -0.0029723644256591797, -0.0027159452438354492, -0.0024595260620117188, -0.0022031068801879883, -0.0019466876983642578, -0.0016902685165405273, -0.0014338493347167969, -0.0011774301528930664, -0.0009210109710693359, -0.0006645917892456055, -0.000408172607421875, -0.00015175342559814453, 0.00010466575622558594, 0.0003610849380493164, 0.0006175041198730469, 0.0008739233016967773, 0.0011303424835205078, 0.0013867616653442383, 0.0016431808471679688, 0.0018996000289916992, 0.0021560192108154297, 0.00241243839263916, 0.0026688575744628906, 0.002925276756286621, 0.0031816959381103516, 0.003438115119934082, 0.0036945343017578125, 0.003950953483581543, 0.0042073726654052734, 0.004463791847229004, 0.004720211029052734, 0.004976630210876465, 0.005233049392700195, 0.005489468574523926, 0.005745887756347656, 0.006002306938171387, 0.006258726119995117, 0.006515145301818848, 0.006771564483642578, 0.007027983665466309, 0.007284402847290039, 0.0075408220291137695, 0.0077972412109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 11.0, 12.0, 8.0, 14.0, 19.0, 21.0, 28.0, 31.0, 61.0, 67.0, 66.0, 104.0, 143.0, 257.0, 515.0, 2864.0, 952007.0, 89949.0, 1226.0, 399.0, 199.0, 111.0, 89.0, 61.0, 47.0, 47.0, 35.0, 27.0, 23.0, 19.0, 20.0, 14.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.1671142578125, -0.16245079040527344, -0.15778732299804688, -0.1531238555908203, -0.14846038818359375, -0.1437969207763672, -0.13913345336914062, -0.13446998596191406, -0.1298065185546875, -0.12514305114746094, -0.12047958374023438, -0.11581611633300781, -0.11115264892578125, -0.10648918151855469, -0.10182571411132812, -0.09716224670410156, -0.092498779296875, -0.08783531188964844, -0.08317184448242188, -0.07850837707519531, -0.07384490966796875, -0.06918144226074219, -0.06451797485351562, -0.05985450744628906, -0.0551910400390625, -0.05052757263183594, -0.045864105224609375, -0.04120063781738281, -0.03653717041015625, -0.03187370300292969, -0.027210235595703125, -0.022546768188476562, -0.01788330078125, -0.013219833374023438, -0.008556365966796875, -0.0038928985595703125, 0.00077056884765625, 0.0054340362548828125, 0.010097503662109375, 0.014760971069335938, 0.0194244384765625, 0.024087905883789062, 0.028751373291015625, 0.03341484069824219, 0.03807830810546875, 0.04274177551269531, 0.047405242919921875, 0.05206871032714844, 0.056732177734375, 0.06139564514160156, 0.06605911254882812, 0.07072257995605469, 0.07538604736328125, 0.08004951477050781, 0.08471298217773438, 0.08937644958496094, 0.0940399169921875, 0.09870338439941406, 0.10336685180664062, 0.10803031921386719, 0.11269378662109375, 0.11735725402832031, 0.12202072143554688, 0.12668418884277344, 0.13134765625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 14.0, 767.0, 230.0, 5.0, 1.0], "bins": [-0.14893925189971924, -0.14648935198783875, -0.14403945207595825, -0.14158955216407776, -0.13913966715335846, -0.13668976724147797, -0.13423986732959747, -0.13178996741771698, -0.1293400675058365, -0.126890167593956, -0.1244402751326561, -0.1219903752207756, -0.11954047530889511, -0.11709058284759521, -0.11464068293571472, -0.11219078302383423, -0.10974089056253433, -0.10729099065065384, -0.10484109818935394, -0.10239119827747345, -0.09994129836559296, -0.09749139845371246, -0.09504150599241257, -0.09259160608053207, -0.09014171361923218, -0.08769181370735168, -0.08524192124605179, -0.0827920213341713, -0.0803421214222908, -0.0778922289609909, -0.07544232904911041, -0.07299242913722992, -0.07054253667593002, -0.06809263676404953, -0.06564274430274963, -0.06319284439086914, -0.06074294447898865, -0.05829304829239845, -0.05584315210580826, -0.053393252193927765, -0.05094335600733757, -0.048493459820747375, -0.04604355990886688, -0.04359366372227669, -0.04114376753568649, -0.038693867623806, -0.036243971437215805, -0.03379407525062561, -0.03134417533874512, -0.028894277289509773, -0.02644437924027443, -0.023994483053684235, -0.02154458500444889, -0.019094686955213547, -0.016644790768623352, -0.014194892719388008, -0.01174499373883009, -0.00929509662091732, -0.006845198571681976, -0.00439530098810792, -0.001945403404533863, 0.0005044946447014809, 0.00295439176261425, 0.0054042888805270195, 0.007854186929762363]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 11.0, 10.0, 7.0, 5.0, 5.0, 15.0, 8.0, 14.0, 18.0, 16.0, 21.0, 31.0, 30.0, 21.0, 24.0, 23.0, 30.0, 38.0, 33.0, 31.0, 28.0, 45.0, 29.0, 27.0, 33.0, 39.0, 38.0, 36.0, 31.0, 23.0, 35.0, 33.0, 24.0, 27.0, 18.0, 23.0, 25.0, 18.0, 16.0, 12.0, 6.0, 8.0, 14.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038304924964904785, -0.003705178387463093, -0.003579864278435707, -0.0034545501694083214, -0.0033292360603809357, -0.00320392195135355, -0.0030786078423261642, -0.0029532937332987785, -0.002827979624271393, -0.002702665515244007, -0.0025773514062166214, -0.0024520372971892357, -0.00232672318816185, -0.0022014090791344643, -0.0020760949701070786, -0.0019507808610796928, -0.0018254667520523071, -0.0017001526430249214, -0.0015748385339975357, -0.00144952442497015, -0.0013242103159427643, -0.0011988962069153786, -0.0010735820978879929, -0.0009482679888606071, -0.0008229538798332214, -0.0006976397708058357, -0.00057232566177845, -0.0004470115527510643, -0.0003216974437236786, -0.00019638333469629288, -7.106922566890717e-05, 5.4244883358478546e-05, 0.00017955899238586426, 0.00030487310141324997, 0.0004301872104406357, 0.0005555013194680214, 0.0006808154284954071, 0.0008061295375227928, 0.0009314436465501785, 0.0010567577555775642, 0.00118207186460495, 0.0013073859736323357, 0.0014327000826597214, 0.001558014191687107, 0.0016833283007144928, 0.0018086424097418785, 0.0019339565187692642, 0.00205927062779665, 0.0021845847368240356, 0.0023098988458514214, 0.002435212954878807, 0.0025605270639061928, 0.0026858411729335785, 0.002811155281960964, 0.00293646939098835, 0.0030617835000157356, 0.0031870976090431213, 0.003312411718070507, 0.0034377258270978928, 0.0035630399361252785, 0.003688354045152664, 0.00381366815418005, 0.003938982263207436, 0.004064296372234821, 0.004189610481262207]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 8.0, 7.0, 13.0, 17.0, 22.0, 20.0, 17.0, 26.0, 34.0, 33.0, 39.0, 44.0, 60.0, 45.0, 64.0, 57.0, 69.0, 53.0, 45.0, 45.0, 35.0, 47.0, 35.0, 29.0, 21.0, 14.0, 10.0, 6.0, 5.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8984375, -10.570068359375, -10.24169921875, -9.913330078125, -9.5849609375, -9.256591796875, -8.92822265625, -8.599853515625, -8.271484375, -7.943115234375, -7.61474609375, -7.286376953125, -6.9580078125, -6.629638671875, -6.30126953125, -5.972900390625, -5.64453125, -5.316162109375, -4.98779296875, -4.659423828125, -4.3310546875, -4.002685546875, -3.67431640625, -3.345947265625, -3.017578125, -2.689208984375, -2.36083984375, -2.032470703125, -1.7041015625, -1.375732421875, -1.04736328125, -0.718994140625, -0.390625, -0.062255859375, 0.26611328125, 0.594482421875, 0.9228515625, 1.251220703125, 1.57958984375, 1.907958984375, 2.236328125, 2.564697265625, 2.89306640625, 3.221435546875, 3.5498046875, 3.878173828125, 4.20654296875, 4.534912109375, 4.86328125, 5.191650390625, 5.52001953125, 5.848388671875, 6.1767578125, 6.505126953125, 6.83349609375, 7.161865234375, 7.490234375, 7.818603515625, 8.14697265625, 8.475341796875, 8.8037109375, 9.132080078125, 9.46044921875, 9.788818359375, 10.1171875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 10.0, 15.0, 19.0, 14.0, 33.0, 43.0, 50.0, 73.0, 111.0, 153.0, 213.0, 272.0, 421.0, 663.0, 952.0, 1565.0, 2742.0, 5209.0, 12235.0, 37259.0, 210956.0, 654152.0, 83007.0, 20911.0, 7756.0, 3763.0, 2058.0, 1275.0, 843.0, 557.0, 353.0, 256.0, 194.0, 119.0, 85.0, 51.0, 43.0, 33.0, 25.0, 15.0, 18.0, 12.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-16.5, -16.0184326171875, -15.536865234375, -15.0552978515625, -14.57373046875, -14.0921630859375, -13.610595703125, -13.1290283203125, -12.6474609375, -12.1658935546875, -11.684326171875, -11.2027587890625, -10.72119140625, -10.2396240234375, -9.758056640625, -9.2764892578125, -8.794921875, -8.3133544921875, -7.831787109375, -7.3502197265625, -6.86865234375, -6.3870849609375, -5.905517578125, -5.4239501953125, -4.9423828125, -4.4608154296875, -3.979248046875, -3.4976806640625, -3.01611328125, -2.5345458984375, -2.052978515625, -1.5714111328125, -1.08984375, -0.6082763671875, -0.126708984375, 0.3548583984375, 0.83642578125, 1.3179931640625, 1.799560546875, 2.2811279296875, 2.7626953125, 3.2442626953125, 3.725830078125, 4.2073974609375, 4.68896484375, 5.1705322265625, 5.652099609375, 6.1336669921875, 6.615234375, 7.0968017578125, 7.578369140625, 8.0599365234375, 8.54150390625, 9.0230712890625, 9.504638671875, 9.9862060546875, 10.4677734375, 10.9493408203125, 11.430908203125, 11.9124755859375, 12.39404296875, 12.8756103515625, 13.357177734375, 13.8387451171875, 14.3203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 12.0, 4.0, 10.0, 11.0, 18.0, 16.0, 21.0, 14.0, 22.0, 39.0, 24.0, 49.0, 37.0, 40.0, 46.0, 58.0, 86.0, 225.0, 1694.0, 156.0, 69.0, 62.0, 45.0, 31.0, 40.0, 28.0, 38.0, 25.0, 22.0, 28.0, 18.0, 11.0, 11.0, 11.0, 9.0, 3.0, 8.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.71875, -35.50732421875, -34.2958984375, -33.08447265625, -31.873046875, -30.66162109375, -29.4501953125, -28.23876953125, -27.02734375, -25.81591796875, -24.6044921875, -23.39306640625, -22.181640625, -20.97021484375, -19.7587890625, -18.54736328125, -17.3359375, -16.12451171875, -14.9130859375, -13.70166015625, -12.490234375, -11.27880859375, -10.0673828125, -8.85595703125, -7.64453125, -6.43310546875, -5.2216796875, -4.01025390625, -2.798828125, -1.58740234375, -0.3759765625, 0.83544921875, 2.046875, 3.25830078125, 4.4697265625, 5.68115234375, 6.892578125, 8.10400390625, 9.3154296875, 10.52685546875, 11.73828125, 12.94970703125, 14.1611328125, 15.37255859375, 16.583984375, 17.79541015625, 19.0068359375, 20.21826171875, 21.4296875, 22.64111328125, 23.8525390625, 25.06396484375, 26.275390625, 27.48681640625, 28.6982421875, 29.90966796875, 31.12109375, 32.33251953125, 33.5439453125, 34.75537109375, 35.966796875, 37.17822265625, 38.3896484375, 39.60107421875, 40.8125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 4.0, 3.0, 6.0, 5.0, 12.0, 10.0, 15.0, 23.0, 28.0, 28.0, 53.0, 57.0, 79.0, 139.0, 266.0, 665.0, 2412.0, 19540.0, 2893719.0, 219074.0, 7158.0, 1332.0, 442.0, 210.0, 107.0, 91.0, 58.0, 37.0, 21.0, 21.0, 16.0, 21.0, 12.0, 13.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.0, -65.017578125, -63.03515625, -61.052734375, -59.0703125, -57.087890625, -55.10546875, -53.123046875, -51.140625, -49.158203125, -47.17578125, -45.193359375, -43.2109375, -41.228515625, -39.24609375, -37.263671875, -35.28125, -33.298828125, -31.31640625, -29.333984375, -27.3515625, -25.369140625, -23.38671875, -21.404296875, -19.421875, -17.439453125, -15.45703125, -13.474609375, -11.4921875, -9.509765625, -7.52734375, -5.544921875, -3.5625, -1.580078125, 0.40234375, 2.384765625, 4.3671875, 6.349609375, 8.33203125, 10.314453125, 12.296875, 14.279296875, 16.26171875, 18.244140625, 20.2265625, 22.208984375, 24.19140625, 26.173828125, 28.15625, 30.138671875, 32.12109375, 34.103515625, 36.0859375, 38.068359375, 40.05078125, 42.033203125, 44.015625, 45.998046875, 47.98046875, 49.962890625, 51.9453125, 53.927734375, 55.91015625, 57.892578125, 59.875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 8.0, 56.0, 189.0, 351.0, 260.0, 107.0, 24.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.969234466552734, -60.372314453125, -56.775394439697266, -53.17847442626953, -49.58155059814453, -45.9846305847168, -42.38771057128906, -38.79078674316406, -35.193870544433594, -31.59695053100586, -28.000028610229492, -24.403108596801758, -20.80618667602539, -17.209266662597656, -13.612346649169922, -10.015424728393555, -6.4185028076171875, -2.821582078933716, 0.7753386497497559, 4.372259140014648, 7.969180107116699, 11.56610107421875, 15.163021087646484, 18.75994300842285, 22.356863021850586, 25.95378303527832, 29.550704956054688, 33.14762496948242, 36.744544982910156, 40.341468811035156, 43.938385009765625, 47.535308837890625, 51.132225036621094, 54.72914505004883, 58.32606506347656, 61.92298889160156, 65.51990509033203, 69.11682891845703, 72.7137451171875, 76.3106689453125, 79.9075927734375, 83.5045166015625, 87.10143280029297, 90.69835662841797, 94.29527282714844, 97.89219665527344, 101.48912048339844, 105.0860366821289, 108.68295288085938, 112.27987670898438, 115.87679290771484, 119.47371673583984, 123.07063293457031, 126.66755676269531, 130.2644805908203, 133.8614044189453, 137.4583282470703, 141.0552520751953, 144.6521759033203, 148.24908447265625, 151.84600830078125, 155.44293212890625, 159.03985595703125, 162.63677978515625, 166.2336883544922]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 9.0, 8.0, 10.0, 10.0, 14.0, 10.0, 12.0, 21.0, 35.0, 27.0, 31.0, 26.0, 30.0, 37.0, 41.0, 43.0, 29.0, 30.0, 39.0, 37.0, 35.0, 43.0, 34.0, 47.0, 37.0, 28.0, 28.0, 23.0, 27.0, 27.0, 27.0, 20.0, 18.0, 9.0, 17.0, 13.0, 16.0, 11.0, 4.0, 6.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-111.24638366699219, -107.84172058105469, -104.43705749511719, -101.03239440917969, -97.62772369384766, -94.22306060791016, -90.81839752197266, -87.41373443603516, -84.00907135009766, -80.60440826416016, -77.19974517822266, -73.79507446289062, -70.39041137695312, -66.98574829101562, -63.581085205078125, -60.176422119140625, -56.77175521850586, -53.36709213256836, -49.962425231933594, -46.557762145996094, -43.153099060058594, -39.748435974121094, -36.34376907348633, -32.93910598754883, -29.534440994262695, -26.129776000976562, -22.725112915039062, -19.32044792175293, -15.915783882141113, -12.511119842529297, -9.106454849243164, -5.701791763305664, -2.2971267700195312, 1.1075375080108643, 4.51220178604126, 7.916866302490234, 11.32153034210205, 14.726194381713867, 18.130859375, 21.5355224609375, 24.940187454223633, 28.344852447509766, 31.749515533447266, 35.15418243408203, 38.55884552001953, 41.96350860595703, 45.36817169189453, 48.77283477783203, 52.1775016784668, 55.5821647644043, 58.98683166503906, 62.39149475097656, 65.79615783691406, 69.20082092285156, 72.60548400878906, 76.01014709472656, 79.4148178100586, 82.8194808959961, 86.2241439819336, 89.62881469726562, 93.03347778320312, 96.43814086914062, 99.84280395507812, 103.24746704101562, 106.65213012695312]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 13.0, 7.0, 9.0, 14.0, 19.0, 20.0, 21.0, 27.0, 27.0, 32.0, 31.0, 55.0, 34.0, 54.0, 55.0, 58.0, 65.0, 56.0, 47.0, 45.0, 37.0, 40.0, 39.0, 35.0, 23.0, 24.0, 13.0, 12.0, 6.0, 10.0, 5.0, 10.0, 5.0, 5.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.203125, -10.8714599609375, -10.539794921875, -10.2081298828125, -9.87646484375, -9.5447998046875, -9.213134765625, -8.8814697265625, -8.5498046875, -8.2181396484375, -7.886474609375, -7.5548095703125, -7.22314453125, -6.8914794921875, -6.559814453125, -6.2281494140625, -5.896484375, -5.5648193359375, -5.233154296875, -4.9014892578125, -4.56982421875, -4.2381591796875, -3.906494140625, -3.5748291015625, -3.2431640625, -2.9114990234375, -2.579833984375, -2.2481689453125, -1.91650390625, -1.5848388671875, -1.253173828125, -0.9215087890625, -0.58984375, -0.2581787109375, 0.073486328125, 0.4051513671875, 0.73681640625, 1.0684814453125, 1.400146484375, 1.7318115234375, 2.0634765625, 2.3951416015625, 2.726806640625, 3.0584716796875, 3.39013671875, 3.7218017578125, 4.053466796875, 4.3851318359375, 4.716796875, 5.0484619140625, 5.380126953125, 5.7117919921875, 6.04345703125, 6.3751220703125, 6.706787109375, 7.0384521484375, 7.3701171875, 7.7017822265625, 8.033447265625, 8.3651123046875, 8.69677734375, 9.0284423828125, 9.360107421875, 9.6917724609375, 10.0234375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 15.0, 22.0, 17.0, 31.0, 37.0, 71.0, 96.0, 124.0, 196.0, 313.0, 459.0, 728.0, 1174.0, 1936.0, 3171.0, 5975.0, 11482.0, 27569.0, 229251.0, 3214204.0, 623324.0, 44475.0, 13755.0, 6625.0, 3585.0, 2044.0, 1235.0, 746.0, 499.0, 346.0, 244.0, 157.0, 102.0, 69.0, 67.0, 35.0, 25.0, 25.0, 18.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.796875, -29.823974609375, -28.85107421875, -27.878173828125, -26.9052734375, -25.932373046875, -24.95947265625, -23.986572265625, -23.013671875, -22.040771484375, -21.06787109375, -20.094970703125, -19.1220703125, -18.149169921875, -17.17626953125, -16.203369140625, -15.23046875, -14.257568359375, -13.28466796875, -12.311767578125, -11.3388671875, -10.365966796875, -9.39306640625, -8.420166015625, -7.447265625, -6.474365234375, -5.50146484375, -4.528564453125, -3.5556640625, -2.582763671875, -1.60986328125, -0.636962890625, 0.3359375, 1.308837890625, 2.28173828125, 3.254638671875, 4.2275390625, 5.200439453125, 6.17333984375, 7.146240234375, 8.119140625, 9.092041015625, 10.06494140625, 11.037841796875, 12.0107421875, 12.983642578125, 13.95654296875, 14.929443359375, 15.90234375, 16.875244140625, 17.84814453125, 18.821044921875, 19.7939453125, 20.766845703125, 21.73974609375, 22.712646484375, 23.685546875, 24.658447265625, 25.63134765625, 26.604248046875, 27.5771484375, 28.550048828125, 29.52294921875, 30.495849609375, 31.46875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 6.0, 10.0, 10.0, 13.0, 16.0, 16.0, 19.0, 35.0, 50.0, 47.0, 99.0, 161.0, 284.0, 550.0, 875.0, 781.0, 463.0, 215.0, 116.0, 79.0, 44.0, 29.0, 15.0, 22.0, 23.0, 14.0, 13.0, 6.0, 8.0, 8.0, 13.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.9375, -23.93408203125, -22.9306640625, -21.92724609375, -20.923828125, -19.92041015625, -18.9169921875, -17.91357421875, -16.91015625, -15.90673828125, -14.9033203125, -13.89990234375, -12.896484375, -11.89306640625, -10.8896484375, -9.88623046875, -8.8828125, -7.87939453125, -6.8759765625, -5.87255859375, -4.869140625, -3.86572265625, -2.8623046875, -1.85888671875, -0.85546875, 0.14794921875, 1.1513671875, 2.15478515625, 3.158203125, 4.16162109375, 5.1650390625, 6.16845703125, 7.171875, 8.17529296875, 9.1787109375, 10.18212890625, 11.185546875, 12.18896484375, 13.1923828125, 14.19580078125, 15.19921875, 16.20263671875, 17.2060546875, 18.20947265625, 19.212890625, 20.21630859375, 21.2197265625, 22.22314453125, 23.2265625, 24.22998046875, 25.2333984375, 26.23681640625, 27.240234375, 28.24365234375, 29.2470703125, 30.25048828125, 31.25390625, 32.25732421875, 33.2607421875, 34.26416015625, 35.267578125, 36.27099609375, 37.2744140625, 38.27783203125, 39.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 4.0, 10.0, 10.0, 28.0, 13.0, 23.0, 37.0, 41.0, 93.0, 136.0, 260.0, 463.0, 953.0, 2280.0, 6371.0, 20356.0, 94510.0, 2987260.0, 1000242.0, 57987.0, 14681.0, 4917.0, 1796.0, 805.0, 433.0, 211.0, 121.0, 72.0, 47.0, 33.0, 23.0, 17.0, 11.0, 12.0, 8.0, 10.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-69.375, -67.54296875, -65.7109375, -63.87890625, -62.046875, -60.21484375, -58.3828125, -56.55078125, -54.71875, -52.88671875, -51.0546875, -49.22265625, -47.390625, -45.55859375, -43.7265625, -41.89453125, -40.0625, -38.23046875, -36.3984375, -34.56640625, -32.734375, -30.90234375, -29.0703125, -27.23828125, -25.40625, -23.57421875, -21.7421875, -19.91015625, -18.078125, -16.24609375, -14.4140625, -12.58203125, -10.75, -8.91796875, -7.0859375, -5.25390625, -3.421875, -1.58984375, 0.2421875, 2.07421875, 3.90625, 5.73828125, 7.5703125, 9.40234375, 11.234375, 13.06640625, 14.8984375, 16.73046875, 18.5625, 20.39453125, 22.2265625, 24.05859375, 25.890625, 27.72265625, 29.5546875, 31.38671875, 33.21875, 35.05078125, 36.8828125, 38.71484375, 40.546875, 42.37890625, 44.2109375, 46.04296875, 47.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 23.0, 76.0, 255.0, 426.0, 164.0, 50.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.32477569580078, -72.90100860595703, -61.47724533081055, -50.05348205566406, -38.62971496582031, -27.205947875976562, -15.782188415527344, -4.358421325683594, 7.065345764160156, 18.489110946655273, 29.91287612915039, 41.336639404296875, 52.760406494140625, 64.18417358398438, 75.6079330444336, 87.03170013427734, 98.4554672241211, 109.87923431396484, 121.30299377441406, 132.7267608642578, 144.15052795410156, 155.5742950439453, 166.998046875, 178.42181396484375, 189.8455810546875, 201.26934814453125, 212.693115234375, 224.11688232421875, 235.5406494140625, 246.96441650390625, 258.38818359375, 269.81195068359375, 281.2357177734375, 292.65948486328125, 304.083251953125, 315.50701904296875, 326.9307861328125, 338.35455322265625, 349.7783203125, 361.20208740234375, 372.6258544921875, 384.04962158203125, 395.473388671875, 406.89715576171875, 418.3209228515625, 429.74468994140625, 441.16845703125, 452.59222412109375, 464.0159606933594, 475.4397277832031, 486.8634948730469, 498.2872619628906, 509.7110290527344, 521.134765625, 532.5585327148438, 543.9822998046875, 555.4060668945312, 566.829833984375, 578.2536010742188, 589.6773681640625, 601.1011352539062, 612.52490234375, 623.9486694335938, 635.3724365234375, 646.7962036132812]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 9.0, 7.0, 9.0, 8.0, 5.0, 19.0, 19.0, 23.0, 23.0, 14.0, 28.0, 31.0, 38.0, 30.0, 38.0, 39.0, 35.0, 44.0, 38.0, 42.0, 35.0, 37.0, 41.0, 35.0, 44.0, 39.0, 39.0, 28.0, 30.0, 27.0, 20.0, 17.0, 21.0, 16.0, 18.0, 8.0, 8.0, 15.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-95.60651397705078, -92.955810546875, -90.30509948730469, -87.6543960571289, -85.00369262695312, -82.35298156738281, -79.70227813720703, -77.05157470703125, -74.40086364746094, -71.75016021728516, -69.09944915771484, -66.44874572753906, -63.79804229736328, -61.147335052490234, -58.49662780761719, -55.845924377441406, -53.195220947265625, -50.54451370239258, -47.8938102722168, -45.24310302734375, -42.59239959716797, -39.94169235229492, -37.290985107421875, -34.640281677246094, -31.989574432373047, -29.338869094848633, -26.68816375732422, -24.037456512451172, -21.386751174926758, -18.736045837402344, -16.085338592529297, -13.434633255004883, -10.783920288085938, -8.133214950561523, -5.482508659362793, -2.8318028450012207, -0.18109703063964844, 2.4696083068847656, 5.120314598083496, 7.771020889282227, 10.42172622680664, 13.072431564331055, 15.723137855529785, 18.373844146728516, 21.02454948425293, 23.675254821777344, 26.32596206665039, 28.976667404174805, 31.62737274169922, 34.278079986572266, 36.92878341674805, 39.579490661621094, 42.230194091796875, 44.88090133666992, 47.53160858154297, 50.18231201171875, 52.8330192565918, 55.483726501464844, 58.134429931640625, 60.78513717651367, 63.43584442138672, 66.0865478515625, 68.73725128173828, 71.3879623413086, 74.03866577148438]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 13.0, 14.0, 14.0, 20.0, 20.0, 22.0, 28.0, 27.0, 34.0, 36.0, 48.0, 40.0, 50.0, 61.0, 53.0, 68.0, 47.0, 48.0, 40.0, 38.0, 35.0, 49.0, 19.0, 24.0, 15.0, 19.0, 11.0, 16.0, 7.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3297119140625, -10.003173828125, -9.6766357421875, -9.35009765625, -9.0235595703125, -8.697021484375, -8.3704833984375, -8.0439453125, -7.7174072265625, -7.390869140625, -7.0643310546875, -6.73779296875, -6.4112548828125, -6.084716796875, -5.7581787109375, -5.431640625, -5.1051025390625, -4.778564453125, -4.4520263671875, -4.12548828125, -3.7989501953125, -3.472412109375, -3.1458740234375, -2.8193359375, -2.4927978515625, -2.166259765625, -1.8397216796875, -1.51318359375, -1.1866455078125, -0.860107421875, -0.5335693359375, -0.20703125, 0.1195068359375, 0.446044921875, 0.7725830078125, 1.09912109375, 1.4256591796875, 1.752197265625, 2.0787353515625, 2.4052734375, 2.7318115234375, 3.058349609375, 3.3848876953125, 3.71142578125, 4.0379638671875, 4.364501953125, 4.6910400390625, 5.017578125, 5.3441162109375, 5.670654296875, 5.9971923828125, 6.32373046875, 6.6502685546875, 6.976806640625, 7.3033447265625, 7.6298828125, 7.9564208984375, 8.282958984375, 8.6094970703125, 8.93603515625, 9.2625732421875, 9.589111328125, 9.9156494140625, 10.2421875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 13.0, 16.0, 27.0, 29.0, 48.0, 89.0, 96.0, 133.0, 209.0, 280.0, 407.0, 542.0, 816.0, 1119.0, 1564.0, 2261.0, 3373.0, 4885.0, 7411.0, 11764.0, 18823.0, 30548.0, 52299.0, 90433.0, 154708.0, 229833.0, 177486.0, 103611.0, 60232.0, 35162.0, 21050.0, 13157.0, 8323.0, 5546.0, 3804.0, 2558.0, 1738.0, 1192.0, 809.0, 640.0, 432.0, 297.0, 234.0, 157.0, 122.0, 91.0, 58.0, 38.0, 24.0, 19.0, 21.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1689453125, -1.131988525390625, -1.09503173828125, -1.058074951171875, -1.0211181640625, -0.984161376953125, -0.94720458984375, -0.910247802734375, -0.873291015625, -0.836334228515625, -0.79937744140625, -0.762420654296875, -0.7254638671875, -0.688507080078125, -0.65155029296875, -0.614593505859375, -0.57763671875, -0.540679931640625, -0.50372314453125, -0.466766357421875, -0.4298095703125, -0.392852783203125, -0.35589599609375, -0.318939208984375, -0.281982421875, -0.245025634765625, -0.20806884765625, -0.171112060546875, -0.1341552734375, -0.097198486328125, -0.06024169921875, -0.023284912109375, 0.013671875, 0.050628662109375, 0.08758544921875, 0.124542236328125, 0.1614990234375, 0.198455810546875, 0.23541259765625, 0.272369384765625, 0.309326171875, 0.346282958984375, 0.38323974609375, 0.420196533203125, 0.4571533203125, 0.494110107421875, 0.53106689453125, 0.568023681640625, 0.60498046875, 0.641937255859375, 0.67889404296875, 0.715850830078125, 0.7528076171875, 0.789764404296875, 0.82672119140625, 0.863677978515625, 0.900634765625, 0.937591552734375, 0.97454833984375, 1.011505126953125, 1.0484619140625, 1.085418701171875, 1.12237548828125, 1.159332275390625, 1.1962890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 15.0, 9.0, 8.0, 8.0, 12.0, 20.0, 16.0, 23.0, 25.0, 29.0, 27.0, 39.0, 29.0, 30.0, 48.0, 43.0, 46.0, 36.0, 39.0, 1053.0, 35.0, 48.0, 36.0, 39.0, 43.0, 33.0, 32.0, 27.0, 31.0, 24.0, 16.0, 19.0, 9.0, 15.0, 13.0, 7.0, 6.0, 11.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.62109375, -5.440185546875, -5.25927734375, -5.078369140625, -4.8974609375, -4.716552734375, -4.53564453125, -4.354736328125, -4.173828125, -3.992919921875, -3.81201171875, -3.631103515625, -3.4501953125, -3.269287109375, -3.08837890625, -2.907470703125, -2.7265625, -2.545654296875, -2.36474609375, -2.183837890625, -2.0029296875, -1.822021484375, -1.64111328125, -1.460205078125, -1.279296875, -1.098388671875, -0.91748046875, -0.736572265625, -0.5556640625, -0.374755859375, -0.19384765625, -0.012939453125, 0.16796875, 0.348876953125, 0.52978515625, 0.710693359375, 0.8916015625, 1.072509765625, 1.25341796875, 1.434326171875, 1.615234375, 1.796142578125, 1.97705078125, 2.157958984375, 2.3388671875, 2.519775390625, 2.70068359375, 2.881591796875, 3.0625, 3.243408203125, 3.42431640625, 3.605224609375, 3.7861328125, 3.967041015625, 4.14794921875, 4.328857421875, 4.509765625, 4.690673828125, 4.87158203125, 5.052490234375, 5.2333984375, 5.414306640625, 5.59521484375, 5.776123046875, 5.95703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 8.0, 9.0, 25.0, 30.0, 32.0, 68.0, 108.0, 148.0, 216.0, 342.0, 483.0, 784.0, 1250.0, 1863.0, 3038.0, 4701.0, 7758.0, 12336.0, 20387.0, 33734.0, 58616.0, 101907.0, 171788.0, 1271815.0, 166824.0, 97901.0, 55815.0, 32982.0, 19824.0, 11997.0, 7375.0, 4666.0, 3045.0, 1876.0, 1148.0, 742.0, 502.0, 330.0, 242.0, 137.0, 88.0, 64.0, 39.0, 31.0, 17.0, 13.0, 7.0, 8.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7783203125, -0.7527694702148438, -0.7272186279296875, -0.7016677856445312, -0.676116943359375, -0.6505661010742188, -0.6250152587890625, -0.5994644165039062, -0.57391357421875, -0.5483627319335938, -0.5228118896484375, -0.49726104736328125, -0.471710205078125, -0.44615936279296875, -0.4206085205078125, -0.39505767822265625, -0.3695068359375, -0.34395599365234375, -0.3184051513671875, -0.29285430908203125, -0.267303466796875, -0.24175262451171875, -0.2162017822265625, -0.19065093994140625, -0.16510009765625, -0.13954925537109375, -0.1139984130859375, -0.08844757080078125, -0.062896728515625, -0.03734588623046875, -0.0117950439453125, 0.01375579833984375, 0.039306640625, 0.06485748291015625, 0.0904083251953125, 0.11595916748046875, 0.141510009765625, 0.16706085205078125, 0.1926116943359375, 0.21816253662109375, 0.24371337890625, 0.26926422119140625, 0.2948150634765625, 0.32036590576171875, 0.345916748046875, 0.37146759033203125, 0.3970184326171875, 0.42256927490234375, 0.4481201171875, 0.47367095947265625, 0.4992218017578125, 0.5247726440429688, 0.550323486328125, 0.5758743286132812, 0.6014251708984375, 0.6269760131835938, 0.65252685546875, 0.6780776977539062, 0.7036285400390625, 0.7291793823242188, 0.754730224609375, 0.7802810668945312, 0.8058319091796875, 0.8313827514648438, 0.85693359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 14.0, 16.0, 20.0, 27.0, 24.0, 43.0, 41.0, 48.0, 52.0, 72.0, 80.0, 79.0, 59.0, 70.0, 63.0, 55.0, 34.0, 38.0, 25.0, 19.0, 18.0, 15.0, 11.0, 10.0, 5.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00630950927734375, -0.006094157695770264, -0.005878806114196777, -0.005663454532623291, -0.005448102951049805, -0.005232751369476318, -0.005017399787902832, -0.004802048206329346, -0.004586696624755859, -0.004371345043182373, -0.004155993461608887, -0.0039406418800354, -0.003725290298461914, -0.0035099387168884277, -0.0032945871353149414, -0.003079235553741455, -0.0028638839721679688, -0.0026485323905944824, -0.002433180809020996, -0.0022178292274475098, -0.0020024776458740234, -0.0017871260643005371, -0.0015717744827270508, -0.0013564229011535645, -0.0011410713195800781, -0.0009257197380065918, -0.0007103681564331055, -0.0004950165748596191, -0.0002796649932861328, -6.431341171264648e-05, 0.00015103816986083984, 0.00036638975143432617, 0.0005817413330078125, 0.0007970929145812988, 0.0010124444961547852, 0.0012277960777282715, 0.0014431476593017578, 0.0016584992408752441, 0.0018738508224487305, 0.002089202404022217, 0.002304553985595703, 0.0025199055671691895, 0.0027352571487426758, 0.002950608730316162, 0.0031659603118896484, 0.0033813118934631348, 0.003596663475036621, 0.0038120150566101074, 0.004027366638183594, 0.00424271821975708, 0.004458069801330566, 0.004673421382904053, 0.004888772964477539, 0.005104124546051025, 0.005319476127624512, 0.005534827709197998, 0.005750179290771484, 0.005965530872344971, 0.006180882453918457, 0.006396234035491943, 0.00661158561706543, 0.006826937198638916, 0.007042288780212402, 0.007257640361785889, 0.007472991943359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 11.0, 14.0, 21.0, 29.0, 44.0, 56.0, 76.0, 116.0, 160.0, 280.0, 632.0, 10015.0, 1027356.0, 8335.0, 580.0, 293.0, 141.0, 111.0, 70.0, 56.0, 31.0, 29.0, 31.0, 19.0, 11.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16729354858398438, -0.16197967529296875, -0.15666580200195312, -0.1513519287109375, -0.14603805541992188, -0.14072418212890625, -0.13541030883789062, -0.130096435546875, -0.12478256225585938, -0.11946868896484375, -0.11415481567382812, -0.1088409423828125, -0.10352706909179688, -0.09821319580078125, -0.09289932250976562, -0.08758544921875, -0.08227157592773438, -0.07695770263671875, -0.07164382934570312, -0.0663299560546875, -0.061016082763671875, -0.05570220947265625, -0.050388336181640625, -0.045074462890625, -0.039760589599609375, -0.03444671630859375, -0.029132843017578125, -0.0238189697265625, -0.018505096435546875, -0.01319122314453125, -0.007877349853515625, -0.0025634765625, 0.002750396728515625, 0.00806427001953125, 0.013378143310546875, 0.0186920166015625, 0.024005889892578125, 0.02931976318359375, 0.034633636474609375, 0.039947509765625, 0.045261383056640625, 0.05057525634765625, 0.055889129638671875, 0.0612030029296875, 0.06651687622070312, 0.07183074951171875, 0.07714462280273438, 0.08245849609375, 0.08777236938476562, 0.09308624267578125, 0.09840011596679688, 0.1037139892578125, 0.10902786254882812, 0.11434173583984375, 0.11965560913085938, 0.124969482421875, 0.13028335571289062, 0.13559722900390625, 0.14091110229492188, 0.1462249755859375, 0.15153884887695312, 0.15685272216796875, 0.16216659545898438, 0.16748046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 779.0, 219.0, 8.0, 0.0, 1.0], "bins": [-0.1506684273481369, -0.14814729988574982, -0.14562615752220154, -0.14310503005981445, -0.14058390259742737, -0.13806277513504028, -0.135541632771492, -0.13302050530910492, -0.13049937784671783, -0.12797825038433075, -0.12545710802078247, -0.12293598055839539, -0.1204148530960083, -0.11789371818304062, -0.11537259072065353, -0.11285145580768585, -0.11033032834529877, -0.10780919343233109, -0.105288065969944, -0.10276693105697632, -0.10024580359458923, -0.09772466868162155, -0.09520354121923447, -0.09268240630626678, -0.0901612713932991, -0.08764013648033142, -0.08511900901794434, -0.08259787410497665, -0.08007674664258957, -0.07755561172962189, -0.0750344842672348, -0.07251334935426712, -0.06999222189188004, -0.06747108697891235, -0.06494995951652527, -0.062428828328847885, -0.0599076971411705, -0.05738656595349312, -0.054865434765815735, -0.05234429985284805, -0.04982317239046097, -0.047302041202783585, -0.0447809100151062, -0.04225977882742882, -0.039738647639751434, -0.03721751645207405, -0.03469638526439667, -0.032175250351428986, -0.0296541228890419, -0.027132991701364517, -0.024611860513687134, -0.02209072932600975, -0.019569598138332367, -0.017048466950654984, -0.01452733390033245, -0.012006202712655067, -0.00948507059365511, -0.006963939405977726, -0.004442807752639055, -0.0019216760993003845, 0.0005994550883769989, 0.0031205862760543823, 0.00564171839505434, 0.008162849582731724, 0.010683980770409107]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 1.0, 0.0, 7.0, 5.0, 4.0, 11.0, 9.0, 7.0, 13.0, 16.0, 13.0, 11.0, 19.0, 25.0, 24.0, 33.0, 35.0, 39.0, 25.0, 35.0, 34.0, 33.0, 35.0, 36.0, 35.0, 42.0, 42.0, 36.0, 43.0, 36.0, 24.0, 29.0, 26.0, 32.0, 24.0, 33.0, 16.0, 17.0, 14.0, 14.0, 14.0, 12.0, 11.0, 16.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004801034927368164, -0.004662330262362957, -0.00452362559735775, -0.004384920932352543, -0.004246216267347336, -0.004107511602342129, -0.003968806937336922, -0.0038301022723317146, -0.0036913976073265076, -0.0035526929423213005, -0.0034139882773160934, -0.0032752836123108864, -0.0031365789473056793, -0.0029978742823004723, -0.002859169617295265, -0.002720464952290058, -0.002581760287284851, -0.002443055622279644, -0.002304350957274437, -0.00216564629226923, -0.002026941627264023, -0.0018882369622588158, -0.0017495322972536087, -0.0016108276322484016, -0.0014721229672431946, -0.0013334183022379875, -0.0011947136372327805, -0.0010560089722275734, -0.0009173043072223663, -0.0007785996422171593, -0.0006398949772119522, -0.0005011903122067451, -0.0003624856472015381, -0.00022378098219633102, -8.507631719112396e-05, 5.36283478140831e-05, 0.00019233301281929016, 0.0003310376778244972, 0.0004697423428297043, 0.0006084470078349113, 0.0007471516728401184, 0.0008858563378453255, 0.0010245610028505325, 0.0011632656678557396, 0.0013019703328609467, 0.0014406749978661537, 0.0015793796628713608, 0.0017180843278765678, 0.001856788992881775, 0.001995493657886982, 0.002134198322892189, 0.002272902987897396, 0.002411607652902603, 0.00255031231790781, 0.0026890169829130173, 0.0028277216479182243, 0.0029664263129234314, 0.0031051309779286385, 0.0032438356429338455, 0.0033825403079390526, 0.0035212449729442596, 0.0036599496379494667, 0.0037986543029546738, 0.003937358967959881, 0.004076063632965088]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 13.0, 14.0, 14.0, 20.0, 20.0, 22.0, 28.0, 27.0, 34.0, 36.0, 48.0, 40.0, 50.0, 61.0, 53.0, 68.0, 47.0, 48.0, 40.0, 38.0, 35.0, 49.0, 19.0, 24.0, 15.0, 19.0, 11.0, 16.0, 7.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3297119140625, -10.003173828125, -9.6766357421875, -9.35009765625, -9.0235595703125, -8.697021484375, -8.3704833984375, -8.0439453125, -7.7174072265625, -7.390869140625, -7.0643310546875, -6.73779296875, -6.4112548828125, -6.084716796875, -5.7581787109375, -5.431640625, -5.1051025390625, -4.778564453125, -4.4520263671875, -4.12548828125, -3.7989501953125, -3.472412109375, -3.1458740234375, -2.8193359375, -2.4927978515625, -2.166259765625, -1.8397216796875, -1.51318359375, -1.1866455078125, -0.860107421875, -0.5335693359375, -0.20703125, 0.1195068359375, 0.446044921875, 0.7725830078125, 1.09912109375, 1.4256591796875, 1.752197265625, 2.0787353515625, 2.4052734375, 2.7318115234375, 3.058349609375, 3.3848876953125, 3.71142578125, 4.0379638671875, 4.364501953125, 4.6910400390625, 5.017578125, 5.3441162109375, 5.670654296875, 5.9971923828125, 6.32373046875, 6.6502685546875, 6.976806640625, 7.3033447265625, 7.6298828125, 7.9564208984375, 8.282958984375, 8.6094970703125, 8.93603515625, 9.2625732421875, 9.589111328125, 9.9156494140625, 10.2421875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 9.0, 8.0, 21.0, 27.0, 21.0, 31.0, 52.0, 53.0, 79.0, 97.0, 138.0, 171.0, 229.0, 299.0, 455.0, 617.0, 942.0, 1381.0, 2217.0, 4193.0, 9225.0, 29436.0, 204233.0, 697053.0, 67266.0, 15721.0, 5982.0, 2951.0, 1769.0, 1115.0, 710.0, 518.0, 406.0, 299.0, 205.0, 162.0, 118.0, 65.0, 65.0, 61.0, 38.0, 19.0, 29.0, 14.0, 13.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-13.484375, -13.078857421875, -12.67333984375, -12.267822265625, -11.8623046875, -11.456787109375, -11.05126953125, -10.645751953125, -10.240234375, -9.834716796875, -9.42919921875, -9.023681640625, -8.6181640625, -8.212646484375, -7.80712890625, -7.401611328125, -6.99609375, -6.590576171875, -6.18505859375, -5.779541015625, -5.3740234375, -4.968505859375, -4.56298828125, -4.157470703125, -3.751953125, -3.346435546875, -2.94091796875, -2.535400390625, -2.1298828125, -1.724365234375, -1.31884765625, -0.913330078125, -0.5078125, -0.102294921875, 0.30322265625, 0.708740234375, 1.1142578125, 1.519775390625, 1.92529296875, 2.330810546875, 2.736328125, 3.141845703125, 3.54736328125, 3.952880859375, 4.3583984375, 4.763916015625, 5.16943359375, 5.574951171875, 5.98046875, 6.385986328125, 6.79150390625, 7.197021484375, 7.6025390625, 8.008056640625, 8.41357421875, 8.819091796875, 9.224609375, 9.630126953125, 10.03564453125, 10.441162109375, 10.8466796875, 11.252197265625, 11.65771484375, 12.063232421875, 12.46875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 12.0, 13.0, 17.0, 11.0, 12.0, 13.0, 18.0, 28.0, 27.0, 32.0, 37.0, 35.0, 49.0, 53.0, 68.0, 137.0, 1808.0, 163.0, 83.0, 49.0, 51.0, 38.0, 36.0, 27.0, 33.0, 20.0, 24.0, 26.0, 26.0, 12.0, 12.0, 13.0, 8.0, 6.0, 6.0, 9.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.40625, -36.29248046875, -35.1787109375, -34.06494140625, -32.951171875, -31.83740234375, -30.7236328125, -29.60986328125, -28.49609375, -27.38232421875, -26.2685546875, -25.15478515625, -24.041015625, -22.92724609375, -21.8134765625, -20.69970703125, -19.5859375, -18.47216796875, -17.3583984375, -16.24462890625, -15.130859375, -14.01708984375, -12.9033203125, -11.78955078125, -10.67578125, -9.56201171875, -8.4482421875, -7.33447265625, -6.220703125, -5.10693359375, -3.9931640625, -2.87939453125, -1.765625, -0.65185546875, 0.4619140625, 1.57568359375, 2.689453125, 3.80322265625, 4.9169921875, 6.03076171875, 7.14453125, 8.25830078125, 9.3720703125, 10.48583984375, 11.599609375, 12.71337890625, 13.8271484375, 14.94091796875, 16.0546875, 17.16845703125, 18.2822265625, 19.39599609375, 20.509765625, 21.62353515625, 22.7373046875, 23.85107421875, 24.96484375, 26.07861328125, 27.1923828125, 28.30615234375, 29.419921875, 30.53369140625, 31.6474609375, 32.76123046875, 33.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 7.0, 5.0, 10.0, 14.0, 7.0, 16.0, 21.0, 35.0, 30.0, 31.0, 59.0, 77.0, 103.0, 180.0, 367.0, 1012.0, 4116.0, 94638.0, 3027201.0, 14352.0, 2013.0, 635.0, 265.0, 145.0, 91.0, 59.0, 40.0, 32.0, 19.0, 16.0, 12.0, 19.0, 12.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.34375, -50.61474609375, -48.8857421875, -47.15673828125, -45.427734375, -43.69873046875, -41.9697265625, -40.24072265625, -38.51171875, -36.78271484375, -35.0537109375, -33.32470703125, -31.595703125, -29.86669921875, -28.1376953125, -26.40869140625, -24.6796875, -22.95068359375, -21.2216796875, -19.49267578125, -17.763671875, -16.03466796875, -14.3056640625, -12.57666015625, -10.84765625, -9.11865234375, -7.3896484375, -5.66064453125, -3.931640625, -2.20263671875, -0.4736328125, 1.25537109375, 2.984375, 4.71337890625, 6.4423828125, 8.17138671875, 9.900390625, 11.62939453125, 13.3583984375, 15.08740234375, 16.81640625, 18.54541015625, 20.2744140625, 22.00341796875, 23.732421875, 25.46142578125, 27.1904296875, 28.91943359375, 30.6484375, 32.37744140625, 34.1064453125, 35.83544921875, 37.564453125, 39.29345703125, 41.0224609375, 42.75146484375, 44.48046875, 46.20947265625, 47.9384765625, 49.66748046875, 51.396484375, 53.12548828125, 54.8544921875, 56.58349609375, 58.3125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 95.0, 795.0, 118.0, 3.0], "bins": [-491.91143798828125, -483.9143981933594, -475.9173583984375, -467.9203186035156, -459.92327880859375, -451.92626953125, -443.92919921875, -435.93218994140625, -427.9351501464844, -419.9381103515625, -411.9410705566406, -403.94403076171875, -395.9469909667969, -387.949951171875, -379.95294189453125, -371.9559020996094, -363.9588623046875, -355.9618225097656, -347.96478271484375, -339.9677429199219, -331.970703125, -323.97369384765625, -315.97662353515625, -307.9796142578125, -299.9825439453125, -291.9855041503906, -283.98846435546875, -275.9914245605469, -267.994384765625, -259.99737548828125, -252.0003204345703, -244.00328063964844, -236.0062713623047, -228.0092315673828, -220.01219177246094, -212.01516723632812, -204.01812744140625, -196.02108764648438, -188.0240478515625, -180.02700805664062, -172.02996826171875, -164.03292846679688, -156.035888671875, -148.03884887695312, -140.0418243408203, -132.04478454589844, -124.04774475097656, -116.05070495605469, -108.05368041992188, -100.056640625, -92.05960845947266, -84.06256866455078, -76.06553649902344, -68.06849670410156, -60.07145690917969, -52.07442092895508, -44.07738494873047, -36.08034896850586, -28.083311080932617, -20.086273193359375, -12.089237213134766, -4.092201232910156, 3.9048385620117188, 11.901874542236328, 19.89891242980957]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 7.0, 6.0, 7.0, 12.0, 13.0, 19.0, 14.0, 12.0, 26.0, 20.0, 25.0, 27.0, 30.0, 43.0, 27.0, 30.0, 37.0, 44.0, 40.0, 47.0, 37.0, 36.0, 38.0, 37.0, 32.0, 38.0, 43.0, 24.0, 24.0, 16.0, 22.0, 15.0, 21.0, 21.0, 25.0, 9.0, 11.0, 6.0, 7.0, 9.0, 2.0, 5.0, 6.0, 3.0, 7.0, 5.0, 3.0, 3.0], "bins": [-105.17705535888672, -102.18560028076172, -99.19414520263672, -96.20269012451172, -93.21123504638672, -90.21978759765625, -87.22833251953125, -84.23687744140625, -81.24542236328125, -78.25396728515625, -75.26251220703125, -72.27105712890625, -69.27960205078125, -66.28814697265625, -63.296695709228516, -60.30524444580078, -57.313785552978516, -54.322330474853516, -51.330875396728516, -48.33942413330078, -45.34796905517578, -42.35651397705078, -39.36505889892578, -36.37360382080078, -33.38214874267578, -30.39069366455078, -27.399240493774414, -24.407785415649414, -21.416332244873047, -18.424877166748047, -15.433422088623047, -12.44196891784668, -9.450515747070312, -6.459061622619629, -3.467607021331787, -0.4761524200439453, 2.5153017044067383, 5.506755828857422, 8.498210906982422, 11.489664077758789, 14.481119155883789, 17.47257423400879, 20.464027404785156, 23.455482482910156, 26.446937561035156, 29.438390731811523, 32.429847717285156, 35.42129898071289, 38.41275405883789, 41.40420913696289, 44.39566421508789, 47.387115478515625, 50.378570556640625, 53.370025634765625, 56.361480712890625, 59.352935791015625, 62.344390869140625, 65.33584594726562, 68.32730102539062, 71.31875610351562, 74.31021118164062, 77.30166625976562, 80.29312133789062, 83.2845687866211, 86.2760238647461]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 8.0, 10.0, 11.0, 11.0, 16.0, 17.0, 18.0, 24.0, 18.0, 30.0, 25.0, 31.0, 35.0, 46.0, 46.0, 45.0, 60.0, 59.0, 60.0, 54.0, 40.0, 40.0, 34.0, 44.0, 28.0, 41.0, 19.0, 16.0, 15.0, 14.0, 15.0, 11.0, 12.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3203125, -9.995361328125, -9.67041015625, -9.345458984375, -9.0205078125, -8.695556640625, -8.37060546875, -8.045654296875, -7.720703125, -7.395751953125, -7.07080078125, -6.745849609375, -6.4208984375, -6.095947265625, -5.77099609375, -5.446044921875, -5.12109375, -4.796142578125, -4.47119140625, -4.146240234375, -3.8212890625, -3.496337890625, -3.17138671875, -2.846435546875, -2.521484375, -2.196533203125, -1.87158203125, -1.546630859375, -1.2216796875, -0.896728515625, -0.57177734375, -0.246826171875, 0.078125, 0.403076171875, 0.72802734375, 1.052978515625, 1.3779296875, 1.702880859375, 2.02783203125, 2.352783203125, 2.677734375, 3.002685546875, 3.32763671875, 3.652587890625, 3.9775390625, 4.302490234375, 4.62744140625, 4.952392578125, 5.27734375, 5.602294921875, 5.92724609375, 6.252197265625, 6.5771484375, 6.902099609375, 7.22705078125, 7.552001953125, 7.876953125, 8.201904296875, 8.52685546875, 8.851806640625, 9.1767578125, 9.501708984375, 9.82666015625, 10.151611328125, 10.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 14.0, 22.0, 16.0, 37.0, 48.0, 76.0, 121.0, 228.0, 465.0, 901.0, 2005.0, 4749.0, 13385.0, 96449.0, 3554730.0, 487646.0, 21765.0, 6385.0, 2576.0, 1225.0, 613.0, 291.0, 186.0, 111.0, 62.0, 49.0, 29.0, 21.0, 10.0, 3.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.3125, -43.9267578125, -42.541015625, -41.1552734375, -39.76953125, -38.3837890625, -36.998046875, -35.6123046875, -34.2265625, -32.8408203125, -31.455078125, -30.0693359375, -28.68359375, -27.2978515625, -25.912109375, -24.5263671875, -23.140625, -21.7548828125, -20.369140625, -18.9833984375, -17.59765625, -16.2119140625, -14.826171875, -13.4404296875, -12.0546875, -10.6689453125, -9.283203125, -7.8974609375, -6.51171875, -5.1259765625, -3.740234375, -2.3544921875, -0.96875, 0.4169921875, 1.802734375, 3.1884765625, 4.57421875, 5.9599609375, 7.345703125, 8.7314453125, 10.1171875, 11.5029296875, 12.888671875, 14.2744140625, 15.66015625, 17.0458984375, 18.431640625, 19.8173828125, 21.203125, 22.5888671875, 23.974609375, 25.3603515625, 26.74609375, 28.1318359375, 29.517578125, 30.9033203125, 32.2890625, 33.6748046875, 35.060546875, 36.4462890625, 37.83203125, 39.2177734375, 40.603515625, 41.9892578125, 43.375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 5.0, 10.0, 14.0, 6.0, 9.0, 19.0, 27.0, 25.0, 45.0, 67.0, 95.0, 179.0, 359.0, 641.0, 955.0, 716.0, 364.0, 179.0, 98.0, 57.0, 51.0, 37.0, 21.0, 17.0, 15.0, 11.0, 10.0, 4.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.53173828125, -25.5322265625, -24.53271484375, -23.533203125, -22.53369140625, -21.5341796875, -20.53466796875, -19.53515625, -18.53564453125, -17.5361328125, -16.53662109375, -15.537109375, -14.53759765625, -13.5380859375, -12.53857421875, -11.5390625, -10.53955078125, -9.5400390625, -8.54052734375, -7.541015625, -6.54150390625, -5.5419921875, -4.54248046875, -3.54296875, -2.54345703125, -1.5439453125, -0.54443359375, 0.455078125, 1.45458984375, 2.4541015625, 3.45361328125, 4.453125, 5.45263671875, 6.4521484375, 7.45166015625, 8.451171875, 9.45068359375, 10.4501953125, 11.44970703125, 12.44921875, 13.44873046875, 14.4482421875, 15.44775390625, 16.447265625, 17.44677734375, 18.4462890625, 19.44580078125, 20.4453125, 21.44482421875, 22.4443359375, 23.44384765625, 24.443359375, 25.44287109375, 26.4423828125, 27.44189453125, 28.44140625, 29.44091796875, 30.4404296875, 31.43994140625, 32.439453125, 33.43896484375, 34.4384765625, 35.43798828125, 36.4375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 12.0, 22.0, 24.0, 39.0, 58.0, 76.0, 147.0, 216.0, 327.0, 548.0, 1003.0, 1911.0, 3869.0, 8470.0, 21250.0, 72595.0, 645828.0, 3141900.0, 226295.0, 42455.0, 14481.0, 6234.0, 2890.0, 1534.0, 803.0, 488.0, 269.0, 178.0, 124.0, 64.0, 46.0, 37.0, 22.0, 19.0, 13.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.65625, -36.49072265625, -35.3251953125, -34.15966796875, -32.994140625, -31.82861328125, -30.6630859375, -29.49755859375, -28.33203125, -27.16650390625, -26.0009765625, -24.83544921875, -23.669921875, -22.50439453125, -21.3388671875, -20.17333984375, -19.0078125, -17.84228515625, -16.6767578125, -15.51123046875, -14.345703125, -13.18017578125, -12.0146484375, -10.84912109375, -9.68359375, -8.51806640625, -7.3525390625, -6.18701171875, -5.021484375, -3.85595703125, -2.6904296875, -1.52490234375, -0.359375, 0.80615234375, 1.9716796875, 3.13720703125, 4.302734375, 5.46826171875, 6.6337890625, 7.79931640625, 8.96484375, 10.13037109375, 11.2958984375, 12.46142578125, 13.626953125, 14.79248046875, 15.9580078125, 17.12353515625, 18.2890625, 19.45458984375, 20.6201171875, 21.78564453125, 22.951171875, 24.11669921875, 25.2822265625, 26.44775390625, 27.61328125, 28.77880859375, 29.9443359375, 31.10986328125, 32.275390625, 33.44091796875, 34.6064453125, 35.77197265625, 36.9375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 16.0, 45.0, 62.0, 159.0, 193.0, 211.0, 168.0, 80.0, 36.0, 16.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.83331298828125, -135.94273376464844, -130.05215454101562, -124.16157531738281, -118.27099609375, -112.38041687011719, -106.48983764648438, -100.59925842285156, -94.70867919921875, -88.81809997558594, -82.92752075195312, -77.03694152832031, -71.1463623046875, -65.25578308105469, -59.36520004272461, -53.4746208190918, -47.58403778076172, -41.693458557128906, -35.802879333496094, -29.91229820251465, -24.021718978881836, -18.131139755249023, -12.240558624267578, -6.349979400634766, -0.4594001770019531, 5.431179523468018, 11.321759223937988, 17.212339401245117, 23.10291862487793, 28.993497848510742, 34.88407897949219, 40.774658203125, 46.66523742675781, 52.555816650390625, 58.44639587402344, 64.33697509765625, 70.22755432128906, 76.11813354492188, 82.00871276855469, 87.8992919921875, 93.78987121582031, 99.68045043945312, 105.57102966308594, 111.46160888671875, 117.35218811035156, 123.24276733398438, 129.1333465576172, 135.02392578125, 140.91452026367188, 146.8050994873047, 152.6956787109375, 158.5862579345703, 164.47683715820312, 170.36741638183594, 176.25799560546875, 182.14857482910156, 188.03915405273438, 193.9297332763672, 199.8203125, 205.7108917236328, 211.60147094726562, 217.49205017089844, 223.38262939453125, 229.27320861816406, 235.16378784179688]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 13.0, 7.0, 16.0, 13.0, 19.0, 14.0, 19.0, 18.0, 18.0, 34.0, 40.0, 32.0, 45.0, 34.0, 34.0, 37.0, 34.0, 40.0, 47.0, 45.0, 40.0, 41.0, 35.0, 40.0, 33.0, 26.0, 23.0, 26.0, 28.0, 15.0, 26.0, 19.0, 15.0, 8.0, 11.0, 8.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-76.81509399414062, -74.3446273803711, -71.87415313720703, -69.4036865234375, -66.93321228027344, -64.4627456665039, -61.992279052734375, -59.52180862426758, -57.05133819580078, -54.580867767333984, -52.11039733886719, -49.639930725097656, -47.16946029663086, -44.69898986816406, -42.22852325439453, -39.758052825927734, -37.28758239746094, -34.81711196899414, -32.346641540527344, -29.876174926757812, -27.405704498291016, -24.93523406982422, -22.464765548706055, -19.99429702758789, -17.523826599121094, -15.053357124328613, -12.582887649536133, -10.112418174743652, -7.641948699951172, -5.171479225158691, -2.701009750366211, -0.23054122924804688, 2.23992919921875, 4.7103986740112305, 7.180868148803711, 9.651337623596191, 12.121807098388672, 14.592276573181152, 17.062746047973633, 19.533214569091797, 22.003684997558594, 24.47415542602539, 26.944623947143555, 29.41509246826172, 31.885562896728516, 34.35603332519531, 36.826499938964844, 39.29697036743164, 41.76744079589844, 44.237911224365234, 46.70838165283203, 49.17884826660156, 51.64931869506836, 54.119789123535156, 56.59025573730469, 59.060726165771484, 61.53119659423828, 64.00166320800781, 66.47213745117188, 68.9426040649414, 71.41307067871094, 73.883544921875, 76.35401153564453, 78.82447814941406, 81.29495239257812]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 17.0, 15.0, 22.0, 22.0, 33.0, 27.0, 29.0, 49.0, 37.0, 39.0, 59.0, 56.0, 38.0, 53.0, 58.0, 53.0, 42.0, 35.0, 31.0, 36.0, 26.0, 27.0, 20.0, 24.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.9765625, -9.6607666015625, -9.344970703125, -9.0291748046875, -8.71337890625, -8.3975830078125, -8.081787109375, -7.7659912109375, -7.4501953125, -7.1343994140625, -6.818603515625, -6.5028076171875, -6.18701171875, -5.8712158203125, -5.555419921875, -5.2396240234375, -4.923828125, -4.6080322265625, -4.292236328125, -3.9764404296875, -3.66064453125, -3.3448486328125, -3.029052734375, -2.7132568359375, -2.3974609375, -2.0816650390625, -1.765869140625, -1.4500732421875, -1.13427734375, -0.8184814453125, -0.502685546875, -0.1868896484375, 0.12890625, 0.4447021484375, 0.760498046875, 1.0762939453125, 1.39208984375, 1.7078857421875, 2.023681640625, 2.3394775390625, 2.6552734375, 2.9710693359375, 3.286865234375, 3.6026611328125, 3.91845703125, 4.2342529296875, 4.550048828125, 4.8658447265625, 5.181640625, 5.4974365234375, 5.813232421875, 6.1290283203125, 6.44482421875, 6.7606201171875, 7.076416015625, 7.3922119140625, 7.7080078125, 8.0238037109375, 8.339599609375, 8.6553955078125, 8.97119140625, 9.2869873046875, 9.602783203125, 9.9185791015625, 10.234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 8.0, 8.0, 16.0, 24.0, 30.0, 50.0, 49.0, 56.0, 84.0, 103.0, 211.0, 250.0, 302.0, 435.0, 577.0, 861.0, 1105.0, 1550.0, 2134.0, 2973.0, 4112.0, 5888.0, 8509.0, 12735.0, 19994.0, 31104.0, 49934.0, 81938.0, 130359.0, 186549.0, 178077.0, 120865.0, 74997.0, 46115.0, 28688.0, 18375.0, 11967.0, 7856.0, 5649.0, 3892.0, 2800.0, 1932.0, 1406.0, 1083.0, 807.0, 571.0, 401.0, 300.0, 219.0, 168.0, 131.0, 99.0, 62.0, 53.0, 34.0, 24.0, 18.0, 16.0, 14.0, 4.0, 1.0, 1.0], "bins": [-1.064453125, -1.031097412109375, -0.99774169921875, -0.964385986328125, -0.9310302734375, -0.897674560546875, -0.86431884765625, -0.830963134765625, -0.797607421875, -0.764251708984375, -0.73089599609375, -0.697540283203125, -0.6641845703125, -0.630828857421875, -0.59747314453125, -0.564117431640625, -0.53076171875, -0.497406005859375, -0.46405029296875, -0.430694580078125, -0.3973388671875, -0.363983154296875, -0.33062744140625, -0.297271728515625, -0.263916015625, -0.230560302734375, -0.19720458984375, -0.163848876953125, -0.1304931640625, -0.097137451171875, -0.06378173828125, -0.030426025390625, 0.0029296875, 0.036285400390625, 0.06964111328125, 0.102996826171875, 0.1363525390625, 0.169708251953125, 0.20306396484375, 0.236419677734375, 0.269775390625, 0.303131103515625, 0.33648681640625, 0.369842529296875, 0.4031982421875, 0.436553955078125, 0.46990966796875, 0.503265380859375, 0.53662109375, 0.569976806640625, 0.60333251953125, 0.636688232421875, 0.6700439453125, 0.703399658203125, 0.73675537109375, 0.770111083984375, 0.803466796875, 0.836822509765625, 0.87017822265625, 0.903533935546875, 0.9368896484375, 0.970245361328125, 1.00360107421875, 1.036956787109375, 1.0703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 5.0, 7.0, 15.0, 12.0, 16.0, 13.0, 21.0, 21.0, 20.0, 27.0, 26.0, 21.0, 39.0, 43.0, 41.0, 31.0, 34.0, 49.0, 1062.0, 43.0, 39.0, 44.0, 36.0, 40.0, 27.0, 28.0, 33.0, 26.0, 30.0, 22.0, 18.0, 24.0, 21.0, 17.0, 7.0, 8.0, 9.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.070068359375, -4.89404296875, -4.718017578125, -4.5419921875, -4.365966796875, -4.18994140625, -4.013916015625, -3.837890625, -3.661865234375, -3.48583984375, -3.309814453125, -3.1337890625, -2.957763671875, -2.78173828125, -2.605712890625, -2.4296875, -2.253662109375, -2.07763671875, -1.901611328125, -1.7255859375, -1.549560546875, -1.37353515625, -1.197509765625, -1.021484375, -0.845458984375, -0.66943359375, -0.493408203125, -0.3173828125, -0.141357421875, 0.03466796875, 0.210693359375, 0.38671875, 0.562744140625, 0.73876953125, 0.914794921875, 1.0908203125, 1.266845703125, 1.44287109375, 1.618896484375, 1.794921875, 1.970947265625, 2.14697265625, 2.322998046875, 2.4990234375, 2.675048828125, 2.85107421875, 3.027099609375, 3.203125, 3.379150390625, 3.55517578125, 3.731201171875, 3.9072265625, 4.083251953125, 4.25927734375, 4.435302734375, 4.611328125, 4.787353515625, 4.96337890625, 5.139404296875, 5.3154296875, 5.491455078125, 5.66748046875, 5.843505859375, 6.01953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 13.0, 10.0, 10.0, 19.0, 28.0, 27.0, 59.0, 79.0, 94.0, 165.0, 207.0, 329.0, 421.0, 644.0, 915.0, 1351.0, 2000.0, 2767.0, 4281.0, 6324.0, 9389.0, 13880.0, 20428.0, 30842.0, 46700.0, 71030.0, 107523.0, 152171.0, 1217361.0, 135336.0, 91901.0, 60933.0, 39823.0, 26412.0, 17422.0, 11559.0, 7999.0, 5283.0, 3547.0, 2509.0, 1631.0, 1080.0, 833.0, 545.0, 398.0, 247.0, 168.0, 126.0, 92.0, 70.0, 46.0, 41.0, 17.0, 21.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0], "bins": [-0.64208984375, -0.6222152709960938, -0.6023406982421875, -0.5824661254882812, -0.562591552734375, -0.5427169799804688, -0.5228424072265625, -0.5029678344726562, -0.48309326171875, -0.46321868896484375, -0.4433441162109375, -0.42346954345703125, -0.403594970703125, -0.38372039794921875, -0.3638458251953125, -0.34397125244140625, -0.3240966796875, -0.30422210693359375, -0.2843475341796875, -0.26447296142578125, -0.244598388671875, -0.22472381591796875, -0.2048492431640625, -0.18497467041015625, -0.16510009765625, -0.14522552490234375, -0.1253509521484375, -0.10547637939453125, -0.085601806640625, -0.06572723388671875, -0.0458526611328125, -0.02597808837890625, -0.006103515625, 0.01377105712890625, 0.0336456298828125, 0.05352020263671875, 0.073394775390625, 0.09326934814453125, 0.1131439208984375, 0.13301849365234375, 0.15289306640625, 0.17276763916015625, 0.1926422119140625, 0.21251678466796875, 0.232391357421875, 0.25226593017578125, 0.2721405029296875, 0.29201507568359375, 0.3118896484375, 0.33176422119140625, 0.3516387939453125, 0.37151336669921875, 0.391387939453125, 0.41126251220703125, 0.4311370849609375, 0.45101165771484375, 0.47088623046875, 0.49076080322265625, 0.5106353759765625, 0.5305099487304688, 0.550384521484375, 0.5702590942382812, 0.5901336669921875, 0.6100082397460938, 0.6298828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 9.0, 13.0, 20.0, 20.0, 23.0, 35.0, 48.0, 52.0, 82.0, 102.0, 103.0, 95.0, 69.0, 66.0, 50.0, 27.0, 24.0, 27.0, 17.0, 14.0, 10.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00994110107421875, -0.009652495384216309, -0.009363889694213867, -0.009075284004211426, -0.008786678314208984, -0.008498072624206543, -0.008209466934204102, -0.00792086124420166, -0.007632255554199219, -0.007343649864196777, -0.007055044174194336, -0.0067664384841918945, -0.006477832794189453, -0.006189227104187012, -0.00590062141418457, -0.005612015724182129, -0.0053234100341796875, -0.005034804344177246, -0.004746198654174805, -0.004457592964172363, -0.004168987274169922, -0.0038803815841674805, -0.003591775894165039, -0.0033031702041625977, -0.0030145645141601562, -0.002725958824157715, -0.0024373531341552734, -0.002148747444152832, -0.0018601417541503906, -0.0015715360641479492, -0.0012829303741455078, -0.0009943246841430664, -0.000705718994140625, -0.0004171133041381836, -0.0001285076141357422, 0.00016009807586669922, 0.0004487037658691406, 0.000737309455871582, 0.0010259151458740234, 0.0013145208358764648, 0.0016031265258789062, 0.0018917322158813477, 0.002180337905883789, 0.0024689435958862305, 0.002757549285888672, 0.0030461549758911133, 0.0033347606658935547, 0.003623366355895996, 0.0039119720458984375, 0.004200577735900879, 0.00448918342590332, 0.004777789115905762, 0.005066394805908203, 0.0053550004959106445, 0.005643606185913086, 0.005932211875915527, 0.006220817565917969, 0.00650942325592041, 0.0067980289459228516, 0.007086634635925293, 0.007375240325927734, 0.007663846015930176, 0.007952451705932617, 0.008241057395935059, 0.0085296630859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 5.0, 20.0, 15.0, 19.0, 34.0, 43.0, 75.0, 107.0, 191.0, 285.0, 566.0, 4957.0, 974949.0, 65131.0, 1101.0, 384.0, 222.0, 124.0, 92.0, 60.0, 37.0, 27.0, 20.0, 21.0, 5.0, 9.0, 5.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.17176055908203125, -0.1657867431640625, -0.15981292724609375, -0.153839111328125, -0.14786529541015625, -0.1418914794921875, -0.13591766357421875, -0.12994384765625, -0.12397003173828125, -0.1179962158203125, -0.11202239990234375, -0.106048583984375, -0.10007476806640625, -0.0941009521484375, -0.08812713623046875, -0.0821533203125, -0.07617950439453125, -0.0702056884765625, -0.06423187255859375, -0.058258056640625, -0.05228424072265625, -0.0463104248046875, -0.04033660888671875, -0.03436279296875, -0.02838897705078125, -0.0224151611328125, -0.01644134521484375, -0.010467529296875, -0.00449371337890625, 0.0014801025390625, 0.00745391845703125, 0.013427734375, 0.01940155029296875, 0.0253753662109375, 0.03134918212890625, 0.037322998046875, 0.04329681396484375, 0.0492706298828125, 0.05524444580078125, 0.06121826171875, 0.06719207763671875, 0.0731658935546875, 0.07913970947265625, 0.085113525390625, 0.09108734130859375, 0.0970611572265625, 0.10303497314453125, 0.1090087890625, 0.11498260498046875, 0.1209564208984375, 0.12693023681640625, 0.132904052734375, 0.13887786865234375, 0.1448516845703125, 0.15082550048828125, 0.15679931640625, 0.16277313232421875, 0.1687469482421875, 0.17472076416015625, 0.180694580078125, 0.18666839599609375, 0.1926422119140625, 0.19861602783203125, 0.20458984375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 222.0, 707.0, 71.0, 8.0], "bins": [-0.1481674164533615, -0.14574740827083588, -0.14332741498947144, -0.1409074068069458, -0.13848741352558136, -0.13606740534305573, -0.13364741206169128, -0.13122740387916565, -0.1288074105978012, -0.12638740241527557, -0.12396740913391113, -0.1215474084019661, -0.11912740767002106, -0.11670740693807602, -0.11428740620613098, -0.11186739802360535, -0.10944739729166031, -0.10702739655971527, -0.10460739582777023, -0.1021873950958252, -0.09976739436388016, -0.09734739363193512, -0.09492739289999008, -0.09250739216804504, -0.09008738398551941, -0.08766738325357437, -0.08524738252162933, -0.0828273817896843, -0.08040738105773926, -0.07798738032579422, -0.07556737959384918, -0.07314737141132355, -0.0707273855805397, -0.06830738484859467, -0.06588738411664963, -0.06346738338470459, -0.06104738265275955, -0.058627381920814514, -0.05620737746357918, -0.05378737673163414, -0.0513673759996891, -0.048947375267744064, -0.046527374535799026, -0.04410737380385399, -0.04168736934661865, -0.039267368614673615, -0.03684736788272858, -0.03442736715078354, -0.0320073664188385, -0.029587365686893463, -0.027167364954948425, -0.024747362360358238, -0.0223273616284132, -0.019907360896468163, -0.017487358301877975, -0.015067357569932938, -0.0126473568379879, -0.010227356106042862, -0.0078073544427752495, -0.005387353245168924, -0.002967352047562599, -0.0005473513156175613, 0.0018726503476500511, 0.004292652010917664, 0.006712652742862701]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 6.0, 8.0, 15.0, 8.0, 14.0, 12.0, 20.0, 31.0, 27.0, 29.0, 25.0, 32.0, 41.0, 42.0, 37.0, 34.0, 40.0, 49.0, 41.0, 40.0, 35.0, 37.0, 42.0, 36.0, 39.0, 33.0, 32.0, 26.0, 17.0, 22.0, 23.0, 16.0, 13.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006248652935028076, -0.006037823855876923, -0.005826994776725769, -0.0056161656975746155, -0.005405336618423462, -0.005194507539272308, -0.004983678460121155, -0.004772849380970001, -0.004562020301818848, -0.004351191222667694, -0.0041403621435165405, -0.003929533064365387, -0.0037187039852142334, -0.00350787490606308, -0.0032970458269119263, -0.0030862167477607727, -0.002875387668609619, -0.0026645585894584656, -0.002453729510307312, -0.0022429004311561584, -0.002032071352005005, -0.0018212422728538513, -0.0016104131937026978, -0.0013995841145515442, -0.0011887550354003906, -0.000977925956249237, -0.0007670968770980835, -0.0005562677979469299, -0.00034543871879577637, -0.0001346096396446228, 7.621943950653076e-05, 0.0002870485186576843, 0.0004978775978088379, 0.0007087066769599915, 0.000919535756111145, 0.0011303648352622986, 0.0013411939144134521, 0.0015520229935646057, 0.0017628520727157593, 0.001973681151866913, 0.0021845102310180664, 0.00239533931016922, 0.0026061683893203735, 0.002816997468471527, 0.0030278265476226807, 0.0032386556267738342, 0.003449484705924988, 0.0036603137850761414, 0.003871142864227295, 0.0040819719433784485, 0.004292801022529602, 0.004503630101680756, 0.004714459180831909, 0.004925288259983063, 0.005136117339134216, 0.00534694641828537, 0.0055577754974365234, 0.005768604576587677, 0.005979433655738831, 0.006190262734889984, 0.006401091814041138, 0.006611920893192291, 0.006822749972343445, 0.007033579051494598, 0.007244408130645752]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 17.0, 15.0, 22.0, 22.0, 33.0, 27.0, 29.0, 49.0, 37.0, 39.0, 59.0, 56.0, 38.0, 53.0, 58.0, 52.0, 43.0, 35.0, 31.0, 36.0, 26.0, 27.0, 20.0, 24.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.9765625, -9.6607666015625, -9.344970703125, -9.0291748046875, -8.71337890625, -8.3975830078125, -8.081787109375, -7.7659912109375, -7.4501953125, -7.1343994140625, -6.818603515625, -6.5028076171875, -6.18701171875, -5.8712158203125, -5.555419921875, -5.2396240234375, -4.923828125, -4.6080322265625, -4.292236328125, -3.9764404296875, -3.66064453125, -3.3448486328125, -3.029052734375, -2.7132568359375, -2.3974609375, -2.0816650390625, -1.765869140625, -1.4500732421875, -1.13427734375, -0.8184814453125, -0.502685546875, -0.1868896484375, 0.12890625, 0.4447021484375, 0.760498046875, 1.0762939453125, 1.39208984375, 1.7078857421875, 2.023681640625, 2.3394775390625, 2.6552734375, 2.9710693359375, 3.286865234375, 3.6026611328125, 3.91845703125, 4.2342529296875, 4.550048828125, 4.8658447265625, 5.181640625, 5.4974365234375, 5.813232421875, 6.1290283203125, 6.44482421875, 6.7606201171875, 7.076416015625, 7.3922119140625, 7.7080078125, 8.0238037109375, 8.339599609375, 8.6553955078125, 8.97119140625, 9.2869873046875, 9.602783203125, 9.9185791015625, 10.234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 14.0, 19.0, 23.0, 30.0, 53.0, 76.0, 106.0, 138.0, 214.0, 345.0, 483.0, 774.0, 1219.0, 2003.0, 3761.0, 7378.0, 18414.0, 80399.0, 786125.0, 107586.0, 21218.0, 8221.0, 4052.0, 2163.0, 1294.0, 807.0, 514.0, 346.0, 231.0, 168.0, 104.0, 77.0, 49.0, 33.0, 34.0, 12.0, 16.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.5849609375, -19.888671875, -19.1923828125, -18.49609375, -17.7998046875, -17.103515625, -16.4072265625, -15.7109375, -15.0146484375, -14.318359375, -13.6220703125, -12.92578125, -12.2294921875, -11.533203125, -10.8369140625, -10.140625, -9.4443359375, -8.748046875, -8.0517578125, -7.35546875, -6.6591796875, -5.962890625, -5.2666015625, -4.5703125, -3.8740234375, -3.177734375, -2.4814453125, -1.78515625, -1.0888671875, -0.392578125, 0.3037109375, 1.0, 1.6962890625, 2.392578125, 3.0888671875, 3.78515625, 4.4814453125, 5.177734375, 5.8740234375, 6.5703125, 7.2666015625, 7.962890625, 8.6591796875, 9.35546875, 10.0517578125, 10.748046875, 11.4443359375, 12.140625, 12.8369140625, 13.533203125, 14.2294921875, 14.92578125, 15.6220703125, 16.318359375, 17.0146484375, 17.7109375, 18.4072265625, 19.103515625, 19.7998046875, 20.49609375, 21.1923828125, 21.888671875, 22.5849609375, 23.28125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 6.0, 8.0, 13.0, 20.0, 14.0, 25.0, 21.0, 18.0, 35.0, 31.0, 42.0, 48.0, 56.0, 71.0, 103.0, 282.0, 1604.0, 131.0, 85.0, 60.0, 45.0, 51.0, 45.0, 25.0, 32.0, 21.0, 23.0, 19.0, 19.0, 18.0, 14.0, 5.0, 7.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-40.75, -39.624267578125, -38.49853515625, -37.372802734375, -36.2470703125, -35.121337890625, -33.99560546875, -32.869873046875, -31.744140625, -30.618408203125, -29.49267578125, -28.366943359375, -27.2412109375, -26.115478515625, -24.98974609375, -23.864013671875, -22.73828125, -21.612548828125, -20.48681640625, -19.361083984375, -18.2353515625, -17.109619140625, -15.98388671875, -14.858154296875, -13.732421875, -12.606689453125, -11.48095703125, -10.355224609375, -9.2294921875, -8.103759765625, -6.97802734375, -5.852294921875, -4.7265625, -3.600830078125, -2.47509765625, -1.349365234375, -0.2236328125, 0.902099609375, 2.02783203125, 3.153564453125, 4.279296875, 5.405029296875, 6.53076171875, 7.656494140625, 8.7822265625, 9.907958984375, 11.03369140625, 12.159423828125, 13.28515625, 14.410888671875, 15.53662109375, 16.662353515625, 17.7880859375, 18.913818359375, 20.03955078125, 21.165283203125, 22.291015625, 23.416748046875, 24.54248046875, 25.668212890625, 26.7939453125, 27.919677734375, 29.04541015625, 30.171142578125, 31.296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 9.0, 4.0, 13.0, 24.0, 19.0, 19.0, 18.0, 27.0, 33.0, 51.0, 79.0, 121.0, 234.0, 553.0, 1495.0, 5098.0, 23486.0, 740817.0, 2335068.0, 29638.0, 5904.0, 1712.0, 596.0, 262.0, 110.0, 60.0, 57.0, 29.0, 22.0, 22.0, 14.0, 14.0, 22.0, 10.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875, -46.2275390625, -44.580078125, -42.9326171875, -41.28515625, -39.6376953125, -37.990234375, -36.3427734375, -34.6953125, -33.0478515625, -31.400390625, -29.7529296875, -28.10546875, -26.4580078125, -24.810546875, -23.1630859375, -21.515625, -19.8681640625, -18.220703125, -16.5732421875, -14.92578125, -13.2783203125, -11.630859375, -9.9833984375, -8.3359375, -6.6884765625, -5.041015625, -3.3935546875, -1.74609375, -0.0986328125, 1.548828125, 3.1962890625, 4.84375, 6.4912109375, 8.138671875, 9.7861328125, 11.43359375, 13.0810546875, 14.728515625, 16.3759765625, 18.0234375, 19.6708984375, 21.318359375, 22.9658203125, 24.61328125, 26.2607421875, 27.908203125, 29.5556640625, 31.203125, 32.8505859375, 34.498046875, 36.1455078125, 37.79296875, 39.4404296875, 41.087890625, 42.7353515625, 44.3828125, 46.0302734375, 47.677734375, 49.3251953125, 50.97265625, 52.6201171875, 54.267578125, 55.9150390625, 57.5625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 26.0, 37.0, 77.0, 106.0, 170.0, 207.0, 155.0, 83.0, 66.0, 35.0, 15.0, 14.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.27699279785156, -50.88579177856445, -48.494590759277344, -46.10338592529297, -43.71218490600586, -41.32098388671875, -38.929779052734375, -36.538578033447266, -34.147377014160156, -31.756175994873047, -29.364973068237305, -26.973770141601562, -24.582569122314453, -22.191368103027344, -19.8001651763916, -17.40896224975586, -15.01776123046875, -12.626559257507324, -10.235357284545898, -7.844155311584473, -5.452953338623047, -3.061751365661621, -0.6705493927001953, 1.7206535339355469, 4.111854553222656, 6.503056526184082, 8.894258499145508, 11.285460472106934, 13.67666244506836, 16.06786346435547, 18.45906639099121, 20.850269317626953, 23.241470336914062, 25.632671356201172, 28.023874282836914, 30.415077209472656, 32.806278228759766, 35.197479248046875, 37.58868408203125, 39.97988510131836, 42.37108612060547, 44.76228713989258, 47.15348815917969, 49.54469299316406, 51.93589401245117, 54.32709503173828, 56.718299865722656, 59.109500885009766, 61.500701904296875, 63.891902923583984, 66.2831039428711, 68.67430877685547, 71.06550598144531, 73.45671081542969, 75.84791564941406, 78.23912048339844, 80.63031768798828, 83.02152252197266, 85.4127197265625, 87.80392456054688, 90.19512939453125, 92.5863265991211, 94.97753143310547, 97.36872863769531, 99.75993347167969]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 9.0, 6.0, 14.0, 8.0, 12.0, 12.0, 17.0, 22.0, 27.0, 23.0, 30.0, 20.0, 33.0, 39.0, 40.0, 37.0, 32.0, 35.0, 39.0, 39.0, 37.0, 54.0, 44.0, 33.0, 36.0, 47.0, 27.0, 29.0, 25.0, 28.0, 16.0, 22.0, 21.0, 14.0, 13.0, 8.0, 13.0, 6.0, 5.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-110.80199432373047, -107.41445922851562, -104.02693176269531, -100.63939666748047, -97.25186157226562, -93.86433410644531, -90.47679901123047, -87.08926391601562, -83.70173645019531, -80.31420135498047, -76.92667388916016, -73.53913879394531, -70.15160369873047, -66.76406860351562, -63.37654113769531, -59.98900604248047, -56.601470947265625, -53.21393966674805, -49.8264045715332, -46.438873291015625, -43.05133819580078, -39.6638069152832, -36.276275634765625, -32.88874053955078, -29.501209259033203, -26.113676071166992, -22.72614288330078, -19.338611602783203, -15.951078414916992, -12.563545227050781, -9.176013946533203, -5.788480758666992, -2.4009475708007812, 0.9865851402282715, 4.374117851257324, 7.761650085449219, 11.14918327331543, 14.53671646118164, 17.92424774169922, 21.31178092956543, 24.69931411743164, 28.08684730529785, 31.474380493164062, 34.86191177368164, 38.24944305419922, 41.63697814941406, 45.02450942993164, 48.41204071044922, 51.79957580566406, 55.18710708618164, 58.574642181396484, 61.96217346191406, 65.3497085571289, 68.73724365234375, 72.12477111816406, 75.5123062133789, 78.89984130859375, 82.2873764038086, 85.6749038696289, 89.06243896484375, 92.4499740600586, 95.83750915527344, 99.22503662109375, 102.6125717163086, 106.0000991821289]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 3.0, 4.0, 9.0, 12.0, 12.0, 13.0, 22.0, 13.0, 22.0, 23.0, 34.0, 23.0, 36.0, 31.0, 40.0, 42.0, 56.0, 40.0, 42.0, 53.0, 42.0, 52.0, 50.0, 44.0, 31.0, 33.0, 32.0, 36.0, 25.0, 16.0, 16.0, 14.0, 11.0, 9.0, 5.0, 9.0, 8.0, 6.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.6097412109375, -9.289794921875, -8.9698486328125, -8.64990234375, -8.3299560546875, -8.010009765625, -7.6900634765625, -7.3701171875, -7.0501708984375, -6.730224609375, -6.4102783203125, -6.09033203125, -5.7703857421875, -5.450439453125, -5.1304931640625, -4.810546875, -4.4906005859375, -4.170654296875, -3.8507080078125, -3.53076171875, -3.2108154296875, -2.890869140625, -2.5709228515625, -2.2509765625, -1.9310302734375, -1.611083984375, -1.2911376953125, -0.97119140625, -0.6512451171875, -0.331298828125, -0.0113525390625, 0.30859375, 0.6285400390625, 0.948486328125, 1.2684326171875, 1.58837890625, 1.9083251953125, 2.228271484375, 2.5482177734375, 2.8681640625, 3.1881103515625, 3.508056640625, 3.8280029296875, 4.14794921875, 4.4678955078125, 4.787841796875, 5.1077880859375, 5.427734375, 5.7476806640625, 6.067626953125, 6.3875732421875, 6.70751953125, 7.0274658203125, 7.347412109375, 7.6673583984375, 7.9873046875, 8.3072509765625, 8.627197265625, 8.9471435546875, 9.26708984375, 9.5870361328125, 9.906982421875, 10.2269287109375, 10.546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 11.0, 7.0, 21.0, 25.0, 33.0, 43.0, 65.0, 94.0, 142.0, 224.0, 308.0, 456.0, 677.0, 994.0, 1598.0, 2513.0, 4122.0, 7476.0, 17233.0, 81643.0, 646542.0, 2703633.0, 620354.0, 72907.0, 15806.0, 7021.0, 3642.0, 2226.0, 1425.0, 931.0, 604.0, 433.0, 309.0, 192.0, 155.0, 112.0, 86.0, 60.0, 38.0, 36.0, 26.0, 19.0, 9.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.625, -18.981201171875, -18.33740234375, -17.693603515625, -17.0498046875, -16.406005859375, -15.76220703125, -15.118408203125, -14.474609375, -13.830810546875, -13.18701171875, -12.543212890625, -11.8994140625, -11.255615234375, -10.61181640625, -9.968017578125, -9.32421875, -8.680419921875, -8.03662109375, -7.392822265625, -6.7490234375, -6.105224609375, -5.46142578125, -4.817626953125, -4.173828125, -3.530029296875, -2.88623046875, -2.242431640625, -1.5986328125, -0.954833984375, -0.31103515625, 0.332763671875, 0.9765625, 1.620361328125, 2.26416015625, 2.907958984375, 3.5517578125, 4.195556640625, 4.83935546875, 5.483154296875, 6.126953125, 6.770751953125, 7.41455078125, 8.058349609375, 8.7021484375, 9.345947265625, 9.98974609375, 10.633544921875, 11.27734375, 11.921142578125, 12.56494140625, 13.208740234375, 13.8525390625, 14.496337890625, 15.14013671875, 15.783935546875, 16.427734375, 17.071533203125, 17.71533203125, 18.359130859375, 19.0029296875, 19.646728515625, 20.29052734375, 20.934326171875, 21.578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 15.0, 16.0, 19.0, 25.0, 24.0, 27.0, 49.0, 80.0, 125.0, 188.0, 341.0, 533.0, 714.0, 645.0, 464.0, 275.0, 167.0, 95.0, 62.0, 37.0, 30.0, 20.0, 17.0, 11.0, 7.0, 11.0, 11.0, 13.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.609375, -23.78173828125, -22.9541015625, -22.12646484375, -21.298828125, -20.47119140625, -19.6435546875, -18.81591796875, -17.98828125, -17.16064453125, -16.3330078125, -15.50537109375, -14.677734375, -13.85009765625, -13.0224609375, -12.19482421875, -11.3671875, -10.53955078125, -9.7119140625, -8.88427734375, -8.056640625, -7.22900390625, -6.4013671875, -5.57373046875, -4.74609375, -3.91845703125, -3.0908203125, -2.26318359375, -1.435546875, -0.60791015625, 0.2197265625, 1.04736328125, 1.875, 2.70263671875, 3.5302734375, 4.35791015625, 5.185546875, 6.01318359375, 6.8408203125, 7.66845703125, 8.49609375, 9.32373046875, 10.1513671875, 10.97900390625, 11.806640625, 12.63427734375, 13.4619140625, 14.28955078125, 15.1171875, 15.94482421875, 16.7724609375, 17.60009765625, 18.427734375, 19.25537109375, 20.0830078125, 20.91064453125, 21.73828125, 22.56591796875, 23.3935546875, 24.22119140625, 25.048828125, 25.87646484375, 26.7041015625, 27.53173828125, 28.359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 12.0, 11.0, 25.0, 31.0, 36.0, 71.0, 59.0, 118.0, 228.0, 380.0, 701.0, 1265.0, 2395.0, 4977.0, 11509.0, 31392.0, 130552.0, 1744004.0, 2063849.0, 145910.0, 33916.0, 11978.0, 5285.0, 2528.0, 1280.0, 705.0, 393.0, 243.0, 138.0, 89.0, 56.0, 32.0, 36.0, 17.0, 16.0, 8.0, 6.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -32.787109375, -31.73046875, -30.673828125, -29.6171875, -28.560546875, -27.50390625, -26.447265625, -25.390625, -24.333984375, -23.27734375, -22.220703125, -21.1640625, -20.107421875, -19.05078125, -17.994140625, -16.9375, -15.880859375, -14.82421875, -13.767578125, -12.7109375, -11.654296875, -10.59765625, -9.541015625, -8.484375, -7.427734375, -6.37109375, -5.314453125, -4.2578125, -3.201171875, -2.14453125, -1.087890625, -0.03125, 1.025390625, 2.08203125, 3.138671875, 4.1953125, 5.251953125, 6.30859375, 7.365234375, 8.421875, 9.478515625, 10.53515625, 11.591796875, 12.6484375, 13.705078125, 14.76171875, 15.818359375, 16.875, 17.931640625, 18.98828125, 20.044921875, 21.1015625, 22.158203125, 23.21484375, 24.271484375, 25.328125, 26.384765625, 27.44140625, 28.498046875, 29.5546875, 30.611328125, 31.66796875, 32.724609375, 33.78125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 14.0, 39.0, 92.0, 238.0, 326.0, 186.0, 68.0, 27.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.39427185058594, -103.94099426269531, -95.48771667480469, -87.03443908691406, -78.58116149902344, -70.12788391113281, -61.67461395263672, -53.221336364746094, -44.76805877685547, -36.314781188964844, -27.86150550842285, -19.40822982788086, -10.954952239990234, -2.5016746520996094, 5.95159912109375, 14.404876708984375, 22.858154296875, 31.311431884765625, 39.76470947265625, 48.21798324584961, 56.671260833740234, 65.12454223632812, 73.57781219482422, 82.03108978271484, 90.48436737060547, 98.9376449584961, 107.39092254638672, 115.84419250488281, 124.29747009277344, 132.75074768066406, 141.2040252685547, 149.6573028564453, 158.110595703125, 166.56387329101562, 175.01715087890625, 183.47042846679688, 191.9237060546875, 200.37698364257812, 208.83026123046875, 217.28353881835938, 225.73681640625, 234.19009399414062, 242.64337158203125, 251.09664916992188, 259.5499267578125, 268.0032043457031, 276.45648193359375, 284.9097595214844, 293.363037109375, 301.8163146972656, 310.26959228515625, 318.7228698730469, 327.1761474609375, 335.6294250488281, 344.08270263671875, 352.5359802246094, 360.9892272949219, 369.4425048828125, 377.8957824707031, 386.34906005859375, 394.8023376464844, 403.255615234375, 411.7088928222656, 420.16217041015625, 428.6154479980469]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 9.0, 8.0, 15.0, 11.0, 15.0, 13.0, 15.0, 16.0, 22.0, 26.0, 27.0, 42.0, 40.0, 36.0, 59.0, 43.0, 42.0, 37.0, 28.0, 45.0, 38.0, 37.0, 40.0, 40.0, 32.0, 24.0, 23.0, 27.0, 23.0, 21.0, 15.0, 22.0, 8.0, 17.0, 15.0, 11.0, 8.0, 4.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-81.27159881591797, -78.85063171386719, -76.4296646118164, -74.00869750976562, -71.58773040771484, -69.16676330566406, -66.74579620361328, -64.3248291015625, -61.90386199951172, -59.48289489746094, -57.061927795410156, -54.640960693359375, -52.219993591308594, -49.79902648925781, -47.37805938720703, -44.95709228515625, -42.53612518310547, -40.11515808105469, -37.694190979003906, -35.273223876953125, -32.852256774902344, -30.431289672851562, -28.01032257080078, -25.58935546875, -23.16838836669922, -20.747421264648438, -18.326454162597656, -15.905487060546875, -13.484519958496094, -11.063552856445312, -8.642585754394531, -6.22161865234375, -3.8006591796875, -1.3796920776367188, 1.0412750244140625, 3.4622421264648438, 5.883209228515625, 8.304176330566406, 10.725143432617188, 13.146110534667969, 15.56707763671875, 17.98804473876953, 20.409011840820312, 22.829978942871094, 25.250946044921875, 27.671913146972656, 30.092880249023438, 32.51384735107422, 34.934814453125, 37.35578155517578, 39.77674865722656, 42.197715759277344, 44.618682861328125, 47.039649963378906, 49.46061706542969, 51.88158416748047, 54.30255126953125, 56.72351837158203, 59.14448547363281, 61.565452575683594, 63.986419677734375, 66.40738677978516, 68.82835388183594, 71.24932098388672, 73.6702880859375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 5.0, 13.0, 10.0, 22.0, 19.0, 9.0, 34.0, 26.0, 30.0, 31.0, 31.0, 39.0, 47.0, 49.0, 52.0, 42.0, 54.0, 51.0, 57.0, 47.0, 38.0, 43.0, 33.0, 25.0, 35.0, 22.0, 22.0, 17.0, 15.0, 9.0, 7.0, 7.0, 11.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.291748046875, -9.95068359375, -9.609619140625, -9.2685546875, -8.927490234375, -8.58642578125, -8.245361328125, -7.904296875, -7.563232421875, -7.22216796875, -6.881103515625, -6.5400390625, -6.198974609375, -5.85791015625, -5.516845703125, -5.17578125, -4.834716796875, -4.49365234375, -4.152587890625, -3.8115234375, -3.470458984375, -3.12939453125, -2.788330078125, -2.447265625, -2.106201171875, -1.76513671875, -1.424072265625, -1.0830078125, -0.741943359375, -0.40087890625, -0.059814453125, 0.28125, 0.622314453125, 0.96337890625, 1.304443359375, 1.6455078125, 1.986572265625, 2.32763671875, 2.668701171875, 3.009765625, 3.350830078125, 3.69189453125, 4.032958984375, 4.3740234375, 4.715087890625, 5.05615234375, 5.397216796875, 5.73828125, 6.079345703125, 6.42041015625, 6.761474609375, 7.1025390625, 7.443603515625, 7.78466796875, 8.125732421875, 8.466796875, 8.807861328125, 9.14892578125, 9.489990234375, 9.8310546875, 10.172119140625, 10.51318359375, 10.854248046875, 11.1953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 16.0, 13.0, 19.0, 33.0, 49.0, 78.0, 123.0, 141.0, 261.0, 324.0, 447.0, 664.0, 1081.0, 1525.0, 2186.0, 3410.0, 5137.0, 8130.0, 12706.0, 20750.0, 34848.0, 60252.0, 106765.0, 177581.0, 221964.0, 160500.0, 93472.0, 53665.0, 30789.0, 18759.0, 11553.0, 7221.0, 4651.0, 3023.0, 2059.0, 1446.0, 932.0, 613.0, 420.0, 291.0, 206.0, 135.0, 85.0, 77.0, 45.0, 35.0, 26.0, 18.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.400390625, -1.35577392578125, -1.3111572265625, -1.26654052734375, -1.221923828125, -1.17730712890625, -1.1326904296875, -1.08807373046875, -1.04345703125, -0.99884033203125, -0.9542236328125, -0.90960693359375, -0.864990234375, -0.82037353515625, -0.7757568359375, -0.73114013671875, -0.6865234375, -0.64190673828125, -0.5972900390625, -0.55267333984375, -0.508056640625, -0.46343994140625, -0.4188232421875, -0.37420654296875, -0.32958984375, -0.28497314453125, -0.2403564453125, -0.19573974609375, -0.151123046875, -0.10650634765625, -0.0618896484375, -0.01727294921875, 0.02734375, 0.07196044921875, 0.1165771484375, 0.16119384765625, 0.205810546875, 0.25042724609375, 0.2950439453125, 0.33966064453125, 0.38427734375, 0.42889404296875, 0.4735107421875, 0.51812744140625, 0.562744140625, 0.60736083984375, 0.6519775390625, 0.69659423828125, 0.7412109375, 0.78582763671875, 0.8304443359375, 0.87506103515625, 0.919677734375, 0.96429443359375, 1.0089111328125, 1.05352783203125, 1.09814453125, 1.14276123046875, 1.1873779296875, 1.23199462890625, 1.276611328125, 1.32122802734375, 1.3658447265625, 1.41046142578125, 1.455078125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 4.0, 12.0, 8.0, 15.0, 7.0, 28.0, 15.0, 24.0, 14.0, 24.0, 26.0, 28.0, 30.0, 36.0, 20.0, 32.0, 32.0, 44.0, 38.0, 35.0, 1062.0, 35.0, 44.0, 42.0, 40.0, 21.0, 44.0, 26.0, 21.0, 30.0, 25.0, 17.0, 19.0, 9.0, 15.0, 14.0, 13.0, 13.0, 12.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.2421875, -5.068603515625, -4.89501953125, -4.721435546875, -4.5478515625, -4.374267578125, -4.20068359375, -4.027099609375, -3.853515625, -3.679931640625, -3.50634765625, -3.332763671875, -3.1591796875, -2.985595703125, -2.81201171875, -2.638427734375, -2.46484375, -2.291259765625, -2.11767578125, -1.944091796875, -1.7705078125, -1.596923828125, -1.42333984375, -1.249755859375, -1.076171875, -0.902587890625, -0.72900390625, -0.555419921875, -0.3818359375, -0.208251953125, -0.03466796875, 0.138916015625, 0.3125, 0.486083984375, 0.65966796875, 0.833251953125, 1.0068359375, 1.180419921875, 1.35400390625, 1.527587890625, 1.701171875, 1.874755859375, 2.04833984375, 2.221923828125, 2.3955078125, 2.569091796875, 2.74267578125, 2.916259765625, 3.08984375, 3.263427734375, 3.43701171875, 3.610595703125, 3.7841796875, 3.957763671875, 4.13134765625, 4.304931640625, 4.478515625, 4.652099609375, 4.82568359375, 4.999267578125, 5.1728515625, 5.346435546875, 5.52001953125, 5.693603515625, 5.8671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 17.0, 26.0, 38.0, 53.0, 80.0, 117.0, 175.0, 245.0, 350.0, 546.0, 833.0, 1133.0, 1710.0, 2665.0, 3997.0, 6266.0, 9328.0, 14682.0, 23558.0, 38428.0, 64266.0, 106372.0, 167493.0, 1250008.0, 154798.0, 96498.0, 58432.0, 35348.0, 21287.0, 13352.0, 8643.0, 5403.0, 3800.0, 2292.0, 1647.0, 1062.0, 683.0, 463.0, 310.0, 238.0, 158.0, 78.0, 87.0, 46.0, 35.0, 27.0, 15.0, 12.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.8486328125, -0.8232269287109375, -0.797821044921875, -0.7724151611328125, -0.74700927734375, -0.7216033935546875, -0.696197509765625, -0.6707916259765625, -0.6453857421875, -0.6199798583984375, -0.594573974609375, -0.5691680908203125, -0.54376220703125, -0.5183563232421875, -0.492950439453125, -0.4675445556640625, -0.442138671875, -0.4167327880859375, -0.391326904296875, -0.3659210205078125, -0.34051513671875, -0.3151092529296875, -0.289703369140625, -0.2642974853515625, -0.2388916015625, -0.2134857177734375, -0.188079833984375, -0.1626739501953125, -0.13726806640625, -0.1118621826171875, -0.086456298828125, -0.0610504150390625, -0.03564453125, -0.0102386474609375, 0.015167236328125, 0.0405731201171875, 0.06597900390625, 0.0913848876953125, 0.116790771484375, 0.1421966552734375, 0.1676025390625, 0.1930084228515625, 0.218414306640625, 0.2438201904296875, 0.26922607421875, 0.2946319580078125, 0.320037841796875, 0.3454437255859375, 0.370849609375, 0.3962554931640625, 0.421661376953125, 0.4470672607421875, 0.47247314453125, 0.4978790283203125, 0.523284912109375, 0.5486907958984375, 0.5740966796875, 0.5995025634765625, 0.624908447265625, 0.6503143310546875, 0.67572021484375, 0.7011260986328125, 0.726531982421875, 0.7519378662109375, 0.77734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 11.0, 1.0, 11.0, 8.0, 8.0, 11.0, 16.0, 14.0, 27.0, 28.0, 24.0, 38.0, 54.0, 44.0, 69.0, 103.0, 97.0, 74.0, 71.0, 49.0, 45.0, 31.0, 34.0, 18.0, 15.0, 13.0, 7.0, 7.0, 13.0, 6.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01247406005859375, -0.012099504470825195, -0.01172494888305664, -0.011350393295288086, -0.010975837707519531, -0.010601282119750977, -0.010226726531982422, -0.009852170944213867, -0.009477615356445312, -0.009103059768676758, -0.008728504180908203, -0.008353948593139648, -0.007979393005371094, -0.007604837417602539, -0.007230281829833984, -0.00685572624206543, -0.006481170654296875, -0.00610661506652832, -0.005732059478759766, -0.005357503890991211, -0.004982948303222656, -0.0046083927154541016, -0.004233837127685547, -0.003859281539916992, -0.0034847259521484375, -0.003110170364379883, -0.002735614776611328, -0.0023610591888427734, -0.0019865036010742188, -0.001611948013305664, -0.0012373924255371094, -0.0008628368377685547, -0.00048828125, -0.00011372566223144531, 0.0002608299255371094, 0.0006353855133056641, 0.0010099411010742188, 0.0013844966888427734, 0.0017590522766113281, 0.002133607864379883, 0.0025081634521484375, 0.002882719039916992, 0.003257274627685547, 0.0036318302154541016, 0.004006385803222656, 0.004380941390991211, 0.004755496978759766, 0.00513005256652832, 0.005504608154296875, 0.00587916374206543, 0.006253719329833984, 0.006628274917602539, 0.007002830505371094, 0.0073773860931396484, 0.007751941680908203, 0.008126497268676758, 0.008501052856445312, 0.008875608444213867, 0.009250164031982422, 0.009624719619750977, 0.009999275207519531, 0.010373830795288086, 0.01074838638305664, 0.011122941970825195, 0.01149749755859375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 12.0, 19.0, 15.0, 20.0, 42.0, 53.0, 65.0, 82.0, 123.0, 205.0, 320.0, 981.0, 17788.0, 989723.0, 36567.0, 1465.0, 350.0, 183.0, 149.0, 102.0, 57.0, 43.0, 36.0, 23.0, 24.0, 16.0, 19.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2275390625, -0.2198486328125, -0.212158203125, -0.2044677734375, -0.19677734375, -0.1890869140625, -0.181396484375, -0.1737060546875, -0.166015625, -0.1583251953125, -0.150634765625, -0.1429443359375, -0.13525390625, -0.1275634765625, -0.119873046875, -0.1121826171875, -0.1044921875, -0.0968017578125, -0.089111328125, -0.0814208984375, -0.07373046875, -0.0660400390625, -0.058349609375, -0.0506591796875, -0.04296875, -0.0352783203125, -0.027587890625, -0.0198974609375, -0.01220703125, -0.0045166015625, 0.003173828125, 0.0108642578125, 0.0185546875, 0.0262451171875, 0.033935546875, 0.0416259765625, 0.04931640625, 0.0570068359375, 0.064697265625, 0.0723876953125, 0.080078125, 0.0877685546875, 0.095458984375, 0.1031494140625, 0.11083984375, 0.1185302734375, 0.126220703125, 0.1339111328125, 0.1416015625, 0.1492919921875, 0.156982421875, 0.1646728515625, 0.17236328125, 0.1800537109375, 0.187744140625, 0.1954345703125, 0.203125, 0.2108154296875, 0.218505859375, 0.2261962890625, 0.23388671875, 0.2415771484375, 0.249267578125, 0.2569580078125, 0.2646484375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 25.0, 248.0, 595.0, 125.0, 16.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13521601259708405, -0.1322910189628601, -0.12936602532863617, -0.12644103169441223, -0.12351604551076889, -0.12059105187654495, -0.11766606569290161, -0.11474107205867767, -0.11181607842445374, -0.1088910847902298, -0.10596609860658646, -0.10304110497236252, -0.10011611133813858, -0.09719111770391464, -0.0942661315202713, -0.09134113788604736, -0.08841614425182343, -0.08549115061759949, -0.08256616443395615, -0.07964117079973221, -0.07671617716550827, -0.07379118353128433, -0.07086619734764099, -0.06794120371341705, -0.06501621752977371, -0.06209122762084007, -0.059166233986616135, -0.056241244077682495, -0.05331625044345856, -0.05039126053452492, -0.04746627062559128, -0.04454127699136734, -0.041616279631853104, -0.038691289722919464, -0.035766296088695526, -0.03284130617976189, -0.02991631254553795, -0.02699132263660431, -0.02406633086502552, -0.02114133909344673, -0.018216347321867943, -0.015291355550289154, -0.012366363778710365, -0.009441372938454151, -0.006516381166875362, -0.0035913893952965736, -0.0006663985550403595, 0.0022585932165384293, 0.005183584988117218, 0.008108576759696007, 0.011033568531274796, 0.01395855937153101, 0.016883552074432373, 0.019808541983366013, 0.0227335337549448, 0.02565852552652359, 0.02858351729810238, 0.03150850906968117, 0.03443349897861481, 0.037358492612838745, 0.040283482521772385, 0.04320847615599632, 0.04613346606492996, 0.0490584596991539, 0.05198344960808754]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 14.0, 13.0, 15.0, 23.0, 24.0, 28.0, 40.0, 34.0, 42.0, 21.0, 44.0, 45.0, 41.0, 52.0, 39.0, 48.0, 59.0, 33.0, 42.0, 43.0, 32.0, 31.0, 29.0, 22.0, 25.0, 16.0, 21.0, 15.0, 16.0, 11.0, 11.0, 11.0, 5.0, 5.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0074086785316467285, -0.007179425098001957, -0.006950171664357185, -0.006720918230712414, -0.006491664797067642, -0.006262411363422871, -0.006033157929778099, -0.0058039044961333275, -0.005574651062488556, -0.005345397628843784, -0.005116144195199013, -0.004886890761554241, -0.00465763732790947, -0.004428383894264698, -0.0041991304606199265, -0.003969877026975155, -0.0037406235933303833, -0.0035113701596856117, -0.00328211672604084, -0.0030528632923960686, -0.002823609858751297, -0.0025943564251065254, -0.002365102991461754, -0.0021358495578169823, -0.0019065961241722107, -0.0016773426905274391, -0.0014480892568826675, -0.001218835823237896, -0.0009895823895931244, -0.0007603289559483528, -0.0005310755223035812, -0.00030182208865880966, -7.256865501403809e-05, 0.0001566847786307335, 0.00038593821227550507, 0.0006151916459202766, 0.0008444450795650482, 0.0010736985132098198, 0.0013029519468545914, 0.001532205380499363, 0.0017614588141441345, 0.001990712247788906, 0.0022199656814336777, 0.0024492191150784492, 0.002678472548723221, 0.0029077259823679924, 0.003136979416012764, 0.0033662328496575356, 0.003595486283302307, 0.0038247397169470787, 0.00405399315059185, 0.004283246584236622, 0.004512500017881393, 0.004741753451526165, 0.004971006885170937, 0.005200260318815708, 0.00542951375246048, 0.005658767186105251, 0.005888020619750023, 0.0061172740533947945, 0.006346527487039566, 0.006575780920684338, 0.006805034354329109, 0.007034287787973881, 0.007263541221618652]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 5.0, 13.0, 10.0, 22.0, 18.0, 10.0, 33.0, 26.0, 31.0, 31.0, 31.0, 38.0, 48.0, 49.0, 51.0, 43.0, 54.0, 51.0, 56.0, 48.0, 38.0, 43.0, 33.0, 25.0, 35.0, 22.0, 22.0, 17.0, 15.0, 9.0, 7.0, 7.0, 11.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.2918701171875, -9.950927734375, -9.6099853515625, -9.26904296875, -8.9281005859375, -8.587158203125, -8.2462158203125, -7.9052734375, -7.5643310546875, -7.223388671875, -6.8824462890625, -6.54150390625, -6.2005615234375, -5.859619140625, -5.5186767578125, -5.177734375, -4.8367919921875, -4.495849609375, -4.1549072265625, -3.81396484375, -3.4730224609375, -3.132080078125, -2.7911376953125, -2.4501953125, -2.1092529296875, -1.768310546875, -1.4273681640625, -1.08642578125, -0.7454833984375, -0.404541015625, -0.0635986328125, 0.27734375, 0.6182861328125, 0.959228515625, 1.3001708984375, 1.64111328125, 1.9820556640625, 2.322998046875, 2.6639404296875, 3.0048828125, 3.3458251953125, 3.686767578125, 4.0277099609375, 4.36865234375, 4.7095947265625, 5.050537109375, 5.3914794921875, 5.732421875, 6.0733642578125, 6.414306640625, 6.7552490234375, 7.09619140625, 7.4371337890625, 7.778076171875, 8.1190185546875, 8.4599609375, 8.8009033203125, 9.141845703125, 9.4827880859375, 9.82373046875, 10.1646728515625, 10.505615234375, 10.8465576171875, 11.1875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 7.0, 7.0, 12.0, 23.0, 28.0, 36.0, 39.0, 48.0, 66.0, 113.0, 138.0, 210.0, 236.0, 356.0, 522.0, 730.0, 1045.0, 1615.0, 2536.0, 3978.0, 6383.0, 11465.0, 21668.0, 49421.0, 195198.0, 589794.0, 90840.0, 32837.0, 15684.0, 8782.0, 5080.0, 3160.0, 1953.0, 1376.0, 857.0, 632.0, 438.0, 315.0, 238.0, 179.0, 133.0, 89.0, 61.0, 42.0, 44.0, 31.0, 26.0, 20.0, 14.0, 10.0, 8.0, 11.0, 7.0, 4.0, 1.0, 2.0], "bins": [-19.46875, -18.883544921875, -18.29833984375, -17.713134765625, -17.1279296875, -16.542724609375, -15.95751953125, -15.372314453125, -14.787109375, -14.201904296875, -13.61669921875, -13.031494140625, -12.4462890625, -11.861083984375, -11.27587890625, -10.690673828125, -10.10546875, -9.520263671875, -8.93505859375, -8.349853515625, -7.7646484375, -7.179443359375, -6.59423828125, -6.009033203125, -5.423828125, -4.838623046875, -4.25341796875, -3.668212890625, -3.0830078125, -2.497802734375, -1.91259765625, -1.327392578125, -0.7421875, -0.156982421875, 0.42822265625, 1.013427734375, 1.5986328125, 2.183837890625, 2.76904296875, 3.354248046875, 3.939453125, 4.524658203125, 5.10986328125, 5.695068359375, 6.2802734375, 6.865478515625, 7.45068359375, 8.035888671875, 8.62109375, 9.206298828125, 9.79150390625, 10.376708984375, 10.9619140625, 11.547119140625, 12.13232421875, 12.717529296875, 13.302734375, 13.887939453125, 14.47314453125, 15.058349609375, 15.6435546875, 16.228759765625, 16.81396484375, 17.399169921875, 17.984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 10.0, 6.0, 9.0, 10.0, 14.0, 24.0, 21.0, 22.0, 16.0, 18.0, 37.0, 40.0, 46.0, 55.0, 63.0, 85.0, 150.0, 1478.0, 344.0, 122.0, 89.0, 63.0, 31.0, 41.0, 35.0, 29.0, 27.0, 25.0, 20.0, 26.0, 12.0, 8.0, 16.0, 4.0, 6.0, 15.0, 7.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.65576171875, -32.5302734375, -31.40478515625, -30.279296875, -29.15380859375, -28.0283203125, -26.90283203125, -25.77734375, -24.65185546875, -23.5263671875, -22.40087890625, -21.275390625, -20.14990234375, -19.0244140625, -17.89892578125, -16.7734375, -15.64794921875, -14.5224609375, -13.39697265625, -12.271484375, -11.14599609375, -10.0205078125, -8.89501953125, -7.76953125, -6.64404296875, -5.5185546875, -4.39306640625, -3.267578125, -2.14208984375, -1.0166015625, 0.10888671875, 1.234375, 2.35986328125, 3.4853515625, 4.61083984375, 5.736328125, 6.86181640625, 7.9873046875, 9.11279296875, 10.23828125, 11.36376953125, 12.4892578125, 13.61474609375, 14.740234375, 15.86572265625, 16.9912109375, 18.11669921875, 19.2421875, 20.36767578125, 21.4931640625, 22.61865234375, 23.744140625, 24.86962890625, 25.9951171875, 27.12060546875, 28.24609375, 29.37158203125, 30.4970703125, 31.62255859375, 32.748046875, 33.87353515625, 34.9990234375, 36.12451171875, 37.25]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 11.0, 9.0, 18.0, 20.0, 23.0, 36.0, 52.0, 60.0, 73.0, 115.0, 173.0, 385.0, 1368.0, 6561.0, 59855.0, 2935590.0, 128125.0, 10068.0, 1914.0, 492.0, 268.0, 129.0, 81.0, 58.0, 42.0, 36.0, 28.0, 15.0, 15.0, 14.0, 11.0, 7.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.75, -75.50390625, -73.2578125, -71.01171875, -68.765625, -66.51953125, -64.2734375, -62.02734375, -59.78125, -57.53515625, -55.2890625, -53.04296875, -50.796875, -48.55078125, -46.3046875, -44.05859375, -41.8125, -39.56640625, -37.3203125, -35.07421875, -32.828125, -30.58203125, -28.3359375, -26.08984375, -23.84375, -21.59765625, -19.3515625, -17.10546875, -14.859375, -12.61328125, -10.3671875, -8.12109375, -5.875, -3.62890625, -1.3828125, 0.86328125, 3.109375, 5.35546875, 7.6015625, 9.84765625, 12.09375, 14.33984375, 16.5859375, 18.83203125, 21.078125, 23.32421875, 25.5703125, 27.81640625, 30.0625, 32.30859375, 34.5546875, 36.80078125, 39.046875, 41.29296875, 43.5390625, 45.78515625, 48.03125, 50.27734375, 52.5234375, 54.76953125, 57.015625, 59.26171875, 61.5078125, 63.75390625, 66.0]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 14.0, 73.0, 266.0, 384.0, 186.0, 67.0, 14.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.6368408203125, -361.59356689453125, -354.55029296875, -347.5070495605469, -340.4637756347656, -333.4205017089844, -326.3772277832031, -319.333984375, -312.29071044921875, -305.2474365234375, -298.20416259765625, -291.1609191894531, -284.1176452636719, -277.0743713378906, -270.0310974121094, -262.98785400390625, -255.94456481933594, -248.9012908935547, -241.8580322265625, -234.81475830078125, -227.77149963378906, -220.7282257080078, -213.68496704101562, -206.64169311523438, -199.59841918945312, -192.55514526367188, -185.5118865966797, -178.46861267089844, -171.42535400390625, -164.382080078125, -157.33880615234375, -150.29554748535156, -143.25228881835938, -136.20901489257812, -129.16575622558594, -122.12248229980469, -115.0792236328125, -108.03594970703125, -100.99268341064453, -93.94941711425781, -86.90615844726562, -79.8628921508789, -72.81962585449219, -65.77635192871094, -58.733089447021484, -51.689823150634766, -44.64655303955078, -37.60328674316406, -30.560020446777344, -23.516754150390625, -16.473485946655273, -9.430217742919922, -2.386951446533203, 4.656314849853516, 11.6995849609375, 18.74285125732422, 25.786117553710938, 32.829383850097656, 39.872650146484375, 46.91592025756836, 53.95918655395508, 61.0024528503418, 68.04572296142578, 75.0889892578125, 82.13225555419922]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 13.0, 11.0, 12.0, 13.0, 20.0, 11.0, 23.0, 12.0, 27.0, 38.0, 25.0, 33.0, 43.0, 30.0, 37.0, 34.0, 40.0, 48.0, 47.0, 48.0, 35.0, 27.0, 31.0, 38.0, 38.0, 28.0, 31.0, 29.0, 30.0, 30.0, 22.0, 13.0, 18.0, 12.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.90230560302734, -93.67972564697266, -90.45713806152344, -87.23455810546875, -84.01197814941406, -80.78939819335938, -77.56681823730469, -74.34423065185547, -71.12165069580078, -67.8990707397461, -64.67648315429688, -61.45390319824219, -58.2313232421875, -55.00874328613281, -51.78615951538086, -48.563575744628906, -45.34099578857422, -42.11841583251953, -38.89583206176758, -35.673248291015625, -32.45066833496094, -29.228086471557617, -26.005504608154297, -22.782922744750977, -19.560340881347656, -16.337759017944336, -13.115177154541016, -9.892595291137695, -6.670013427734375, -3.4474315643310547, -0.22484970092773438, 2.997732162475586, 6.2203216552734375, 9.442903518676758, 12.665485382080078, 15.888067245483398, 19.11064910888672, 22.33323097229004, 25.55581283569336, 28.77839469909668, 32.0009765625, 35.22355651855469, 38.44614028930664, 41.668724060058594, 44.89130401611328, 48.11388397216797, 51.33646774291992, 54.559051513671875, 57.78163146972656, 61.00421142578125, 64.22679138183594, 67.44937896728516, 70.67195892333984, 73.89453887939453, 77.11712646484375, 80.33970642089844, 83.56228637695312, 86.78486633300781, 90.0074462890625, 93.23003387451172, 96.4526138305664, 99.6751937866211, 102.89778137207031, 106.120361328125, 109.34294128417969]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 2.0, 8.0, 12.0, 10.0, 18.0, 17.0, 26.0, 21.0, 28.0, 37.0, 35.0, 33.0, 54.0, 37.0, 45.0, 54.0, 50.0, 53.0, 55.0, 53.0, 47.0, 42.0, 35.0, 47.0, 28.0, 24.0, 17.0, 26.0, 14.0, 9.0, 7.0, 9.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.26416015625, -10.8876953125, -10.51123046875, -10.134765625, -9.75830078125, -9.3818359375, -9.00537109375, -8.62890625, -8.25244140625, -7.8759765625, -7.49951171875, -7.123046875, -6.74658203125, -6.3701171875, -5.99365234375, -5.6171875, -5.24072265625, -4.8642578125, -4.48779296875, -4.111328125, -3.73486328125, -3.3583984375, -2.98193359375, -2.60546875, -2.22900390625, -1.8525390625, -1.47607421875, -1.099609375, -0.72314453125, -0.3466796875, 0.02978515625, 0.40625, 0.78271484375, 1.1591796875, 1.53564453125, 1.912109375, 2.28857421875, 2.6650390625, 3.04150390625, 3.41796875, 3.79443359375, 4.1708984375, 4.54736328125, 4.923828125, 5.30029296875, 5.6767578125, 6.05322265625, 6.4296875, 6.80615234375, 7.1826171875, 7.55908203125, 7.935546875, 8.31201171875, 8.6884765625, 9.06494140625, 9.44140625, 9.81787109375, 10.1943359375, 10.57080078125, 10.947265625, 11.32373046875, 11.7001953125, 12.07666015625, 12.453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 14.0, 14.0, 28.0, 36.0, 56.0, 68.0, 93.0, 108.0, 165.0, 234.0, 319.0, 417.0, 573.0, 853.0, 1301.0, 1895.0, 2904.0, 4708.0, 8461.0, 18414.0, 65945.0, 437932.0, 2315248.0, 1121977.0, 155314.0, 29889.0, 11277.0, 5809.0, 3420.0, 2082.0, 1385.0, 942.0, 658.0, 425.0, 350.0, 261.0, 181.0, 110.0, 89.0, 83.0, 58.0, 43.0, 29.0, 27.0, 20.0, 15.0, 11.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.734375, -17.137939453125, -16.54150390625, -15.945068359375, -15.3486328125, -14.752197265625, -14.15576171875, -13.559326171875, -12.962890625, -12.366455078125, -11.77001953125, -11.173583984375, -10.5771484375, -9.980712890625, -9.38427734375, -8.787841796875, -8.19140625, -7.594970703125, -6.99853515625, -6.402099609375, -5.8056640625, -5.209228515625, -4.61279296875, -4.016357421875, -3.419921875, -2.823486328125, -2.22705078125, -1.630615234375, -1.0341796875, -0.437744140625, 0.15869140625, 0.755126953125, 1.3515625, 1.947998046875, 2.54443359375, 3.140869140625, 3.7373046875, 4.333740234375, 4.93017578125, 5.526611328125, 6.123046875, 6.719482421875, 7.31591796875, 7.912353515625, 8.5087890625, 9.105224609375, 9.70166015625, 10.298095703125, 10.89453125, 11.490966796875, 12.08740234375, 12.683837890625, 13.2802734375, 13.876708984375, 14.47314453125, 15.069580078125, 15.666015625, 16.262451171875, 16.85888671875, 17.455322265625, 18.0517578125, 18.648193359375, 19.24462890625, 19.841064453125, 20.4375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 6.0, 20.0, 19.0, 17.0, 29.0, 34.0, 59.0, 95.0, 134.0, 223.0, 332.0, 628.0, 720.0, 645.0, 388.0, 224.0, 134.0, 97.0, 58.0, 43.0, 30.0, 25.0, 19.0, 11.0, 16.0, 9.0, 7.0, 4.0, 8.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.34375, -29.465576171875, -28.58740234375, -27.709228515625, -26.8310546875, -25.952880859375, -25.07470703125, -24.196533203125, -23.318359375, -22.440185546875, -21.56201171875, -20.683837890625, -19.8056640625, -18.927490234375, -18.04931640625, -17.171142578125, -16.29296875, -15.414794921875, -14.53662109375, -13.658447265625, -12.7802734375, -11.902099609375, -11.02392578125, -10.145751953125, -9.267578125, -8.389404296875, -7.51123046875, -6.633056640625, -5.7548828125, -4.876708984375, -3.99853515625, -3.120361328125, -2.2421875, -1.364013671875, -0.48583984375, 0.392333984375, 1.2705078125, 2.148681640625, 3.02685546875, 3.905029296875, 4.783203125, 5.661376953125, 6.53955078125, 7.417724609375, 8.2958984375, 9.174072265625, 10.05224609375, 10.930419921875, 11.80859375, 12.686767578125, 13.56494140625, 14.443115234375, 15.3212890625, 16.199462890625, 17.07763671875, 17.955810546875, 18.833984375, 19.712158203125, 20.59033203125, 21.468505859375, 22.3466796875, 23.224853515625, 24.10302734375, 24.981201171875, 25.859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 3.0, 6.0, 8.0, 16.0, 28.0, 31.0, 57.0, 59.0, 108.0, 148.0, 216.0, 405.0, 678.0, 1199.0, 2273.0, 4266.0, 8707.0, 19847.0, 55775.0, 258609.0, 2553017.0, 1093003.0, 131269.0, 36278.0, 14309.0, 6531.0, 3311.0, 1674.0, 975.0, 549.0, 348.0, 198.0, 123.0, 89.0, 53.0, 32.0, 26.0, 20.0, 11.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.93994140625, -26.0361328125, -25.13232421875, -24.228515625, -23.32470703125, -22.4208984375, -21.51708984375, -20.61328125, -19.70947265625, -18.8056640625, -17.90185546875, -16.998046875, -16.09423828125, -15.1904296875, -14.28662109375, -13.3828125, -12.47900390625, -11.5751953125, -10.67138671875, -9.767578125, -8.86376953125, -7.9599609375, -7.05615234375, -6.15234375, -5.24853515625, -4.3447265625, -3.44091796875, -2.537109375, -1.63330078125, -0.7294921875, 0.17431640625, 1.078125, 1.98193359375, 2.8857421875, 3.78955078125, 4.693359375, 5.59716796875, 6.5009765625, 7.40478515625, 8.30859375, 9.21240234375, 10.1162109375, 11.02001953125, 11.923828125, 12.82763671875, 13.7314453125, 14.63525390625, 15.5390625, 16.44287109375, 17.3466796875, 18.25048828125, 19.154296875, 20.05810546875, 20.9619140625, 21.86572265625, 22.76953125, 23.67333984375, 24.5771484375, 25.48095703125, 26.384765625, 27.28857421875, 28.1923828125, 29.09619140625, 30.0]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 17.0, 39.0, 69.0, 142.0, 244.0, 242.0, 124.0, 64.0, 34.0, 13.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-326.5813293457031, -320.16802978515625, -313.7547302246094, -307.3414306640625, -300.9281311035156, -294.51483154296875, -288.1015319824219, -281.688232421875, -275.2749328613281, -268.86163330078125, -262.4483337402344, -256.0350341796875, -249.62173461914062, -243.20843505859375, -236.79513549804688, -230.38185119628906, -223.96856689453125, -217.55526733398438, -211.1419677734375, -204.72866821289062, -198.31536865234375, -191.90206909179688, -185.48876953125, -179.0754852294922, -172.66217041015625, -166.24887084960938, -159.8355712890625, -153.42227172851562, -147.00897216796875, -140.59567260742188, -134.182373046875, -127.76908874511719, -121.35579681396484, -114.94249725341797, -108.5291976928711, -102.11590576171875, -95.70260620117188, -89.289306640625, -82.87600708007812, -76.46270751953125, -70.04940795898438, -63.6361083984375, -57.22281265258789, -50.809513092041016, -44.396217346191406, -37.98291778564453, -31.569618225097656, -25.156322479248047, -18.743026733398438, -12.329729080200195, -5.916430473327637, 0.4968681335449219, 6.910165786743164, 13.323463439941406, 19.73676300048828, 26.15005874633789, 32.563358306884766, 38.97665786743164, 45.38995361328125, 51.803253173828125, 58.216552734375, 64.62985229492188, 71.04315185546875, 77.4564437866211, 83.86974334716797]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 6.0, 8.0, 11.0, 16.0, 9.0, 18.0, 20.0, 19.0, 21.0, 23.0, 25.0, 29.0, 26.0, 40.0, 37.0, 35.0, 53.0, 51.0, 45.0, 39.0, 46.0, 43.0, 34.0, 37.0, 36.0, 29.0, 36.0, 28.0, 16.0, 24.0, 23.0, 21.0, 12.0, 10.0, 8.0, 14.0, 13.0, 5.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-73.432861328125, -71.07173919677734, -68.71062469482422, -66.34950256347656, -63.988380432128906, -61.627262115478516, -59.266143798828125, -56.90502166748047, -54.54390335083008, -52.18278503417969, -49.82166290283203, -47.46054458618164, -45.09942626953125, -42.738304138183594, -40.3771858215332, -38.01606750488281, -35.654945373535156, -33.293827056884766, -30.93270492553711, -28.57158660888672, -26.210466384887695, -23.849346160888672, -21.48822784423828, -19.127107620239258, -16.765987396240234, -14.404867172241211, -12.043747901916504, -9.682628631591797, -7.321508407592773, -4.96038818359375, -2.599268913269043, -0.23814964294433594, 2.1229705810546875, 4.484090328216553, 6.845210075378418, 9.206329345703125, 11.567449569702148, 13.928569793701172, 16.289688110351562, 18.650808334350586, 21.01192855834961, 23.373048782348633, 25.734169006347656, 28.095287322998047, 30.45640754699707, 32.817527770996094, 35.178646087646484, 37.539764404296875, 39.90088653564453, 42.26200485229492, 44.62312698364258, 46.98424530029297, 49.345367431640625, 51.706485748291016, 54.067604064941406, 56.42872619628906, 58.78984451293945, 61.150962829589844, 63.5120849609375, 65.87320709228516, 68.23432159423828, 70.59544372558594, 72.9565658569336, 75.31768035888672, 77.67880249023438]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 12.0, 6.0, 11.0, 22.0, 28.0, 23.0, 31.0, 43.0, 39.0, 31.0, 49.0, 43.0, 52.0, 48.0, 64.0, 57.0, 56.0, 46.0, 39.0, 39.0, 37.0, 28.0, 32.0, 31.0, 23.0, 19.0, 14.0, 14.0, 10.0, 11.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.280029296875, -9.89599609375, -9.511962890625, -9.1279296875, -8.743896484375, -8.35986328125, -7.975830078125, -7.591796875, -7.207763671875, -6.82373046875, -6.439697265625, -6.0556640625, -5.671630859375, -5.28759765625, -4.903564453125, -4.51953125, -4.135498046875, -3.75146484375, -3.367431640625, -2.9833984375, -2.599365234375, -2.21533203125, -1.831298828125, -1.447265625, -1.063232421875, -0.67919921875, -0.295166015625, 0.0888671875, 0.472900390625, 0.85693359375, 1.240966796875, 1.625, 2.009033203125, 2.39306640625, 2.777099609375, 3.1611328125, 3.545166015625, 3.92919921875, 4.313232421875, 4.697265625, 5.081298828125, 5.46533203125, 5.849365234375, 6.2333984375, 6.617431640625, 7.00146484375, 7.385498046875, 7.76953125, 8.153564453125, 8.53759765625, 8.921630859375, 9.3056640625, 9.689697265625, 10.07373046875, 10.457763671875, 10.841796875, 11.225830078125, 11.60986328125, 11.993896484375, 12.3779296875, 12.761962890625, 13.14599609375, 13.530029296875, 13.9140625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 12.0, 6.0, 19.0, 32.0, 32.0, 41.0, 63.0, 109.0, 193.0, 252.0, 356.0, 526.0, 767.0, 1202.0, 1837.0, 2849.0, 4349.0, 7026.0, 11473.0, 19069.0, 32395.0, 56542.0, 99919.0, 170593.0, 230651.0, 170168.0, 99281.0, 56376.0, 32433.0, 19086.0, 11342.0, 7010.0, 4313.0, 2822.0, 1776.0, 1172.0, 784.0, 529.0, 396.0, 267.0, 163.0, 109.0, 73.0, 41.0, 33.0, 20.0, 17.0, 18.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.634765625, -1.5811614990234375, -1.527557373046875, -1.4739532470703125, -1.42034912109375, -1.3667449951171875, -1.313140869140625, -1.2595367431640625, -1.2059326171875, -1.1523284912109375, -1.098724365234375, -1.0451202392578125, -0.99151611328125, -0.9379119873046875, -0.884307861328125, -0.8307037353515625, -0.777099609375, -0.7234954833984375, -0.669891357421875, -0.6162872314453125, -0.56268310546875, -0.5090789794921875, -0.455474853515625, -0.4018707275390625, -0.3482666015625, -0.2946624755859375, -0.241058349609375, -0.1874542236328125, -0.13385009765625, -0.0802459716796875, -0.026641845703125, 0.0269622802734375, 0.08056640625, 0.1341705322265625, 0.187774658203125, 0.2413787841796875, 0.29498291015625, 0.3485870361328125, 0.402191162109375, 0.4557952880859375, 0.5093994140625, 0.5630035400390625, 0.616607666015625, 0.6702117919921875, 0.72381591796875, 0.7774200439453125, 0.831024169921875, 0.8846282958984375, 0.938232421875, 0.9918365478515625, 1.045440673828125, 1.0990447998046875, 1.15264892578125, 1.2062530517578125, 1.259857177734375, 1.3134613037109375, 1.3670654296875, 1.4206695556640625, 1.474273681640625, 1.5278778076171875, 1.58148193359375, 1.6350860595703125, 1.688690185546875, 1.7422943115234375, 1.7958984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 11.0, 5.0, 7.0, 12.0, 11.0, 16.0, 14.0, 18.0, 16.0, 27.0, 28.0, 40.0, 39.0, 36.0, 42.0, 35.0, 34.0, 41.0, 35.0, 1058.0, 35.0, 36.0, 35.0, 30.0, 48.0, 28.0, 38.0, 27.0, 32.0, 30.0, 18.0, 19.0, 16.0, 20.0, 12.0, 16.0, 10.0, 11.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.69140625, -6.4918212890625, -6.292236328125, -6.0926513671875, -5.89306640625, -5.6934814453125, -5.493896484375, -5.2943115234375, -5.0947265625, -4.8951416015625, -4.695556640625, -4.4959716796875, -4.29638671875, -4.0968017578125, -3.897216796875, -3.6976318359375, -3.498046875, -3.2984619140625, -3.098876953125, -2.8992919921875, -2.69970703125, -2.5001220703125, -2.300537109375, -2.1009521484375, -1.9013671875, -1.7017822265625, -1.502197265625, -1.3026123046875, -1.10302734375, -0.9034423828125, -0.703857421875, -0.5042724609375, -0.3046875, -0.1051025390625, 0.094482421875, 0.2940673828125, 0.49365234375, 0.6932373046875, 0.892822265625, 1.0924072265625, 1.2919921875, 1.4915771484375, 1.691162109375, 1.8907470703125, 2.09033203125, 2.2899169921875, 2.489501953125, 2.6890869140625, 2.888671875, 3.0882568359375, 3.287841796875, 3.4874267578125, 3.68701171875, 3.8865966796875, 4.086181640625, 4.2857666015625, 4.4853515625, 4.6849365234375, 4.884521484375, 5.0841064453125, 5.28369140625, 5.4832763671875, 5.682861328125, 5.8824462890625, 6.08203125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 17.0, 29.0, 33.0, 41.0, 85.0, 120.0, 194.0, 278.0, 403.0, 642.0, 1039.0, 1591.0, 2607.0, 4137.0, 6715.0, 10921.0, 18210.0, 29683.0, 50187.0, 84048.0, 137713.0, 1233394.0, 202355.0, 124209.0, 74867.0, 44609.0, 26636.0, 16153.0, 9844.0, 6025.0, 3853.0, 2333.0, 1487.0, 914.0, 604.0, 404.0, 256.0, 164.0, 108.0, 81.0, 38.0, 37.0, 22.0, 13.0, 8.0, 12.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.91748046875, -0.8877792358398438, -0.8580780029296875, -0.8283767700195312, -0.798675537109375, -0.7689743041992188, -0.7392730712890625, -0.7095718383789062, -0.67987060546875, -0.6501693725585938, -0.6204681396484375, -0.5907669067382812, -0.561065673828125, -0.5313644409179688, -0.5016632080078125, -0.47196197509765625, -0.4422607421875, -0.41255950927734375, -0.3828582763671875, -0.35315704345703125, -0.323455810546875, -0.29375457763671875, -0.2640533447265625, -0.23435211181640625, -0.20465087890625, -0.17494964599609375, -0.1452484130859375, -0.11554718017578125, -0.085845947265625, -0.05614471435546875, -0.0264434814453125, 0.00325775146484375, 0.032958984375, 0.06266021728515625, 0.0923614501953125, 0.12206268310546875, 0.151763916015625, 0.18146514892578125, 0.2111663818359375, 0.24086761474609375, 0.27056884765625, 0.30027008056640625, 0.3299713134765625, 0.35967254638671875, 0.389373779296875, 0.41907501220703125, 0.4487762451171875, 0.47847747802734375, 0.5081787109375, 0.5378799438476562, 0.5675811767578125, 0.5972824096679688, 0.626983642578125, 0.6566848754882812, 0.6863861083984375, 0.7160873413085938, 0.74578857421875, 0.7754898071289062, 0.8051910400390625, 0.8348922729492188, 0.864593505859375, 0.8942947387695312, 0.9239959716796875, 0.9536972045898438, 0.9833984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 3.0, 15.0, 10.0, 12.0, 15.0, 8.0, 32.0, 28.0, 44.0, 56.0, 59.0, 78.0, 95.0, 83.0, 100.0, 82.0, 41.0, 51.0, 36.0, 26.0, 14.0, 14.0, 16.0, 9.0, 10.0, 18.0, 2.0, 4.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01508331298828125, -0.014626264572143555, -0.01416921615600586, -0.013712167739868164, -0.013255119323730469, -0.012798070907592773, -0.012341022491455078, -0.011883974075317383, -0.011426925659179688, -0.010969877243041992, -0.010512828826904297, -0.010055780410766602, -0.009598731994628906, -0.009141683578491211, -0.008684635162353516, -0.00822758674621582, -0.007770538330078125, -0.00731348991394043, -0.006856441497802734, -0.006399393081665039, -0.005942344665527344, -0.0054852962493896484, -0.005028247833251953, -0.004571199417114258, -0.0041141510009765625, -0.003657102584838867, -0.003200054168701172, -0.0027430057525634766, -0.0022859573364257812, -0.001828908920288086, -0.0013718605041503906, -0.0009148120880126953, -0.000457763671875, -7.152557373046875e-07, 0.0004563331604003906, 0.0009133815765380859, 0.0013704299926757812, 0.0018274784088134766, 0.002284526824951172, 0.002741575241088867, 0.0031986236572265625, 0.003655672073364258, 0.004112720489501953, 0.0045697689056396484, 0.005026817321777344, 0.005483865737915039, 0.005940914154052734, 0.00639796257019043, 0.006855010986328125, 0.00731205940246582, 0.007769107818603516, 0.008226156234741211, 0.008683204650878906, 0.009140253067016602, 0.009597301483154297, 0.010054349899291992, 0.010511398315429688, 0.010968446731567383, 0.011425495147705078, 0.011882543563842773, 0.012339591979980469, 0.012796640396118164, 0.01325368881225586, 0.013710737228393555, 0.01416778564453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 12.0, 16.0, 14.0, 18.0, 20.0, 31.0, 40.0, 55.0, 84.0, 113.0, 160.0, 228.0, 472.0, 1412.0, 23985.0, 944489.0, 73329.0, 2556.0, 544.0, 305.0, 183.0, 123.0, 88.0, 66.0, 43.0, 28.0, 29.0, 22.0, 11.0, 9.0, 10.0, 6.0, 8.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24755859375, -0.2399730682373047, -0.23238754272460938, -0.22480201721191406, -0.21721649169921875, -0.20963096618652344, -0.20204544067382812, -0.1944599151611328, -0.1868743896484375, -0.1792888641357422, -0.17170333862304688, -0.16411781311035156, -0.15653228759765625, -0.14894676208496094, -0.14136123657226562, -0.1337757110595703, -0.126190185546875, -0.11860466003417969, -0.11101913452148438, -0.10343360900878906, -0.09584808349609375, -0.08826255798339844, -0.08067703247070312, -0.07309150695800781, -0.0655059814453125, -0.05792045593261719, -0.050334930419921875, -0.04274940490722656, -0.03516387939453125, -0.027578353881835938, -0.019992828369140625, -0.012407302856445312, -0.00482177734375, 0.0027637481689453125, 0.010349273681640625, 0.017934799194335938, 0.02552032470703125, 0.03310585021972656, 0.040691375732421875, 0.04827690124511719, 0.0558624267578125, 0.06344795227050781, 0.07103347778320312, 0.07861900329589844, 0.08620452880859375, 0.09379005432128906, 0.10137557983398438, 0.10896110534667969, 0.116546630859375, 0.12413215637207031, 0.13171768188476562, 0.13930320739746094, 0.14688873291015625, 0.15447425842285156, 0.16205978393554688, 0.1696453094482422, 0.1772308349609375, 0.1848163604736328, 0.19240188598632812, 0.19998741149902344, 0.20757293701171875, 0.21515846252441406, 0.22274398803710938, 0.2303295135498047, 0.2379150390625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 30.0, 60.0, 291.0, 429.0, 127.0, 44.0, 15.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06344835460186005, -0.06029770150780678, -0.05714705213904381, -0.05399639904499054, -0.05084574595093727, -0.047695092856884, -0.04454444348812103, -0.041393790394067764, -0.038243137300014496, -0.03509248420596123, -0.03194183483719826, -0.02879118174314499, -0.02564052864909172, -0.0224898774176836, -0.019339226186275482, -0.016188573092222214, -0.013037923723459244, -0.00988727156072855, -0.0067366198636591434, -0.003585968166589737, -0.0004353160038590431, 0.0027153361588716507, 0.00586598739027977, 0.009016640484333038, 0.012167291715741158, 0.015317943878471851, 0.018468596041202545, 0.021619247272610664, 0.024769898504018784, 0.027920551598072052, 0.03107120282948017, 0.03422185778617859, 0.03737250715494156, 0.04052316024899483, 0.0436738096177578, 0.046824462711811066, 0.049975115805864334, 0.0531257688999176, 0.05627641826868057, 0.05942707136273384, 0.06257772445678711, 0.06572837382555008, 0.06887903064489365, 0.07202968001365662, 0.07518032938241959, 0.07833098620176315, 0.08148163557052612, 0.08463229238986969, 0.08778293430805206, 0.09093358367681503, 0.0940842404961586, 0.09723488986492157, 0.10038553923368454, 0.1035361960530281, 0.10668684542179108, 0.10983750224113464, 0.11298815160989761, 0.11613880097866058, 0.11928945779800415, 0.12244010716676712, 0.1255907565355301, 0.12874141335487366, 0.13189205527305603, 0.1350427120923996, 0.13819336891174316]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 3.0, 3.0, 8.0, 8.0, 9.0, 9.0, 5.0, 9.0, 12.0, 18.0, 28.0, 20.0, 25.0, 30.0, 29.0, 33.0, 32.0, 40.0, 40.0, 50.0, 54.0, 36.0, 46.0, 30.0, 43.0, 38.0, 39.0, 40.0, 30.0, 31.0, 32.0, 24.0, 22.0, 18.0, 11.0, 11.0, 13.0, 17.0, 15.0, 11.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.008916795253753662, -0.00861247070133686, -0.00830814614892006, -0.008003821596503258, -0.007699497044086456, -0.007395172491669655, -0.007090847939252853, -0.006786523386836052, -0.0064821988344192505, -0.006177874282002449, -0.005873549729585648, -0.005569225177168846, -0.005264900624752045, -0.004960576072335243, -0.004656251519918442, -0.00435192696750164, -0.004047602415084839, -0.0037432778626680374, -0.003438953310251236, -0.0031346287578344345, -0.002830304205417633, -0.0025259796530008316, -0.00222165510058403, -0.0019173305481672287, -0.0016130059957504272, -0.0013086814433336258, -0.0010043568909168243, -0.0007000323385000229, -0.00039570778608322144, -9.138323366641998e-05, 0.00021294131875038147, 0.0005172658711671829, 0.0008215904235839844, 0.0011259149760007858, 0.0014302395284175873, 0.0017345640808343887, 0.00203888863325119, 0.0023432131856679916, 0.002647537738084793, 0.0029518622905015945, 0.003256186842918396, 0.0035605113953351974, 0.003864835947751999, 0.0041691605001688, 0.004473485052585602, 0.004777809605002403, 0.005082134157419205, 0.005386458709836006, 0.005690783262252808, 0.005995107814669609, 0.0062994323670864105, 0.006603756919503212, 0.006908081471920013, 0.007212406024336815, 0.007516730576753616, 0.007821055129170418, 0.00812537968158722, 0.00842970423400402, 0.008734028786420822, 0.009038353338837624, 0.009342677891254425, 0.009647002443671227, 0.009951326996088028, 0.01025565154850483, 0.01055997610092163]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 12.0, 6.0, 11.0, 22.0, 28.0, 23.0, 31.0, 43.0, 39.0, 31.0, 49.0, 43.0, 52.0, 48.0, 64.0, 57.0, 56.0, 46.0, 39.0, 39.0, 37.0, 28.0, 32.0, 31.0, 23.0, 19.0, 15.0, 13.0, 10.0, 11.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.280029296875, -9.89599609375, -9.511962890625, -9.1279296875, -8.743896484375, -8.35986328125, -7.975830078125, -7.591796875, -7.207763671875, -6.82373046875, -6.439697265625, -6.0556640625, -5.671630859375, -5.28759765625, -4.903564453125, -4.51953125, -4.135498046875, -3.75146484375, -3.367431640625, -2.9833984375, -2.599365234375, -2.21533203125, -1.831298828125, -1.447265625, -1.063232421875, -0.67919921875, -0.295166015625, 0.0888671875, 0.472900390625, 0.85693359375, 1.240966796875, 1.625, 2.009033203125, 2.39306640625, 2.777099609375, 3.1611328125, 3.545166015625, 3.92919921875, 4.313232421875, 4.697265625, 5.081298828125, 5.46533203125, 5.849365234375, 6.2333984375, 6.617431640625, 7.00146484375, 7.385498046875, 7.76953125, 8.153564453125, 8.53759765625, 8.921630859375, 9.3056640625, 9.689697265625, 10.07373046875, 10.457763671875, 10.841796875, 11.225830078125, 11.60986328125, 11.993896484375, 12.3779296875, 12.761962890625, 13.14599609375, 13.530029296875, 13.9140625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 7.0, 6.0, 15.0, 22.0, 26.0, 37.0, 74.0, 94.0, 133.0, 198.0, 232.0, 370.0, 570.0, 795.0, 1262.0, 1922.0, 2929.0, 4947.0, 8506.0, 16865.0, 46729.0, 496770.0, 386373.0, 42247.0, 16196.0, 8027.0, 4748.0, 2887.0, 1803.0, 1199.0, 810.0, 527.0, 382.0, 245.0, 172.0, 139.0, 93.0, 55.0, 46.0, 30.0, 20.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.447021484375, -20.70654296875, -19.966064453125, -19.2255859375, -18.485107421875, -17.74462890625, -17.004150390625, -16.263671875, -15.523193359375, -14.78271484375, -14.042236328125, -13.3017578125, -12.561279296875, -11.82080078125, -11.080322265625, -10.33984375, -9.599365234375, -8.85888671875, -8.118408203125, -7.3779296875, -6.637451171875, -5.89697265625, -5.156494140625, -4.416015625, -3.675537109375, -2.93505859375, -2.194580078125, -1.4541015625, -0.713623046875, 0.02685546875, 0.767333984375, 1.5078125, 2.248291015625, 2.98876953125, 3.729248046875, 4.4697265625, 5.210205078125, 5.95068359375, 6.691162109375, 7.431640625, 8.172119140625, 8.91259765625, 9.653076171875, 10.3935546875, 11.134033203125, 11.87451171875, 12.614990234375, 13.35546875, 14.095947265625, 14.83642578125, 15.576904296875, 16.3173828125, 17.057861328125, 17.79833984375, 18.538818359375, 19.279296875, 20.019775390625, 20.76025390625, 21.500732421875, 22.2412109375, 22.981689453125, 23.72216796875, 24.462646484375, 25.203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 8.0, 9.0, 8.0, 14.0, 15.0, 25.0, 21.0, 32.0, 26.0, 38.0, 29.0, 43.0, 60.0, 57.0, 70.0, 121.0, 356.0, 1473.0, 146.0, 80.0, 64.0, 43.0, 53.0, 38.0, 44.0, 23.0, 25.0, 31.0, 21.0, 14.0, 12.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.21875, -39.00341796875, -37.7880859375, -36.57275390625, -35.357421875, -34.14208984375, -32.9267578125, -31.71142578125, -30.49609375, -29.28076171875, -28.0654296875, -26.85009765625, -25.634765625, -24.41943359375, -23.2041015625, -21.98876953125, -20.7734375, -19.55810546875, -18.3427734375, -17.12744140625, -15.912109375, -14.69677734375, -13.4814453125, -12.26611328125, -11.05078125, -9.83544921875, -8.6201171875, -7.40478515625, -6.189453125, -4.97412109375, -3.7587890625, -2.54345703125, -1.328125, -0.11279296875, 1.1025390625, 2.31787109375, 3.533203125, 4.74853515625, 5.9638671875, 7.17919921875, 8.39453125, 9.60986328125, 10.8251953125, 12.04052734375, 13.255859375, 14.47119140625, 15.6865234375, 16.90185546875, 18.1171875, 19.33251953125, 20.5478515625, 21.76318359375, 22.978515625, 24.19384765625, 25.4091796875, 26.62451171875, 27.83984375, 29.05517578125, 30.2705078125, 31.48583984375, 32.701171875, 33.91650390625, 35.1318359375, 36.34716796875, 37.5625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 7.0, 4.0, 11.0, 9.0, 12.0, 16.0, 22.0, 21.0, 23.0, 37.0, 53.0, 56.0, 100.0, 138.0, 274.0, 538.0, 2851.0, 27269.0, 2963174.0, 142102.0, 6913.0, 1091.0, 385.0, 179.0, 96.0, 79.0, 58.0, 41.0, 39.0, 29.0, 21.0, 11.0, 12.0, 9.0, 4.0, 1.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -68.419921875, -65.65234375, -62.884765625, -60.1171875, -57.349609375, -54.58203125, -51.814453125, -49.046875, -46.279296875, -43.51171875, -40.744140625, -37.9765625, -35.208984375, -32.44140625, -29.673828125, -26.90625, -24.138671875, -21.37109375, -18.603515625, -15.8359375, -13.068359375, -10.30078125, -7.533203125, -4.765625, -1.998046875, 0.76953125, 3.537109375, 6.3046875, 9.072265625, 11.83984375, 14.607421875, 17.375, 20.142578125, 22.91015625, 25.677734375, 28.4453125, 31.212890625, 33.98046875, 36.748046875, 39.515625, 42.283203125, 45.05078125, 47.818359375, 50.5859375, 53.353515625, 56.12109375, 58.888671875, 61.65625, 64.423828125, 67.19140625, 69.958984375, 72.7265625, 75.494140625, 78.26171875, 81.029296875, 83.796875, 86.564453125, 89.33203125, 92.099609375, 94.8671875, 97.634765625, 100.40234375, 103.169921875, 105.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [6.0, 406.0, 580.0, 19.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.41343307495117, -18.864364624023438, -1.3152961730957031, 16.23377227783203, 33.782840728759766, 51.331912994384766, 68.8809814453125, 86.43003845214844, 103.97911071777344, 121.52818298339844, 139.07723999023438, 156.62631225585938, 174.17538452148438, 191.72445678710938, 209.27352905273438, 226.8225860595703, 244.3716583251953, 261.92071533203125, 279.46978759765625, 297.01885986328125, 314.56793212890625, 332.11700439453125, 349.66607666015625, 367.21514892578125, 384.76422119140625, 402.31329345703125, 419.86236572265625, 437.41143798828125, 454.96051025390625, 472.50958251953125, 490.0586242675781, 507.6076965332031, 525.15673828125, 542.705810546875, 560.2548828125, 577.803955078125, 595.35302734375, 612.902099609375, 630.451171875, 648.000244140625, 665.54931640625, 683.098388671875, 700.6474609375, 718.196533203125, 735.74560546875, 753.294677734375, 770.84375, 788.392822265625, 805.9418334960938, 823.4909057617188, 841.0399780273438, 858.5890502929688, 876.1381225585938, 893.6871948242188, 911.2362670898438, 928.7852783203125, 946.3343505859375, 963.8834228515625, 981.4324951171875, 998.9815673828125, 1016.5306396484375, 1034.0797119140625, 1051.6287841796875, 1069.1778564453125, 1086.7269287109375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 10.0, 9.0, 10.0, 17.0, 23.0, 21.0, 19.0, 30.0, 17.0, 41.0, 32.0, 29.0, 34.0, 44.0, 37.0, 41.0, 44.0, 34.0, 36.0, 38.0, 37.0, 32.0, 38.0, 38.0, 36.0, 30.0, 22.0, 26.0, 31.0, 15.0, 13.0, 19.0, 14.0, 15.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.92601013183594, -78.16325378417969, -75.4004898071289, -72.63773345947266, -69.8749771118164, -67.11221313476562, -64.34945678710938, -61.58669662475586, -58.823936462402344, -56.06117630004883, -53.29841995239258, -50.53565979003906, -47.77289962768555, -45.01013946533203, -42.24738311767578, -39.484622955322266, -36.721866607666016, -33.9591064453125, -31.196348190307617, -28.433589935302734, -25.67082977294922, -22.908071517944336, -20.145313262939453, -17.382553100585938, -14.619794845581055, -11.857035636901855, -9.094276428222656, -6.331518173217773, -3.568758964538574, -0.805999755859375, 1.9567584991455078, 4.719518661499023, 7.482276916503906, 10.245036125183105, 13.007795333862305, 15.770553588867188, 18.533313751220703, 21.296072006225586, 24.05883026123047, 26.821590423583984, 29.584348678588867, 32.34710693359375, 35.109867095947266, 37.87262725830078, 40.63538360595703, 43.39814376831055, 46.16090393066406, 48.92366027832031, 51.68642044067383, 54.449180603027344, 57.211936950683594, 59.97469711303711, 62.737457275390625, 65.50021362304688, 68.26296997070312, 71.0257339477539, 73.78849029541016, 76.5512466430664, 79.31401062011719, 82.07676696777344, 84.83952331542969, 87.60228729248047, 90.36504364013672, 93.1278076171875, 95.89056396484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 13.0, 13.0, 20.0, 28.0, 24.0, 27.0, 24.0, 32.0, 47.0, 47.0, 42.0, 44.0, 49.0, 49.0, 42.0, 45.0, 50.0, 50.0, 41.0, 42.0, 36.0, 30.0, 25.0, 25.0, 18.0, 26.0, 15.0, 16.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.81494140625, -9.4423828125, -9.06982421875, -8.697265625, -8.32470703125, -7.9521484375, -7.57958984375, -7.20703125, -6.83447265625, -6.4619140625, -6.08935546875, -5.716796875, -5.34423828125, -4.9716796875, -4.59912109375, -4.2265625, -3.85400390625, -3.4814453125, -3.10888671875, -2.736328125, -2.36376953125, -1.9912109375, -1.61865234375, -1.24609375, -0.87353515625, -0.5009765625, -0.12841796875, 0.244140625, 0.61669921875, 0.9892578125, 1.36181640625, 1.734375, 2.10693359375, 2.4794921875, 2.85205078125, 3.224609375, 3.59716796875, 3.9697265625, 4.34228515625, 4.71484375, 5.08740234375, 5.4599609375, 5.83251953125, 6.205078125, 6.57763671875, 6.9501953125, 7.32275390625, 7.6953125, 8.06787109375, 8.4404296875, 8.81298828125, 9.185546875, 9.55810546875, 9.9306640625, 10.30322265625, 10.67578125, 11.04833984375, 11.4208984375, 11.79345703125, 12.166015625, 12.53857421875, 12.9111328125, 13.28369140625, 13.65625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 12.0, 17.0, 19.0, 15.0, 38.0, 43.0, 49.0, 87.0, 130.0, 184.0, 332.0, 742.0, 1738.0, 4852.0, 18097.0, 293602.0, 3677399.0, 174743.0, 14862.0, 4123.0, 1531.0, 693.0, 352.0, 177.0, 121.0, 70.0, 50.0, 46.0, 42.0, 20.0, 17.0, 12.0, 14.0, 11.0, 2.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.0439453125, -35.587890625, -34.1318359375, -32.67578125, -31.2197265625, -29.763671875, -28.3076171875, -26.8515625, -25.3955078125, -23.939453125, -22.4833984375, -21.02734375, -19.5712890625, -18.115234375, -16.6591796875, -15.203125, -13.7470703125, -12.291015625, -10.8349609375, -9.37890625, -7.9228515625, -6.466796875, -5.0107421875, -3.5546875, -2.0986328125, -0.642578125, 0.8134765625, 2.26953125, 3.7255859375, 5.181640625, 6.6376953125, 8.09375, 9.5498046875, 11.005859375, 12.4619140625, 13.91796875, 15.3740234375, 16.830078125, 18.2861328125, 19.7421875, 21.1982421875, 22.654296875, 24.1103515625, 25.56640625, 27.0224609375, 28.478515625, 29.9345703125, 31.390625, 32.8466796875, 34.302734375, 35.7587890625, 37.21484375, 38.6708984375, 40.126953125, 41.5830078125, 43.0390625, 44.4951171875, 45.951171875, 47.4072265625, 48.86328125, 50.3193359375, 51.775390625, 53.2314453125, 54.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 12.0, 18.0, 15.0, 27.0, 36.0, 59.0, 71.0, 116.0, 226.0, 470.0, 798.0, 862.0, 573.0, 327.0, 150.0, 95.0, 48.0, 44.0, 31.0, 16.0, 17.0, 18.0, 9.0, 5.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.21875, -36.162109375, -35.10546875, -34.048828125, -32.9921875, -31.935546875, -30.87890625, -29.822265625, -28.765625, -27.708984375, -26.65234375, -25.595703125, -24.5390625, -23.482421875, -22.42578125, -21.369140625, -20.3125, -19.255859375, -18.19921875, -17.142578125, -16.0859375, -15.029296875, -13.97265625, -12.916015625, -11.859375, -10.802734375, -9.74609375, -8.689453125, -7.6328125, -6.576171875, -5.51953125, -4.462890625, -3.40625, -2.349609375, -1.29296875, -0.236328125, 0.8203125, 1.876953125, 2.93359375, 3.990234375, 5.046875, 6.103515625, 7.16015625, 8.216796875, 9.2734375, 10.330078125, 11.38671875, 12.443359375, 13.5, 14.556640625, 15.61328125, 16.669921875, 17.7265625, 18.783203125, 19.83984375, 20.896484375, 21.953125, 23.009765625, 24.06640625, 25.123046875, 26.1796875, 27.236328125, 28.29296875, 29.349609375, 30.40625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 4.0, 5.0, 16.0, 17.0, 21.0, 28.0, 50.0, 81.0, 174.0, 359.0, 1298.0, 6394.0, 59653.0, 3768926.0, 337473.0, 15974.0, 2625.0, 652.0, 224.0, 109.0, 69.0, 37.0, 20.0, 27.0, 11.0, 9.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.0625, -75.4365234375, -72.810546875, -70.1845703125, -67.55859375, -64.9326171875, -62.306640625, -59.6806640625, -57.0546875, -54.4287109375, -51.802734375, -49.1767578125, -46.55078125, -43.9248046875, -41.298828125, -38.6728515625, -36.046875, -33.4208984375, -30.794921875, -28.1689453125, -25.54296875, -22.9169921875, -20.291015625, -17.6650390625, -15.0390625, -12.4130859375, -9.787109375, -7.1611328125, -4.53515625, -1.9091796875, 0.716796875, 3.3427734375, 5.96875, 8.5947265625, 11.220703125, 13.8466796875, 16.47265625, 19.0986328125, 21.724609375, 24.3505859375, 26.9765625, 29.6025390625, 32.228515625, 34.8544921875, 37.48046875, 40.1064453125, 42.732421875, 45.3583984375, 47.984375, 50.6103515625, 53.236328125, 55.8623046875, 58.48828125, 61.1142578125, 63.740234375, 66.3662109375, 68.9921875, 71.6181640625, 74.244140625, 76.8701171875, 79.49609375, 82.1220703125, 84.748046875, 87.3740234375, 90.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 46.0, 118.0, 283.0, 339.0, 150.0, 40.0, 15.0, 9.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-380.7870178222656, -370.51727294921875, -360.2475280761719, -349.977783203125, -339.7080383300781, -329.43829345703125, -319.1685485839844, -308.8988037109375, -298.6290588378906, -288.35931396484375, -278.0895690917969, -267.81982421875, -257.5500793457031, -247.28033447265625, -237.01058959960938, -226.7408447265625, -216.47108459472656, -206.2013397216797, -195.9315948486328, -185.66184997558594, -175.39210510253906, -165.1223602294922, -154.85260009765625, -144.58285522460938, -134.3131103515625, -124.04336547851562, -113.77362060546875, -103.50387573242188, -93.234130859375, -82.96438598632812, -72.69463348388672, -62.424888610839844, -52.1551513671875, -41.885406494140625, -31.615659713745117, -21.34591293334961, -11.076168060302734, -0.8064231872558594, 9.463325500488281, 19.733070373535156, 30.00281524658203, 40.272560119628906, 50.54230499267578, 60.81205368041992, 71.08180236816406, 81.35154724121094, 91.62129211425781, 101.89103698730469, 112.16078186035156, 122.43052673339844, 132.7002716064453, 142.9700164794922, 153.23976135253906, 163.50950622558594, 173.77926635742188, 184.04901123046875, 194.31875610351562, 204.5885009765625, 214.85824584960938, 225.12799072265625, 235.39773559570312, 245.66748046875, 255.93722534179688, 266.20697021484375, 276.4767150878906]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 5.0, 13.0, 16.0, 13.0, 15.0, 21.0, 19.0, 23.0, 21.0, 24.0, 21.0, 31.0, 23.0, 28.0, 30.0, 31.0, 36.0, 34.0, 34.0, 35.0, 23.0, 32.0, 39.0, 32.0, 40.0, 30.0, 25.0, 38.0, 27.0, 20.0, 16.0, 24.0, 19.0, 30.0, 25.0, 17.0, 15.0, 6.0, 16.0, 8.0, 4.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-69.30131530761719, -67.17257690429688, -65.04383850097656, -62.915096282958984, -60.786354064941406, -58.657615661621094, -56.52887725830078, -54.40013885498047, -52.27139663696289, -50.14265823364258, -48.013916015625, -45.88517761230469, -43.756439208984375, -41.6276969909668, -39.498958587646484, -37.370216369628906, -35.241477966308594, -33.11273956298828, -30.983997344970703, -28.85525894165039, -26.726518630981445, -24.5977783203125, -22.469039916992188, -20.340299606323242, -18.211559295654297, -16.08281898498535, -13.954079627990723, -11.825340270996094, -9.696599960327148, -7.567859649658203, -5.439120292663574, -3.3103809356689453, -1.1816329956054688, 0.9471068382263184, 3.0758466720581055, 5.204586505889893, 7.33332633972168, 9.462066650390625, 11.590806007385254, 13.719545364379883, 15.848285675048828, 17.977025985717773, 20.10576629638672, 22.23450469970703, 24.363245010375977, 26.491985321044922, 28.620723724365234, 30.74946403503418, 32.878204345703125, 35.00694274902344, 37.135684967041016, 39.26442337036133, 41.393165588378906, 43.52190399169922, 45.65064239501953, 47.779380798339844, 49.90812301635742, 52.036861419677734, 54.16560363769531, 56.294342041015625, 58.42308044433594, 60.551822662353516, 62.68056106567383, 64.8093032836914, 66.93804168701172]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 26.0, 38.0, 33.0, 34.0, 49.0, 59.0, 50.0, 45.0, 55.0, 55.0, 57.0, 52.0, 50.0, 30.0, 43.0, 32.0, 33.0, 30.0, 23.0, 15.0, 17.0, 14.0, 11.0, 7.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5113525390625, -11.108642578125, -10.7059326171875, -10.30322265625, -9.9005126953125, -9.497802734375, -9.0950927734375, -8.6923828125, -8.2896728515625, -7.886962890625, -7.4842529296875, -7.08154296875, -6.6788330078125, -6.276123046875, -5.8734130859375, -5.470703125, -5.0679931640625, -4.665283203125, -4.2625732421875, -3.85986328125, -3.4571533203125, -3.054443359375, -2.6517333984375, -2.2490234375, -1.8463134765625, -1.443603515625, -1.0408935546875, -0.63818359375, -0.2354736328125, 0.167236328125, 0.5699462890625, 0.97265625, 1.3753662109375, 1.778076171875, 2.1807861328125, 2.58349609375, 2.9862060546875, 3.388916015625, 3.7916259765625, 4.1943359375, 4.5970458984375, 4.999755859375, 5.4024658203125, 5.80517578125, 6.2078857421875, 6.610595703125, 7.0133056640625, 7.416015625, 7.8187255859375, 8.221435546875, 8.6241455078125, 9.02685546875, 9.4295654296875, 9.832275390625, 10.2349853515625, 10.6376953125, 11.0404052734375, 11.443115234375, 11.8458251953125, 12.24853515625, 12.6512451171875, 13.053955078125, 13.4566650390625, 13.859375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 9.0, 13.0, 9.0, 21.0, 35.0, 44.0, 61.0, 88.0, 112.0, 196.0, 255.0, 356.0, 510.0, 765.0, 1030.0, 1638.0, 2381.0, 3581.0, 5602.0, 8552.0, 13717.0, 22672.0, 38420.0, 64914.0, 110402.0, 176342.0, 210461.0, 152995.0, 93301.0, 54713.0, 32231.0, 19375.0, 11830.0, 7472.0, 4776.0, 3055.0, 2063.0, 1460.0, 930.0, 678.0, 459.0, 308.0, 235.0, 139.0, 104.0, 72.0, 53.0, 42.0, 20.0, 28.0, 12.0, 7.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.673828125, -1.61865234375, -1.5634765625, -1.50830078125, -1.453125, -1.39794921875, -1.3427734375, -1.28759765625, -1.232421875, -1.17724609375, -1.1220703125, -1.06689453125, -1.01171875, -0.95654296875, -0.9013671875, -0.84619140625, -0.791015625, -0.73583984375, -0.6806640625, -0.62548828125, -0.5703125, -0.51513671875, -0.4599609375, -0.40478515625, -0.349609375, -0.29443359375, -0.2392578125, -0.18408203125, -0.12890625, -0.07373046875, -0.0185546875, 0.03662109375, 0.091796875, 0.14697265625, 0.2021484375, 0.25732421875, 0.3125, 0.36767578125, 0.4228515625, 0.47802734375, 0.533203125, 0.58837890625, 0.6435546875, 0.69873046875, 0.75390625, 0.80908203125, 0.8642578125, 0.91943359375, 0.974609375, 1.02978515625, 1.0849609375, 1.14013671875, 1.1953125, 1.25048828125, 1.3056640625, 1.36083984375, 1.416015625, 1.47119140625, 1.5263671875, 1.58154296875, 1.63671875, 1.69189453125, 1.7470703125, 1.80224609375, 1.857421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 9.0, 15.0, 13.0, 7.0, 16.0, 27.0, 24.0, 40.0, 37.0, 32.0, 32.0, 31.0, 42.0, 46.0, 42.0, 52.0, 1073.0, 40.0, 44.0, 39.0, 39.0, 41.0, 27.0, 32.0, 33.0, 35.0, 24.0, 27.0, 20.0, 20.0, 12.0, 10.0, 9.0, 6.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.49591064453125, -6.2535400390625, -6.01116943359375, -5.768798828125, -5.52642822265625, -5.2840576171875, -5.04168701171875, -4.79931640625, -4.55694580078125, -4.3145751953125, -4.07220458984375, -3.829833984375, -3.58746337890625, -3.3450927734375, -3.10272216796875, -2.8603515625, -2.61798095703125, -2.3756103515625, -2.13323974609375, -1.890869140625, -1.64849853515625, -1.4061279296875, -1.16375732421875, -0.92138671875, -0.67901611328125, -0.4366455078125, -0.19427490234375, 0.048095703125, 0.29046630859375, 0.5328369140625, 0.77520751953125, 1.017578125, 1.25994873046875, 1.5023193359375, 1.74468994140625, 1.987060546875, 2.22943115234375, 2.4718017578125, 2.71417236328125, 2.95654296875, 3.19891357421875, 3.4412841796875, 3.68365478515625, 3.926025390625, 4.16839599609375, 4.4107666015625, 4.65313720703125, 4.8955078125, 5.13787841796875, 5.3802490234375, 5.62261962890625, 5.864990234375, 6.10736083984375, 6.3497314453125, 6.59210205078125, 6.83447265625, 7.07684326171875, 7.3192138671875, 7.56158447265625, 7.803955078125, 8.04632568359375, 8.2886962890625, 8.53106689453125, 8.7734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 10.0, 23.0, 32.0, 26.0, 61.0, 79.0, 107.0, 194.0, 290.0, 425.0, 637.0, 999.0, 1628.0, 2359.0, 3900.0, 5810.0, 9393.0, 14543.0, 23474.0, 37255.0, 60788.0, 99163.0, 157050.0, 1249343.0, 160806.0, 102220.0, 62955.0, 38138.0, 23789.0, 14874.0, 9695.0, 6097.0, 3931.0, 2508.0, 1634.0, 991.0, 642.0, 423.0, 276.0, 192.0, 124.0, 85.0, 63.0, 29.0, 23.0, 18.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.96484375, -0.936065673828125, -0.90728759765625, -0.878509521484375, -0.8497314453125, -0.820953369140625, -0.79217529296875, -0.763397216796875, -0.734619140625, -0.705841064453125, -0.67706298828125, -0.648284912109375, -0.6195068359375, -0.590728759765625, -0.56195068359375, -0.533172607421875, -0.50439453125, -0.475616455078125, -0.44683837890625, -0.418060302734375, -0.3892822265625, -0.360504150390625, -0.33172607421875, -0.302947998046875, -0.274169921875, -0.245391845703125, -0.21661376953125, -0.187835693359375, -0.1590576171875, -0.130279541015625, -0.10150146484375, -0.072723388671875, -0.0439453125, -0.015167236328125, 0.01361083984375, 0.042388916015625, 0.0711669921875, 0.099945068359375, 0.12872314453125, 0.157501220703125, 0.186279296875, 0.215057373046875, 0.24383544921875, 0.272613525390625, 0.3013916015625, 0.330169677734375, 0.35894775390625, 0.387725830078125, 0.41650390625, 0.445281982421875, 0.47406005859375, 0.502838134765625, 0.5316162109375, 0.560394287109375, 0.58917236328125, 0.617950439453125, 0.646728515625, 0.675506591796875, 0.70428466796875, 0.733062744140625, 0.7618408203125, 0.790618896484375, 0.81939697265625, 0.848175048828125, 0.876953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 12.0, 7.0, 12.0, 13.0, 7.0, 8.0, 20.0, 19.0, 25.0, 35.0, 44.0, 65.0, 92.0, 116.0, 126.0, 93.0, 85.0, 43.0, 38.0, 31.0, 28.0, 16.0, 9.0, 9.0, 12.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016632080078125, -0.01611614227294922, -0.015600204467773438, -0.015084266662597656, -0.014568328857421875, -0.014052391052246094, -0.013536453247070312, -0.013020515441894531, -0.01250457763671875, -0.011988639831542969, -0.011472702026367188, -0.010956764221191406, -0.010440826416015625, -0.009924888610839844, -0.009408950805664062, -0.008893013000488281, -0.0083770751953125, -0.007861137390136719, -0.0073451995849609375, -0.006829261779785156, -0.006313323974609375, -0.005797386169433594, -0.0052814483642578125, -0.004765510559082031, -0.00424957275390625, -0.0037336349487304688, -0.0032176971435546875, -0.0027017593383789062, -0.002185821533203125, -0.0016698837280273438, -0.0011539459228515625, -0.0006380081176757812, -0.0001220703125, 0.00039386749267578125, 0.0009098052978515625, 0.0014257431030273438, 0.001941680908203125, 0.0024576187133789062, 0.0029735565185546875, 0.0034894943237304688, 0.00400543212890625, 0.004521369934082031, 0.0050373077392578125, 0.005553245544433594, 0.006069183349609375, 0.006585121154785156, 0.0071010589599609375, 0.007616996765136719, 0.0081329345703125, 0.008648872375488281, 0.009164810180664062, 0.009680747985839844, 0.010196685791015625, 0.010712623596191406, 0.011228561401367188, 0.011744499206542969, 0.01226043701171875, 0.012776374816894531, 0.013292312622070312, 0.013808250427246094, 0.014324188232421875, 0.014840126037597656, 0.015356063842773438, 0.01587200164794922, 0.016387939453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 13.0, 7.0, 10.0, 13.0, 19.0, 20.0, 47.0, 64.0, 64.0, 127.0, 175.0, 302.0, 686.0, 6116.0, 617113.0, 417091.0, 5151.0, 705.0, 275.0, 182.0, 96.0, 62.0, 41.0, 50.0, 23.0, 17.0, 20.0, 19.0, 12.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2584991455078125, -0.250152587890625, -0.2418060302734375, -0.23345947265625, -0.2251129150390625, -0.216766357421875, -0.2084197998046875, -0.2000732421875, -0.1917266845703125, -0.183380126953125, -0.1750335693359375, -0.16668701171875, -0.1583404541015625, -0.149993896484375, -0.1416473388671875, -0.13330078125, -0.1249542236328125, -0.116607666015625, -0.1082611083984375, -0.09991455078125, -0.0915679931640625, -0.083221435546875, -0.0748748779296875, -0.0665283203125, -0.0581817626953125, -0.049835205078125, -0.0414886474609375, -0.03314208984375, -0.0247955322265625, -0.016448974609375, -0.0081024169921875, 0.000244140625, 0.0085906982421875, 0.016937255859375, 0.0252838134765625, 0.03363037109375, 0.0419769287109375, 0.050323486328125, 0.0586700439453125, 0.0670166015625, 0.0753631591796875, 0.083709716796875, 0.0920562744140625, 0.10040283203125, 0.1087493896484375, 0.117095947265625, 0.1254425048828125, 0.1337890625, 0.1421356201171875, 0.150482177734375, 0.1588287353515625, 0.16717529296875, 0.1755218505859375, 0.183868408203125, 0.1922149658203125, 0.2005615234375, 0.2089080810546875, 0.217254638671875, 0.2256011962890625, 0.23394775390625, 0.2422943115234375, 0.250640869140625, 0.2589874267578125, 0.267333984375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 25.0, 26.0, 30.0, 55.0, 85.0, 144.0, 199.0, 134.0, 105.0, 57.0, 43.0, 19.0, 25.0, 11.0, 14.0, 5.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01906820386648178, -0.01802540011703968, -0.01698259450495243, -0.01593979075551033, -0.01489698700606823, -0.013854182325303555, -0.01281137764453888, -0.011768573895096779, -0.010725769214332104, -0.009682964533567429, -0.008640160784125328, -0.007597356103360653, -0.006554551888257265, -0.005511747673153877, -0.004468942992389202, -0.0034261387772858143, -0.0023833345621824265, -0.0013405302306637168, -0.00029772589914500713, 0.0007450785487890244, 0.0017878827638924122, 0.0028306869789958, 0.003873491659760475, 0.004916295874863863, 0.005959100089967251, 0.007001904305070639, 0.008044708520174026, 0.009087513200938702, 0.010130317881703377, 0.011173121631145477, 0.012215926311910152, 0.013258730992674828, 0.014301534742116928, 0.015344339422881603, 0.01638714410364628, 0.01742994785308838, 0.01847275160253048, 0.01951555535197258, 0.02055836096405983, 0.02160116471350193, 0.02264396846294403, 0.02368677221238613, 0.02472957782447338, 0.02577238157391548, 0.026815185323357582, 0.027857989072799683, 0.028900794684886932, 0.029943598434329033, 0.030986404046416283, 0.03202920779585838, 0.03307201340794563, 0.034114815294742584, 0.035157620906829834, 0.036200426518917084, 0.037243232131004333, 0.038286034017801285, 0.039328839629888535, 0.040371645241975784, 0.041414447128772736, 0.042457252740859985, 0.043500058352947235, 0.044542860239744186, 0.045585665851831436, 0.046628471463918686, 0.04767127335071564]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 5.0, 5.0, 4.0, 16.0, 23.0, 17.0, 16.0, 28.0, 34.0, 28.0, 34.0, 38.0, 38.0, 39.0, 43.0, 46.0, 43.0, 49.0, 45.0, 50.0, 50.0, 28.0, 32.0, 34.0, 24.0, 26.0, 19.0, 24.0, 29.0, 21.0, 17.0, 15.0, 12.0, 13.0, 9.0, 11.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.008784055709838867, -0.008507591672241688, -0.008231127634644508, -0.007954663597047329, -0.0076781995594501495, -0.00740173552185297, -0.007125271484255791, -0.006848807446658611, -0.006572343409061432, -0.0062958793714642525, -0.006019415333867073, -0.005742951296269894, -0.005466487258672714, -0.005190023221075535, -0.004913559183478355, -0.004637095145881176, -0.004360631108283997, -0.004084167070686817, -0.0038077030330896378, -0.0035312389954924583, -0.003254774957895279, -0.0029783109202980995, -0.00270184688270092, -0.0024253828451037407, -0.0021489188075065613, -0.0018724547699093819, -0.0015959907323122025, -0.001319526694715023, -0.0010430626571178436, -0.0007665986195206642, -0.0004901345819234848, -0.0002136705443263054, 6.279349327087402e-05, 0.00033925753086805344, 0.0006157215684652328, 0.0008921856060624123, 0.0011686496436595917, 0.001445113681256771, 0.0017215777188539505, 0.00199804175645113, 0.0022745057940483093, 0.0025509698316454887, 0.002827433869242668, 0.0031038979068398476, 0.003380361944437027, 0.0036568259820342064, 0.003933290019631386, 0.004209754057228565, 0.004486218094825745, 0.004762682132422924, 0.0050391461700201035, 0.005315610207617283, 0.005592074245214462, 0.005868538282811642, 0.006145002320408821, 0.0064214663580060005, 0.00669793039560318, 0.006974394433200359, 0.007250858470797539, 0.007527322508394718, 0.007803786545991898, 0.008080250583589077, 0.008356714621186256, 0.008633178658783436, 0.008909642696380615]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 26.0, 38.0, 33.0, 34.0, 49.0, 59.0, 50.0, 45.0, 55.0, 55.0, 57.0, 52.0, 50.0, 30.0, 43.0, 32.0, 33.0, 30.0, 23.0, 15.0, 17.0, 14.0, 11.0, 7.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5113525390625, -11.108642578125, -10.7059326171875, -10.30322265625, -9.9005126953125, -9.497802734375, -9.0950927734375, -8.6923828125, -8.2896728515625, -7.886962890625, -7.4842529296875, -7.08154296875, -6.6788330078125, -6.276123046875, -5.8734130859375, -5.470703125, -5.0679931640625, -4.665283203125, -4.2625732421875, -3.85986328125, -3.4571533203125, -3.054443359375, -2.6517333984375, -2.2490234375, -1.8463134765625, -1.443603515625, -1.0408935546875, -0.63818359375, -0.2354736328125, 0.167236328125, 0.5699462890625, 0.97265625, 1.3753662109375, 1.778076171875, 2.1807861328125, 2.58349609375, 2.9862060546875, 3.388916015625, 3.7916259765625, 4.1943359375, 4.5970458984375, 4.999755859375, 5.4024658203125, 5.80517578125, 6.2078857421875, 6.610595703125, 7.0133056640625, 7.416015625, 7.8187255859375, 8.221435546875, 8.6241455078125, 9.02685546875, 9.4295654296875, 9.832275390625, 10.2349853515625, 10.6376953125, 11.0404052734375, 11.443115234375, 11.8458251953125, 12.24853515625, 12.6512451171875, 13.053955078125, 13.4566650390625, 13.859375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 16.0, 8.0, 18.0, 29.0, 22.0, 36.0, 50.0, 72.0, 88.0, 160.0, 196.0, 261.0, 359.0, 527.0, 790.0, 1167.0, 1687.0, 2825.0, 4501.0, 7869.0, 15936.0, 42929.0, 267759.0, 593307.0, 63410.0, 20381.0, 9606.0, 5274.0, 3125.0, 1935.0, 1282.0, 867.0, 583.0, 414.0, 288.0, 194.0, 156.0, 106.0, 78.0, 70.0, 47.0, 37.0, 35.0, 17.0, 8.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.515625, -17.921142578125, -17.32666015625, -16.732177734375, -16.1376953125, -15.543212890625, -14.94873046875, -14.354248046875, -13.759765625, -13.165283203125, -12.57080078125, -11.976318359375, -11.3818359375, -10.787353515625, -10.19287109375, -9.598388671875, -9.00390625, -8.409423828125, -7.81494140625, -7.220458984375, -6.6259765625, -6.031494140625, -5.43701171875, -4.842529296875, -4.248046875, -3.653564453125, -3.05908203125, -2.464599609375, -1.8701171875, -1.275634765625, -0.68115234375, -0.086669921875, 0.5078125, 1.102294921875, 1.69677734375, 2.291259765625, 2.8857421875, 3.480224609375, 4.07470703125, 4.669189453125, 5.263671875, 5.858154296875, 6.45263671875, 7.047119140625, 7.6416015625, 8.236083984375, 8.83056640625, 9.425048828125, 10.01953125, 10.614013671875, 11.20849609375, 11.802978515625, 12.3974609375, 12.991943359375, 13.58642578125, 14.180908203125, 14.775390625, 15.369873046875, 15.96435546875, 16.558837890625, 17.1533203125, 17.747802734375, 18.34228515625, 18.936767578125, 19.53125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 7.0, 2.0, 7.0, 18.0, 9.0, 22.0, 18.0, 18.0, 35.0, 26.0, 31.0, 36.0, 49.0, 49.0, 50.0, 60.0, 113.0, 246.0, 1580.0, 149.0, 86.0, 59.0, 48.0, 43.0, 39.0, 33.0, 27.0, 34.0, 26.0, 26.0, 23.0, 16.0, 14.0, 9.0, 1.0, 10.0, 13.0, 7.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.84375, -30.63330078125, -29.4228515625, -28.21240234375, -27.001953125, -25.79150390625, -24.5810546875, -23.37060546875, -22.16015625, -20.94970703125, -19.7392578125, -18.52880859375, -17.318359375, -16.10791015625, -14.8974609375, -13.68701171875, -12.4765625, -11.26611328125, -10.0556640625, -8.84521484375, -7.634765625, -6.42431640625, -5.2138671875, -4.00341796875, -2.79296875, -1.58251953125, -0.3720703125, 0.83837890625, 2.048828125, 3.25927734375, 4.4697265625, 5.68017578125, 6.890625, 8.10107421875, 9.3115234375, 10.52197265625, 11.732421875, 12.94287109375, 14.1533203125, 15.36376953125, 16.57421875, 17.78466796875, 18.9951171875, 20.20556640625, 21.416015625, 22.62646484375, 23.8369140625, 25.04736328125, 26.2578125, 27.46826171875, 28.6787109375, 29.88916015625, 31.099609375, 32.31005859375, 33.5205078125, 34.73095703125, 35.94140625, 37.15185546875, 38.3623046875, 39.57275390625, 40.783203125, 41.99365234375, 43.2041015625, 44.41455078125, 45.625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 0.0, 4.0, 5.0, 5.0, 6.0, 12.0, 7.0, 14.0, 22.0, 23.0, 35.0, 48.0, 71.0, 92.0, 145.0, 232.0, 475.0, 2262.0, 41448.0, 3064997.0, 32679.0, 2002.0, 462.0, 222.0, 130.0, 96.0, 56.0, 43.0, 28.0, 14.0, 22.0, 16.0, 8.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.9375, -91.4814453125, -88.025390625, -84.5693359375, -81.11328125, -77.6572265625, -74.201171875, -70.7451171875, -67.2890625, -63.8330078125, -60.376953125, -56.9208984375, -53.46484375, -50.0087890625, -46.552734375, -43.0966796875, -39.640625, -36.1845703125, -32.728515625, -29.2724609375, -25.81640625, -22.3603515625, -18.904296875, -15.4482421875, -11.9921875, -8.5361328125, -5.080078125, -1.6240234375, 1.83203125, 5.2880859375, 8.744140625, 12.2001953125, 15.65625, 19.1123046875, 22.568359375, 26.0244140625, 29.48046875, 32.9365234375, 36.392578125, 39.8486328125, 43.3046875, 46.7607421875, 50.216796875, 53.6728515625, 57.12890625, 60.5849609375, 64.041015625, 67.4970703125, 70.953125, 74.4091796875, 77.865234375, 81.3212890625, 84.77734375, 88.2333984375, 91.689453125, 95.1455078125, 98.6015625, 102.0576171875, 105.513671875, 108.9697265625, 112.42578125, 115.8818359375, 119.337890625, 122.7939453125, 126.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 50.0, 596.0, 336.0, 30.0, 5.0], "bins": [-778.5198364257812, -765.7190551757812, -752.9182739257812, -740.1174926757812, -727.3167114257812, -714.5159912109375, -701.7152099609375, -688.9144287109375, -676.1136474609375, -663.3128662109375, -650.5120849609375, -637.7113037109375, -624.9105224609375, -612.1097412109375, -599.3089599609375, -586.5082397460938, -573.7073974609375, -560.9066162109375, -548.1058349609375, -535.3050537109375, -522.5042724609375, -509.7035217285156, -496.9027404785156, -484.1019592285156, -471.30120849609375, -458.50042724609375, -445.69964599609375, -432.89886474609375, -420.0981140136719, -407.2973327636719, -394.4965515136719, -381.6957702636719, -368.89501953125, -356.09423828125, -343.29345703125, -330.49267578125, -317.6919250488281, -304.8911437988281, -292.0903625488281, -279.2895812988281, -266.4888000488281, -253.68801879882812, -240.8872528076172, -228.0864715576172, -215.28570556640625, -202.48492431640625, -189.68414306640625, -176.88336181640625, -164.0825958251953, -151.2818145751953, -138.48104858398438, -125.68026733398438, -112.8794937133789, -100.07872009277344, -87.27793884277344, -74.47716522216797, -61.676395416259766, -48.87561798095703, -36.07484436035156, -23.274066925048828, -10.47329330444336, 2.3274803161621094, 15.12826156616211, 27.929035186767578, 40.72980880737305]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 8.0, 12.0, 8.0, 11.0, 12.0, 27.0, 30.0, 26.0, 32.0, 24.0, 26.0, 39.0, 36.0, 34.0, 37.0, 32.0, 35.0, 32.0, 45.0, 46.0, 42.0, 40.0, 45.0, 32.0, 26.0, 29.0, 36.0, 29.0, 23.0, 18.0, 20.0, 21.0, 14.0, 7.0, 10.0, 11.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0], "bins": [-114.74717712402344, -111.5773696899414, -108.4075698852539, -105.23776245117188, -102.06796264648438, -98.89815521240234, -95.72834777832031, -92.55854797363281, -89.38874053955078, -86.21893310546875, -83.04913330078125, -79.87932586669922, -76.70951843261719, -73.53971862792969, -70.36991119384766, -67.20010375976562, -64.03030395507812, -60.86050033569336, -57.690696716308594, -54.52088928222656, -51.3510856628418, -48.18128204345703, -45.011474609375, -41.841670989990234, -38.67186737060547, -35.5020637512207, -32.33226013183594, -29.162452697753906, -25.99264907836914, -22.822845458984375, -19.653039932250977, -16.483234405517578, -13.313438415527344, -10.143633842468262, -6.97382926940918, -3.8040246963500977, -0.6342201232910156, 2.5355844497680664, 5.705389022827148, 8.875194549560547, 12.044998168945312, 15.214802742004395, 18.384607315063477, 21.554412841796875, 24.72421646118164, 27.894020080566406, 31.063825607299805, 34.2336311340332, 37.40343475341797, 40.573238372802734, 43.7430419921875, 46.91284942626953, 50.0826530456543, 53.25245666503906, 56.422264099121094, 59.59206771850586, 62.761871337890625, 65.93167877197266, 69.10147857666016, 72.27128601074219, 75.44108581542969, 78.61089324951172, 81.78070068359375, 84.95050048828125, 88.12030792236328]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 11.0, 10.0, 17.0, 8.0, 28.0, 24.0, 40.0, 26.0, 32.0, 41.0, 47.0, 42.0, 45.0, 56.0, 57.0, 54.0, 49.0, 56.0, 56.0, 44.0, 38.0, 36.0, 32.0, 28.0, 23.0, 18.0, 14.0, 15.0, 13.0, 7.0, 10.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6640625, -12.2269287109375, -11.789794921875, -11.3526611328125, -10.91552734375, -10.4783935546875, -10.041259765625, -9.6041259765625, -9.1669921875, -8.7298583984375, -8.292724609375, -7.8555908203125, -7.41845703125, -6.9813232421875, -6.544189453125, -6.1070556640625, -5.669921875, -5.2327880859375, -4.795654296875, -4.3585205078125, -3.92138671875, -3.4842529296875, -3.047119140625, -2.6099853515625, -2.1728515625, -1.7357177734375, -1.298583984375, -0.8614501953125, -0.42431640625, 0.0128173828125, 0.449951171875, 0.8870849609375, 1.32421875, 1.7613525390625, 2.198486328125, 2.6356201171875, 3.07275390625, 3.5098876953125, 3.947021484375, 4.3841552734375, 4.8212890625, 5.2584228515625, 5.695556640625, 6.1326904296875, 6.56982421875, 7.0069580078125, 7.444091796875, 7.8812255859375, 8.318359375, 8.7554931640625, 9.192626953125, 9.6297607421875, 10.06689453125, 10.5040283203125, 10.941162109375, 11.3782958984375, 11.8154296875, 12.2525634765625, 12.689697265625, 13.1268310546875, 13.56396484375, 14.0010986328125, 14.438232421875, 14.8753662109375, 15.3125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 12.0, 14.0, 26.0, 27.0, 45.0, 84.0, 106.0, 138.0, 271.0, 457.0, 790.0, 1232.0, 2236.0, 4053.0, 7926.0, 19209.0, 66805.0, 492997.0, 2422479.0, 1002359.0, 125705.0, 26307.0, 9931.0, 4850.0, 2567.0, 1361.0, 857.0, 497.0, 285.0, 209.0, 139.0, 94.0, 53.0, 40.0, 32.0, 19.0, 16.0, 6.0, 2.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.1875, -19.507080078125, -18.82666015625, -18.146240234375, -17.4658203125, -16.785400390625, -16.10498046875, -15.424560546875, -14.744140625, -14.063720703125, -13.38330078125, -12.702880859375, -12.0224609375, -11.342041015625, -10.66162109375, -9.981201171875, -9.30078125, -8.620361328125, -7.93994140625, -7.259521484375, -6.5791015625, -5.898681640625, -5.21826171875, -4.537841796875, -3.857421875, -3.177001953125, -2.49658203125, -1.816162109375, -1.1357421875, -0.455322265625, 0.22509765625, 0.905517578125, 1.5859375, 2.266357421875, 2.94677734375, 3.627197265625, 4.3076171875, 4.988037109375, 5.66845703125, 6.348876953125, 7.029296875, 7.709716796875, 8.39013671875, 9.070556640625, 9.7509765625, 10.431396484375, 11.11181640625, 11.792236328125, 12.47265625, 13.153076171875, 13.83349609375, 14.513916015625, 15.1943359375, 15.874755859375, 16.55517578125, 17.235595703125, 17.916015625, 18.596435546875, 19.27685546875, 19.957275390625, 20.6376953125, 21.318115234375, 21.99853515625, 22.678955078125, 23.359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 7.0, 3.0, 10.0, 11.0, 7.0, 11.0, 12.0, 17.0, 28.0, 33.0, 60.0, 65.0, 126.0, 201.0, 365.0, 628.0, 830.0, 664.0, 397.0, 208.0, 112.0, 85.0, 70.0, 31.0, 28.0, 16.0, 9.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.671875, -30.668212890625, -29.66455078125, -28.660888671875, -27.6572265625, -26.653564453125, -25.64990234375, -24.646240234375, -23.642578125, -22.638916015625, -21.63525390625, -20.631591796875, -19.6279296875, -18.624267578125, -17.62060546875, -16.616943359375, -15.61328125, -14.609619140625, -13.60595703125, -12.602294921875, -11.5986328125, -10.594970703125, -9.59130859375, -8.587646484375, -7.583984375, -6.580322265625, -5.57666015625, -4.572998046875, -3.5693359375, -2.565673828125, -1.56201171875, -0.558349609375, 0.4453125, 1.448974609375, 2.45263671875, 3.456298828125, 4.4599609375, 5.463623046875, 6.46728515625, 7.470947265625, 8.474609375, 9.478271484375, 10.48193359375, 11.485595703125, 12.4892578125, 13.492919921875, 14.49658203125, 15.500244140625, 16.50390625, 17.507568359375, 18.51123046875, 19.514892578125, 20.5185546875, 21.522216796875, 22.52587890625, 23.529541015625, 24.533203125, 25.536865234375, 26.54052734375, 27.544189453125, 28.5478515625, 29.551513671875, 30.55517578125, 31.558837890625, 32.5625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 13.0, 26.0, 26.0, 67.0, 111.0, 238.0, 536.0, 1329.0, 4039.0, 15422.0, 105802.0, 3353093.0, 662955.0, 38524.0, 7965.0, 2447.0, 855.0, 348.0, 180.0, 100.0, 48.0, 34.0, 25.0, 16.0, 13.0, 10.0, 8.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.52734375, -57.7109375, -55.89453125, -54.078125, -52.26171875, -50.4453125, -48.62890625, -46.8125, -44.99609375, -43.1796875, -41.36328125, -39.546875, -37.73046875, -35.9140625, -34.09765625, -32.28125, -30.46484375, -28.6484375, -26.83203125, -25.015625, -23.19921875, -21.3828125, -19.56640625, -17.75, -15.93359375, -14.1171875, -12.30078125, -10.484375, -8.66796875, -6.8515625, -5.03515625, -3.21875, -1.40234375, 0.4140625, 2.23046875, 4.046875, 5.86328125, 7.6796875, 9.49609375, 11.3125, 13.12890625, 14.9453125, 16.76171875, 18.578125, 20.39453125, 22.2109375, 24.02734375, 25.84375, 27.66015625, 29.4765625, 31.29296875, 33.109375, 34.92578125, 36.7421875, 38.55859375, 40.375, 42.19140625, 44.0078125, 45.82421875, 47.640625, 49.45703125, 51.2734375, 53.08984375, 54.90625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 41.0, 115.0, 246.0, 304.0, 173.0, 75.0, 29.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-282.99395751953125, -274.4769287109375, -265.95989990234375, -257.4429016113281, -248.92587280273438, -240.40884399414062, -231.89181518554688, -223.37478637695312, -214.85777282714844, -206.3407440185547, -197.82373046875, -189.30670166015625, -180.7896728515625, -172.2726593017578, -163.75563049316406, -155.23861694335938, -146.72158813476562, -138.20455932617188, -129.6875457763672, -121.17051696777344, -112.65349578857422, -104.136474609375, -95.61944580078125, -87.10242462158203, -78.58540344238281, -70.0683822631836, -61.55135726928711, -53.034332275390625, -44.517311096191406, -36.00028991699219, -27.483264923095703, -18.96623992919922, -10.449249267578125, -1.9322261810302734, 6.584796905517578, 15.10181999206543, 23.61884307861328, 32.1358642578125, 40.652889251708984, 49.16991424560547, 57.68693542480469, 66.2039566040039, 74.72097778320312, 83.23800659179688, 91.7550277709961, 100.27204895019531, 108.78907775878906, 117.30609893798828, 125.8231201171875, 134.34014892578125, 142.85716247558594, 151.3741912841797, 159.89120483398438, 168.40823364257812, 176.92526245117188, 185.44229125976562, 193.9593048095703, 202.47633361816406, 210.99334716796875, 219.5103759765625, 228.02740478515625, 236.54441833496094, 245.0614471435547, 253.57846069335938, 262.0954895019531]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 5.0, 4.0, 7.0, 14.0, 7.0, 13.0, 17.0, 20.0, 23.0, 26.0, 26.0, 32.0, 26.0, 37.0, 31.0, 35.0, 34.0, 41.0, 52.0, 44.0, 37.0, 47.0, 44.0, 39.0, 42.0, 42.0, 23.0, 30.0, 32.0, 33.0, 16.0, 5.0, 20.0, 17.0, 9.0, 21.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-79.554443359375, -77.22966003417969, -74.9048843383789, -72.5801010131836, -70.25532531738281, -67.9305419921875, -65.60576629638672, -63.280982971191406, -60.95620346069336, -58.63142395019531, -56.306644439697266, -53.98186492919922, -51.657081604003906, -49.332305908203125, -47.00752258300781, -44.682743072509766, -42.35796356201172, -40.03318405151367, -37.708404541015625, -35.38362503051758, -33.05884552001953, -30.73406410217285, -28.409282684326172, -26.084503173828125, -23.759723663330078, -21.43494415283203, -19.110164642333984, -16.785383224487305, -14.460603713989258, -12.135824203491211, -9.811043739318848, -7.486263275146484, -5.161491394042969, -2.8367114067077637, -0.5119314193725586, 1.8128485679626465, 4.137628555297852, 6.462408065795898, 8.787188529968262, 11.111968994140625, 13.436748504638672, 15.761528015136719, 18.086307525634766, 20.411088943481445, 22.735868453979492, 25.06064796447754, 27.38542938232422, 29.710208892822266, 32.03498840332031, 34.35976791381836, 36.684547424316406, 39.00932693481445, 41.3341064453125, 43.65888977050781, 45.98366928100586, 48.308448791503906, 50.63322830200195, 52.9580078125, 55.28278732299805, 57.607566833496094, 59.932350158691406, 62.25712585449219, 64.5819091796875, 66.90669250488281, 69.2314682006836]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 9.0, 19.0, 20.0, 17.0, 20.0, 23.0, 31.0, 36.0, 35.0, 37.0, 44.0, 45.0, 42.0, 52.0, 61.0, 56.0, 61.0, 58.0, 49.0, 50.0, 36.0, 34.0, 43.0, 17.0, 20.0, 13.0, 17.0, 11.0, 17.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3056640625, -11.861328125, -11.4169921875, -10.97265625, -10.5283203125, -10.083984375, -9.6396484375, -9.1953125, -8.7509765625, -8.306640625, -7.8623046875, -7.41796875, -6.9736328125, -6.529296875, -6.0849609375, -5.640625, -5.1962890625, -4.751953125, -4.3076171875, -3.86328125, -3.4189453125, -2.974609375, -2.5302734375, -2.0859375, -1.6416015625, -1.197265625, -0.7529296875, -0.30859375, 0.1357421875, 0.580078125, 1.0244140625, 1.46875, 1.9130859375, 2.357421875, 2.8017578125, 3.24609375, 3.6904296875, 4.134765625, 4.5791015625, 5.0234375, 5.4677734375, 5.912109375, 6.3564453125, 6.80078125, 7.2451171875, 7.689453125, 8.1337890625, 8.578125, 9.0224609375, 9.466796875, 9.9111328125, 10.35546875, 10.7998046875, 11.244140625, 11.6884765625, 12.1328125, 12.5771484375, 13.021484375, 13.4658203125, 13.91015625, 14.3544921875, 14.798828125, 15.2431640625, 15.6875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 11.0, 21.0, 27.0, 36.0, 67.0, 75.0, 120.0, 191.0, 287.0, 462.0, 710.0, 1199.0, 1862.0, 2986.0, 4878.0, 8149.0, 14378.0, 25935.0, 48907.0, 93298.0, 176578.0, 255657.0, 190361.0, 102589.0, 53490.0, 28122.0, 15476.0, 9092.0, 5079.0, 3182.0, 1942.0, 1211.0, 774.0, 478.0, 304.0, 209.0, 140.0, 71.0, 71.0, 34.0, 27.0, 23.0, 17.0, 8.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.144683837890625, -2.07452392578125, -2.004364013671875, -1.9342041015625, -1.864044189453125, -1.79388427734375, -1.723724365234375, -1.653564453125, -1.583404541015625, -1.51324462890625, -1.443084716796875, -1.3729248046875, -1.302764892578125, -1.23260498046875, -1.162445068359375, -1.09228515625, -1.022125244140625, -0.95196533203125, -0.881805419921875, -0.8116455078125, -0.741485595703125, -0.67132568359375, -0.601165771484375, -0.531005859375, -0.460845947265625, -0.39068603515625, -0.320526123046875, -0.2503662109375, -0.180206298828125, -0.11004638671875, -0.039886474609375, 0.0302734375, 0.100433349609375, 0.17059326171875, 0.240753173828125, 0.3109130859375, 0.381072998046875, 0.45123291015625, 0.521392822265625, 0.591552734375, 0.661712646484375, 0.73187255859375, 0.802032470703125, 0.8721923828125, 0.942352294921875, 1.01251220703125, 1.082672119140625, 1.15283203125, 1.222991943359375, 1.29315185546875, 1.363311767578125, 1.4334716796875, 1.503631591796875, 1.57379150390625, 1.643951416015625, 1.714111328125, 1.784271240234375, 1.85443115234375, 1.924591064453125, 1.9947509765625, 2.064910888671875, 2.13507080078125, 2.205230712890625, 2.275390625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 10.0, 10.0, 14.0, 16.0, 25.0, 22.0, 17.0, 20.0, 21.0, 34.0, 34.0, 34.0, 37.0, 46.0, 37.0, 31.0, 37.0, 1057.0, 33.0, 36.0, 40.0, 30.0, 37.0, 36.0, 35.0, 32.0, 28.0, 32.0, 20.0, 14.0, 14.0, 14.0, 15.0, 15.0, 16.0, 9.0, 8.0, 5.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.78125, -7.5504150390625, -7.319580078125, -7.0887451171875, -6.85791015625, -6.6270751953125, -6.396240234375, -6.1654052734375, -5.9345703125, -5.7037353515625, -5.472900390625, -5.2420654296875, -5.01123046875, -4.7803955078125, -4.549560546875, -4.3187255859375, -4.087890625, -3.8570556640625, -3.626220703125, -3.3953857421875, -3.16455078125, -2.9337158203125, -2.702880859375, -2.4720458984375, -2.2412109375, -2.0103759765625, -1.779541015625, -1.5487060546875, -1.31787109375, -1.0870361328125, -0.856201171875, -0.6253662109375, -0.39453125, -0.1636962890625, 0.067138671875, 0.2979736328125, 0.52880859375, 0.7596435546875, 0.990478515625, 1.2213134765625, 1.4521484375, 1.6829833984375, 1.913818359375, 2.1446533203125, 2.37548828125, 2.6063232421875, 2.837158203125, 3.0679931640625, 3.298828125, 3.5296630859375, 3.760498046875, 3.9913330078125, 4.22216796875, 4.4530029296875, 4.683837890625, 4.9146728515625, 5.1455078125, 5.3763427734375, 5.607177734375, 5.8380126953125, 6.06884765625, 6.2996826171875, 6.530517578125, 6.7613525390625, 6.9921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 7.0, 17.0, 14.0, 36.0, 34.0, 61.0, 80.0, 114.0, 148.0, 241.0, 335.0, 455.0, 698.0, 1101.0, 1588.0, 2328.0, 3385.0, 5176.0, 7651.0, 11467.0, 17561.0, 27446.0, 43792.0, 69685.0, 108941.0, 160156.0, 1230615.0, 142440.0, 94194.0, 60133.0, 37522.0, 23748.0, 15164.0, 10030.0, 6684.0, 4731.0, 2963.0, 2078.0, 1350.0, 918.0, 654.0, 409.0, 306.0, 226.0, 143.0, 107.0, 65.0, 44.0, 26.0, 20.0, 11.0, 12.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.9609375, -0.9312210083007812, -0.9015045166015625, -0.8717880249023438, -0.842071533203125, -0.8123550415039062, -0.7826385498046875, -0.7529220581054688, -0.72320556640625, -0.6934890747070312, -0.6637725830078125, -0.6340560913085938, -0.604339599609375, -0.5746231079101562, -0.5449066162109375, -0.5151901245117188, -0.4854736328125, -0.45575714111328125, -0.4260406494140625, -0.39632415771484375, -0.366607666015625, -0.33689117431640625, -0.3071746826171875, -0.27745819091796875, -0.24774169921875, -0.21802520751953125, -0.1883087158203125, -0.15859222412109375, -0.128875732421875, -0.09915924072265625, -0.0694427490234375, -0.03972625732421875, -0.010009765625, 0.01970672607421875, 0.0494232177734375, 0.07913970947265625, 0.108856201171875, 0.13857269287109375, 0.1682891845703125, 0.19800567626953125, 0.22772216796875, 0.25743865966796875, 0.2871551513671875, 0.31687164306640625, 0.346588134765625, 0.37630462646484375, 0.4060211181640625, 0.43573760986328125, 0.4654541015625, 0.49517059326171875, 0.5248870849609375, 0.5546035766601562, 0.584320068359375, 0.6140365600585938, 0.6437530517578125, 0.6734695434570312, 0.70318603515625, 0.7329025268554688, 0.7626190185546875, 0.7923355102539062, 0.822052001953125, 0.8517684936523438, 0.8814849853515625, 0.9112014770507812, 0.94091796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 14.0, 24.0, 42.0, 70.0, 101.0, 141.0, 175.0, 136.0, 72.0, 53.0, 40.0, 23.0, 15.0, 8.0, 10.0, 9.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.03997802734375, -0.03890728950500488, -0.037836551666259766, -0.03676581382751465, -0.03569507598876953, -0.034624338150024414, -0.0335536003112793, -0.03248286247253418, -0.03141212463378906, -0.030341386795043945, -0.029270648956298828, -0.02819991111755371, -0.027129173278808594, -0.026058435440063477, -0.02498769760131836, -0.023916959762573242, -0.022846221923828125, -0.021775484085083008, -0.02070474624633789, -0.019634008407592773, -0.018563270568847656, -0.01749253273010254, -0.016421794891357422, -0.015351057052612305, -0.014280319213867188, -0.01320958137512207, -0.012138843536376953, -0.011068105697631836, -0.009997367858886719, -0.008926630020141602, -0.007855892181396484, -0.006785154342651367, -0.00571441650390625, -0.004643678665161133, -0.0035729408264160156, -0.0025022029876708984, -0.0014314651489257812, -0.00036072731018066406, 0.0007100105285644531, 0.0017807483673095703, 0.0028514862060546875, 0.003922224044799805, 0.004992961883544922, 0.006063699722290039, 0.007134437561035156, 0.008205175399780273, 0.00927591323852539, 0.010346651077270508, 0.011417388916015625, 0.012488126754760742, 0.01355886459350586, 0.014629602432250977, 0.015700340270996094, 0.01677107810974121, 0.017841815948486328, 0.018912553787231445, 0.019983291625976562, 0.02105402946472168, 0.022124767303466797, 0.023195505142211914, 0.02426624298095703, 0.02533698081970215, 0.026407718658447266, 0.027478456497192383, 0.0285491943359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 5.0, 4.0, 13.0, 19.0, 21.0, 62.0, 94.0, 181.0, 500.0, 7512.0, 1007227.0, 31396.0, 996.0, 266.0, 107.0, 48.0, 23.0, 22.0, 7.0, 8.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60400390625, -0.5813446044921875, -0.558685302734375, -0.5360260009765625, -0.51336669921875, -0.4907073974609375, -0.468048095703125, -0.4453887939453125, -0.4227294921875, -0.4000701904296875, -0.377410888671875, -0.3547515869140625, -0.33209228515625, -0.3094329833984375, -0.286773681640625, -0.2641143798828125, -0.241455078125, -0.2187957763671875, -0.196136474609375, -0.1734771728515625, -0.15081787109375, -0.1281585693359375, -0.105499267578125, -0.0828399658203125, -0.0601806640625, -0.0375213623046875, -0.014862060546875, 0.0077972412109375, 0.03045654296875, 0.0531158447265625, 0.075775146484375, 0.0984344482421875, 0.12109375, 0.1437530517578125, 0.166412353515625, 0.1890716552734375, 0.21173095703125, 0.2343902587890625, 0.257049560546875, 0.2797088623046875, 0.3023681640625, 0.3250274658203125, 0.347686767578125, 0.3703460693359375, 0.39300537109375, 0.4156646728515625, 0.438323974609375, 0.4609832763671875, 0.483642578125, 0.5063018798828125, 0.528961181640625, 0.5516204833984375, 0.57427978515625, 0.5969390869140625, 0.619598388671875, 0.6422576904296875, 0.6649169921875, 0.6875762939453125, 0.710235595703125, 0.7328948974609375, 0.75555419921875, 0.7782135009765625, 0.800872802734375, 0.8235321044921875, 0.84619140625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 8.0, 18.0, 72.0, 292.0, 390.0, 141.0, 51.0, 19.0, 9.0, 7.0, 7.0], "bins": [-0.28634798526763916, -0.2813399136066437, -0.2763318419456482, -0.2713237702846527, -0.2663156986236572, -0.26130759716033936, -0.25629952549934387, -0.2512914538383484, -0.2462833821773529, -0.24127531051635742, -0.23626723885536194, -0.23125915229320526, -0.22625108063220978, -0.2212430089712143, -0.2162349373102188, -0.21122686564922333, -0.20621879398822784, -0.20121072232723236, -0.19620265066623688, -0.1911945641040802, -0.18618649244308472, -0.18117842078208923, -0.17617034912109375, -0.17116227746009827, -0.16615420579910278, -0.1611461341381073, -0.15613806247711182, -0.15112997591495514, -0.14612190425395966, -0.14111383259296417, -0.1361057609319687, -0.1310976892709732, -0.12608958780765533, -0.12108151614665985, -0.11607343703508377, -0.11106536537408829, -0.10605728626251221, -0.10104921460151672, -0.09604114294052124, -0.09103307127952576, -0.08602499961853027, -0.08101692795753479, -0.07600884884595871, -0.07100077718496323, -0.06599269807338715, -0.06098462641239166, -0.05597655475139618, -0.0509684793651104, -0.04596040025353432, -0.040952324867248535, -0.03594425320625305, -0.03093617781996727, -0.025928102433681488, -0.020920027047395706, -0.015911953523755074, -0.010903880000114441, -0.005895804613828659, -0.0008877301588654518, 0.004120344296097755, 0.009128418751060963, 0.01413649320602417, 0.019144568592309952, 0.024152642115950584, 0.029160715639591217, 0.034168791025877]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 6.0, 3.0, 11.0, 4.0, 9.0, 0.0, 8.0, 13.0, 16.0, 18.0, 14.0, 22.0, 17.0, 36.0, 19.0, 32.0, 30.0, 36.0, 44.0, 41.0, 35.0, 43.0, 30.0, 27.0, 43.0, 38.0, 32.0, 30.0, 26.0, 32.0, 30.0, 28.0, 20.0, 34.0, 13.0, 16.0, 28.0, 19.0, 16.0, 16.0, 13.0, 10.0, 14.0, 6.0, 12.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.014987409114837646, -0.014529501087963581, -0.014071593061089516, -0.01361368503421545, -0.013155777007341385, -0.01269786898046732, -0.012239960953593254, -0.011782052926719189, -0.011324144899845123, -0.010866236872971058, -0.010408328846096992, -0.009950420819222927, -0.009492512792348862, -0.009034604765474796, -0.008576696738600731, -0.008118788711726665, -0.0076608806848526, -0.007202972657978535, -0.006745064631104469, -0.006287156604230404, -0.0058292485773563385, -0.005371340550482273, -0.004913432523608208, -0.004455524496734142, -0.003997616469860077, -0.0035397084429860115, -0.003081800416111946, -0.0026238923892378807, -0.0021659843623638153, -0.00170807633548975, -0.0012501683086156845, -0.0007922602817416191, -0.0003343522548675537, 0.0001235557720065117, 0.0005814637988805771, 0.0010393718257546425, 0.0014972798526287079, 0.0019551878795027733, 0.0024130959063768387, 0.002871003933250904, 0.0033289119601249695, 0.003786819986999035, 0.0042447280138731, 0.004702636040747166, 0.005160544067621231, 0.0056184520944952965, 0.006076360121369362, 0.006534268148243427, 0.006992176175117493, 0.007450084201991558, 0.007907992228865623, 0.008365900255739689, 0.008823808282613754, 0.00928171630948782, 0.009739624336361885, 0.01019753236323595, 0.010655440390110016, 0.011113348416984081, 0.011571256443858147, 0.012029164470732212, 0.012487072497606277, 0.012944980524480343, 0.013402888551354408, 0.013860796578228474, 0.014318704605102539]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 9.0, 19.0, 20.0, 17.0, 20.0, 23.0, 31.0, 36.0, 35.0, 37.0, 44.0, 45.0, 42.0, 52.0, 61.0, 56.0, 60.0, 59.0, 49.0, 50.0, 36.0, 34.0, 43.0, 17.0, 20.0, 13.0, 17.0, 11.0, 17.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3056640625, -11.861328125, -11.4169921875, -10.97265625, -10.5283203125, -10.083984375, -9.6396484375, -9.1953125, -8.7509765625, -8.306640625, -7.8623046875, -7.41796875, -6.9736328125, -6.529296875, -6.0849609375, -5.640625, -5.1962890625, -4.751953125, -4.3076171875, -3.86328125, -3.4189453125, -2.974609375, -2.5302734375, -2.0859375, -1.6416015625, -1.197265625, -0.7529296875, -0.30859375, 0.1357421875, 0.580078125, 1.0244140625, 1.46875, 1.9130859375, 2.357421875, 2.8017578125, 3.24609375, 3.6904296875, 4.134765625, 4.5791015625, 5.0234375, 5.4677734375, 5.912109375, 6.3564453125, 6.80078125, 7.2451171875, 7.689453125, 8.1337890625, 8.578125, 9.0224609375, 9.466796875, 9.9111328125, 10.35546875, 10.7998046875, 11.244140625, 11.6884765625, 12.1328125, 12.5771484375, 13.021484375, 13.4658203125, 13.91015625, 14.3544921875, 14.798828125, 15.2431640625, 15.6875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 5.0, 14.0, 14.0, 23.0, 30.0, 30.0, 28.0, 45.0, 89.0, 90.0, 158.0, 177.0, 259.0, 393.0, 556.0, 905.0, 1429.0, 2280.0, 3739.0, 7100.0, 15495.0, 51292.0, 309450.0, 538124.0, 76250.0, 20314.0, 8538.0, 4413.0, 2513.0, 1579.0, 957.0, 646.0, 465.0, 312.0, 219.0, 178.0, 109.0, 92.0, 49.0, 49.0, 37.0, 25.0, 18.0, 13.0, 10.0, 4.0, 8.0, 3.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.53125, -16.000244140625, -15.46923828125, -14.938232421875, -14.4072265625, -13.876220703125, -13.34521484375, -12.814208984375, -12.283203125, -11.752197265625, -11.22119140625, -10.690185546875, -10.1591796875, -9.628173828125, -9.09716796875, -8.566162109375, -8.03515625, -7.504150390625, -6.97314453125, -6.442138671875, -5.9111328125, -5.380126953125, -4.84912109375, -4.318115234375, -3.787109375, -3.256103515625, -2.72509765625, -2.194091796875, -1.6630859375, -1.132080078125, -0.60107421875, -0.070068359375, 0.4609375, 0.991943359375, 1.52294921875, 2.053955078125, 2.5849609375, 3.115966796875, 3.64697265625, 4.177978515625, 4.708984375, 5.239990234375, 5.77099609375, 6.302001953125, 6.8330078125, 7.364013671875, 7.89501953125, 8.426025390625, 8.95703125, 9.488037109375, 10.01904296875, 10.550048828125, 11.0810546875, 11.612060546875, 12.14306640625, 12.674072265625, 13.205078125, 13.736083984375, 14.26708984375, 14.798095703125, 15.3291015625, 15.860107421875, 16.39111328125, 16.922119140625, 17.453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 6.0, 2.0, 9.0, 8.0, 8.0, 21.0, 10.0, 18.0, 23.0, 31.0, 44.0, 30.0, 32.0, 55.0, 43.0, 70.0, 104.0, 376.0, 1579.0, 135.0, 64.0, 55.0, 41.0, 42.0, 35.0, 31.0, 24.0, 24.0, 22.0, 19.0, 18.0, 19.0, 11.0, 10.0, 1.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.25, -45.8232421875, -44.396484375, -42.9697265625, -41.54296875, -40.1162109375, -38.689453125, -37.2626953125, -35.8359375, -34.4091796875, -32.982421875, -31.5556640625, -30.12890625, -28.7021484375, -27.275390625, -25.8486328125, -24.421875, -22.9951171875, -21.568359375, -20.1416015625, -18.71484375, -17.2880859375, -15.861328125, -14.4345703125, -13.0078125, -11.5810546875, -10.154296875, -8.7275390625, -7.30078125, -5.8740234375, -4.447265625, -3.0205078125, -1.59375, -0.1669921875, 1.259765625, 2.6865234375, 4.11328125, 5.5400390625, 6.966796875, 8.3935546875, 9.8203125, 11.2470703125, 12.673828125, 14.1005859375, 15.52734375, 16.9541015625, 18.380859375, 19.8076171875, 21.234375, 22.6611328125, 24.087890625, 25.5146484375, 26.94140625, 28.3681640625, 29.794921875, 31.2216796875, 32.6484375, 34.0751953125, 35.501953125, 36.9287109375, 38.35546875, 39.7822265625, 41.208984375, 42.6357421875, 44.0625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 4.0, 13.0, 12.0, 26.0, 18.0, 36.0, 39.0, 38.0, 66.0, 87.0, 114.0, 179.0, 282.0, 715.0, 2858.0, 45459.0, 3073692.0, 18692.0, 1980.0, 522.0, 275.0, 134.0, 98.0, 102.0, 57.0, 37.0, 30.0, 29.0, 21.0, 16.0, 12.0, 11.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-90.75, -87.662109375, -84.57421875, -81.486328125, -78.3984375, -75.310546875, -72.22265625, -69.134765625, -66.046875, -62.958984375, -59.87109375, -56.783203125, -53.6953125, -50.607421875, -47.51953125, -44.431640625, -41.34375, -38.255859375, -35.16796875, -32.080078125, -28.9921875, -25.904296875, -22.81640625, -19.728515625, -16.640625, -13.552734375, -10.46484375, -7.376953125, -4.2890625, -1.201171875, 1.88671875, 4.974609375, 8.0625, 11.150390625, 14.23828125, 17.326171875, 20.4140625, 23.501953125, 26.58984375, 29.677734375, 32.765625, 35.853515625, 38.94140625, 42.029296875, 45.1171875, 48.205078125, 51.29296875, 54.380859375, 57.46875, 60.556640625, 63.64453125, 66.732421875, 69.8203125, 72.908203125, 75.99609375, 79.083984375, 82.171875, 85.259765625, 88.34765625, 91.435546875, 94.5234375, 97.611328125, 100.69921875, 103.787109375, 106.875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 178.0, 830.0, 8.0, 1.0, 0.0, 1.0], "bins": [-1408.3238525390625, -1384.528564453125, -1360.7333984375, -1336.9381103515625, -1313.142822265625, -1289.34765625, -1265.5523681640625, -1241.7572021484375, -1217.9619140625, -1194.1666259765625, -1170.3714599609375, -1146.576171875, -1122.781005859375, -1098.9857177734375, -1075.1904296875, -1051.395263671875, -1027.5999755859375, -1003.8047485351562, -980.009521484375, -956.2142333984375, -932.4190063476562, -908.623779296875, -884.8284912109375, -861.0332641601562, -837.238037109375, -813.4428100585938, -789.6475830078125, -765.852294921875, -742.0570678710938, -718.2618408203125, -694.466552734375, -670.6713256835938, -646.8760986328125, -623.0808715820312, -599.28564453125, -575.4903564453125, -551.6951293945312, -527.89990234375, -504.1046447753906, -480.30938720703125, -456.51416015625, -432.71893310546875, -408.9236755371094, -385.12841796875, -361.33319091796875, -337.5379638671875, -313.7427062988281, -289.94744873046875, -266.1522216796875, -242.3569793701172, -218.56173706054688, -194.76649475097656, -170.97125244140625, -147.17601013183594, -123.38076782226562, -99.58552551269531, -75.79027557373047, -51.995033264160156, -28.199790954589844, -4.404548645019531, 19.39069366455078, 43.185935974121094, 66.9811782836914, 90.77642059326172, 114.57166290283203]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 9.0, 7.0, 6.0, 9.0, 12.0, 17.0, 14.0, 20.0, 25.0, 22.0, 21.0, 29.0, 31.0, 46.0, 27.0, 43.0, 41.0, 39.0, 31.0, 37.0, 39.0, 44.0, 39.0, 39.0, 33.0, 36.0, 41.0, 27.0, 26.0, 23.0, 24.0, 24.0, 25.0, 19.0, 20.0, 12.0, 5.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-100.46959686279297, -97.39745330810547, -94.32530975341797, -91.25316619873047, -88.18102264404297, -85.10887908935547, -82.0367431640625, -78.964599609375, -75.8924560546875, -72.8203125, -69.7481689453125, -66.676025390625, -63.6038818359375, -60.53173828125, -57.459598541259766, -54.387454986572266, -51.3153076171875, -48.2431640625, -45.1710205078125, -42.098876953125, -39.0267333984375, -35.95458984375, -32.882450103759766, -29.810306549072266, -26.738162994384766, -23.666019439697266, -20.593875885009766, -17.5217342376709, -14.449590682983398, -11.377447128295898, -8.305305480957031, -5.233161926269531, -2.1610183715820312, 0.9111247062683105, 3.9832677841186523, 7.055410385131836, 10.127553939819336, 13.199697494506836, 16.271839141845703, 19.343982696533203, 22.416126251220703, 25.488269805908203, 28.560413360595703, 31.63255500793457, 34.70469665527344, 37.77684020996094, 40.84898376464844, 43.92112731933594, 46.99327087402344, 50.06541442871094, 53.13755798339844, 56.20970153808594, 59.28184509277344, 62.35398864746094, 65.42613220214844, 68.49827575683594, 71.57041931152344, 74.64256286621094, 77.71470642089844, 80.78684997558594, 83.85899353027344, 86.93113708496094, 90.00328063964844, 93.07542419433594, 96.1475601196289]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 13.0, 18.0, 18.0, 19.0, 22.0, 26.0, 37.0, 36.0, 27.0, 38.0, 30.0, 51.0, 68.0, 39.0, 51.0, 65.0, 68.0, 57.0, 45.0, 42.0, 34.0, 27.0, 40.0, 33.0, 19.0, 9.0, 11.0, 17.0, 13.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.3848876953125, -11.918212890625, -11.4515380859375, -10.98486328125, -10.5181884765625, -10.051513671875, -9.5848388671875, -9.1181640625, -8.6514892578125, -8.184814453125, -7.7181396484375, -7.25146484375, -6.7847900390625, -6.318115234375, -5.8514404296875, -5.384765625, -4.9180908203125, -4.451416015625, -3.9847412109375, -3.51806640625, -3.0513916015625, -2.584716796875, -2.1180419921875, -1.6513671875, -1.1846923828125, -0.718017578125, -0.2513427734375, 0.21533203125, 0.6820068359375, 1.148681640625, 1.6153564453125, 2.08203125, 2.5487060546875, 3.015380859375, 3.4820556640625, 3.94873046875, 4.4154052734375, 4.882080078125, 5.3487548828125, 5.8154296875, 6.2821044921875, 6.748779296875, 7.2154541015625, 7.68212890625, 8.1488037109375, 8.615478515625, 9.0821533203125, 9.548828125, 10.0155029296875, 10.482177734375, 10.9488525390625, 11.41552734375, 11.8822021484375, 12.348876953125, 12.8155517578125, 13.2822265625, 13.7489013671875, 14.215576171875, 14.6822509765625, 15.14892578125, 15.6156005859375, 16.082275390625, 16.5489501953125, 17.015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 12.0, 20.0, 17.0, 16.0, 16.0, 30.0, 32.0, 51.0, 83.0, 140.0, 449.0, 1182.0, 4153.0, 20147.0, 589019.0, 3496762.0, 70688.0, 8200.0, 2006.0, 640.0, 244.0, 118.0, 67.0, 57.0, 34.0, 23.0, 9.0, 10.0, 17.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.8125, -43.1064453125, -41.400390625, -39.6943359375, -37.98828125, -36.2822265625, -34.576171875, -32.8701171875, -31.1640625, -29.4580078125, -27.751953125, -26.0458984375, -24.33984375, -22.6337890625, -20.927734375, -19.2216796875, -17.515625, -15.8095703125, -14.103515625, -12.3974609375, -10.69140625, -8.9853515625, -7.279296875, -5.5732421875, -3.8671875, -2.1611328125, -0.455078125, 1.2509765625, 2.95703125, 4.6630859375, 6.369140625, 8.0751953125, 9.78125, 11.4873046875, 13.193359375, 14.8994140625, 16.60546875, 18.3115234375, 20.017578125, 21.7236328125, 23.4296875, 25.1357421875, 26.841796875, 28.5478515625, 30.25390625, 31.9599609375, 33.666015625, 35.3720703125, 37.078125, 38.7841796875, 40.490234375, 42.1962890625, 43.90234375, 45.6083984375, 47.314453125, 49.0205078125, 50.7265625, 52.4326171875, 54.138671875, 55.8447265625, 57.55078125, 59.2568359375, 60.962890625, 62.6689453125, 64.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 15.0, 5.0, 7.0, 15.0, 19.0, 21.0, 35.0, 69.0, 70.0, 119.0, 224.0, 410.0, 712.0, 886.0, 640.0, 396.0, 156.0, 79.0, 63.0, 44.0, 27.0, 17.0, 20.0, 9.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.97705078125, -33.8603515625, -32.74365234375, -31.626953125, -30.51025390625, -29.3935546875, -28.27685546875, -27.16015625, -26.04345703125, -24.9267578125, -23.81005859375, -22.693359375, -21.57666015625, -20.4599609375, -19.34326171875, -18.2265625, -17.10986328125, -15.9931640625, -14.87646484375, -13.759765625, -12.64306640625, -11.5263671875, -10.40966796875, -9.29296875, -8.17626953125, -7.0595703125, -5.94287109375, -4.826171875, -3.70947265625, -2.5927734375, -1.47607421875, -0.359375, 0.75732421875, 1.8740234375, 2.99072265625, 4.107421875, 5.22412109375, 6.3408203125, 7.45751953125, 8.57421875, 9.69091796875, 10.8076171875, 11.92431640625, 13.041015625, 14.15771484375, 15.2744140625, 16.39111328125, 17.5078125, 18.62451171875, 19.7412109375, 20.85791015625, 21.974609375, 23.09130859375, 24.2080078125, 25.32470703125, 26.44140625, 27.55810546875, 28.6748046875, 29.79150390625, 30.908203125, 32.02490234375, 33.1416015625, 34.25830078125, 35.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 25.0, 30.0, 44.0, 80.0, 149.0, 338.0, 1073.0, 4737.0, 41737.0, 2965491.0, 1149681.0, 25876.0, 3531.0, 784.0, 287.0, 156.0, 90.0, 45.0, 28.0, 18.0, 23.0, 7.0, 10.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.6875, -75.2529296875, -72.818359375, -70.3837890625, -67.94921875, -65.5146484375, -63.080078125, -60.6455078125, -58.2109375, -55.7763671875, -53.341796875, -50.9072265625, -48.47265625, -46.0380859375, -43.603515625, -41.1689453125, -38.734375, -36.2998046875, -33.865234375, -31.4306640625, -28.99609375, -26.5615234375, -24.126953125, -21.6923828125, -19.2578125, -16.8232421875, -14.388671875, -11.9541015625, -9.51953125, -7.0849609375, -4.650390625, -2.2158203125, 0.21875, 2.6533203125, 5.087890625, 7.5224609375, 9.95703125, 12.3916015625, 14.826171875, 17.2607421875, 19.6953125, 22.1298828125, 24.564453125, 26.9990234375, 29.43359375, 31.8681640625, 34.302734375, 36.7373046875, 39.171875, 41.6064453125, 44.041015625, 46.4755859375, 48.91015625, 51.3447265625, 53.779296875, 56.2138671875, 58.6484375, 61.0830078125, 63.517578125, 65.9521484375, 68.38671875, 70.8212890625, 73.255859375, 75.6904296875, 78.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 35.0, 118.0, 250.0, 328.0, 175.0, 62.0, 25.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.44061279296875, -302.3659362792969, -293.2912902832031, -284.21661376953125, -275.1419677734375, -266.0672912597656, -256.9926452636719, -247.91796875, -238.84332275390625, -229.76866149902344, -220.69400024414062, -211.6193389892578, -202.544677734375, -193.4700164794922, -184.39535522460938, -175.3206787109375, -166.2460174560547, -157.17135620117188, -148.09669494628906, -139.02203369140625, -129.94737243652344, -120.87271118164062, -111.79804229736328, -102.72338104248047, -93.64871978759766, -84.57405853271484, -75.49939727783203, -66.42472839355469, -57.35007095336914, -48.27540969848633, -39.20074462890625, -30.126083374023438, -21.051422119140625, -11.976759910583496, -2.902097702026367, 6.172565460205078, 15.24722671508789, 24.321887969970703, 33.39655303955078, 42.471214294433594, 51.545875549316406, 60.62053680419922, 69.69519805908203, 78.76986694335938, 87.84452819824219, 96.919189453125, 105.99385070800781, 115.06851196289062, 124.14317321777344, 133.21783447265625, 142.29249572753906, 151.36715698242188, 160.4418182373047, 169.5164794921875, 178.59115600585938, 187.66580200195312, 196.740478515625, 205.8151397705078, 214.88980102539062, 223.96446228027344, 233.03912353515625, 242.11378479003906, 251.18844604492188, 260.26312255859375, 269.3377685546875]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 3.0, 6.0, 16.0, 19.0, 18.0, 15.0, 19.0, 17.0, 24.0, 13.0, 29.0, 23.0, 21.0, 34.0, 33.0, 29.0, 38.0, 38.0, 36.0, 47.0, 33.0, 45.0, 45.0, 40.0, 37.0, 29.0, 26.0, 30.0, 26.0, 14.0, 20.0, 22.0, 25.0, 20.0, 14.0, 15.0, 15.0, 11.0, 8.0, 4.0, 10.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-65.13229370117188, -62.97682571411133, -60.821353912353516, -58.66588592529297, -56.510414123535156, -54.35494613647461, -52.19947814941406, -50.04400634765625, -47.8885383605957, -45.733070373535156, -43.577598571777344, -41.4221305847168, -39.26666259765625, -37.11119079589844, -34.95572280883789, -32.800254821777344, -30.64478302001953, -28.48931312561035, -26.333843231201172, -24.178375244140625, -22.022905349731445, -19.867435455322266, -17.71196746826172, -15.556497573852539, -13.40102767944336, -11.24555778503418, -9.090088844299316, -6.934619426727295, -4.779150009155273, -2.6236801147460938, -0.46821117401123047, 1.6872577667236328, 3.8427276611328125, 5.998197078704834, 8.153666496276855, 10.309135437011719, 12.464605331420898, 14.620075225830078, 16.775543212890625, 18.931013107299805, 21.086483001708984, 23.241952896118164, 25.397422790527344, 27.55289077758789, 29.70836067199707, 31.86383056640625, 34.0192985534668, 36.174766540527344, 38.330238342285156, 40.4857063293457, 42.641178131103516, 44.79664611816406, 46.952117919921875, 49.10758590698242, 51.26305389404297, 53.41852569580078, 55.57399368286133, 57.729461669921875, 59.88493347167969, 62.040401458740234, 64.19586944580078, 66.3513412475586, 68.5068130493164, 70.66227722167969, 72.8177490234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 11.0, 16.0, 16.0, 12.0, 23.0, 13.0, 21.0, 24.0, 25.0, 23.0, 36.0, 33.0, 39.0, 43.0, 38.0, 45.0, 51.0, 62.0, 48.0, 48.0, 37.0, 52.0, 43.0, 36.0, 31.0, 30.0, 23.0, 22.0, 25.0, 18.0, 13.0, 4.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.617431640625, -10.21142578125, -9.805419921875, -9.3994140625, -8.993408203125, -8.58740234375, -8.181396484375, -7.775390625, -7.369384765625, -6.96337890625, -6.557373046875, -6.1513671875, -5.745361328125, -5.33935546875, -4.933349609375, -4.52734375, -4.121337890625, -3.71533203125, -3.309326171875, -2.9033203125, -2.497314453125, -2.09130859375, -1.685302734375, -1.279296875, -0.873291015625, -0.46728515625, -0.061279296875, 0.3447265625, 0.750732421875, 1.15673828125, 1.562744140625, 1.96875, 2.374755859375, 2.78076171875, 3.186767578125, 3.5927734375, 3.998779296875, 4.40478515625, 4.810791015625, 5.216796875, 5.622802734375, 6.02880859375, 6.434814453125, 6.8408203125, 7.246826171875, 7.65283203125, 8.058837890625, 8.46484375, 8.870849609375, 9.27685546875, 9.682861328125, 10.0888671875, 10.494873046875, 10.90087890625, 11.306884765625, 11.712890625, 12.118896484375, 12.52490234375, 12.930908203125, 13.3369140625, 13.742919921875, 14.14892578125, 14.554931640625, 14.9609375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 3.0, 9.0, 15.0, 14.0, 27.0, 34.0, 67.0, 106.0, 145.0, 218.0, 332.0, 500.0, 790.0, 1151.0, 1770.0, 2693.0, 4203.0, 6459.0, 10296.0, 16638.0, 27387.0, 45926.0, 76804.0, 127554.0, 196307.0, 198143.0, 130193.0, 78920.0, 47005.0, 28150.0, 17072.0, 10796.0, 6677.0, 4251.0, 2708.0, 1770.0, 1133.0, 822.0, 483.0, 337.0, 238.0, 143.0, 96.0, 59.0, 42.0, 24.0, 20.0, 8.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.984375, -1.9224090576171875, -1.860443115234375, -1.7984771728515625, -1.73651123046875, -1.6745452880859375, -1.612579345703125, -1.5506134033203125, -1.4886474609375, -1.4266815185546875, -1.364715576171875, -1.3027496337890625, -1.24078369140625, -1.1788177490234375, -1.116851806640625, -1.0548858642578125, -0.992919921875, -0.9309539794921875, -0.868988037109375, -0.8070220947265625, -0.74505615234375, -0.6830902099609375, -0.621124267578125, -0.5591583251953125, -0.4971923828125, -0.4352264404296875, -0.373260498046875, -0.3112945556640625, -0.24932861328125, -0.1873626708984375, -0.125396728515625, -0.0634307861328125, -0.00146484375, 0.0605010986328125, 0.122467041015625, 0.1844329833984375, 0.24639892578125, 0.3083648681640625, 0.370330810546875, 0.4322967529296875, 0.4942626953125, 0.5562286376953125, 0.618194580078125, 0.6801605224609375, 0.74212646484375, 0.8040924072265625, 0.866058349609375, 0.9280242919921875, 0.989990234375, 1.0519561767578125, 1.113922119140625, 1.1758880615234375, 1.23785400390625, 1.2998199462890625, 1.361785888671875, 1.4237518310546875, 1.4857177734375, 1.5476837158203125, 1.609649658203125, 1.6716156005859375, 1.73358154296875, 1.7955474853515625, 1.857513427734375, 1.9194793701171875, 1.9814453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 7.0, 6.0, 7.0, 14.0, 14.0, 12.0, 24.0, 25.0, 27.0, 24.0, 23.0, 28.0, 40.0, 42.0, 40.0, 47.0, 37.0, 35.0, 1067.0, 47.0, 42.0, 37.0, 37.0, 25.0, 33.0, 34.0, 40.0, 36.0, 17.0, 32.0, 21.0, 12.0, 14.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.59375, -8.336181640625, -8.07861328125, -7.821044921875, -7.5634765625, -7.305908203125, -7.04833984375, -6.790771484375, -6.533203125, -6.275634765625, -6.01806640625, -5.760498046875, -5.5029296875, -5.245361328125, -4.98779296875, -4.730224609375, -4.47265625, -4.215087890625, -3.95751953125, -3.699951171875, -3.4423828125, -3.184814453125, -2.92724609375, -2.669677734375, -2.412109375, -2.154541015625, -1.89697265625, -1.639404296875, -1.3818359375, -1.124267578125, -0.86669921875, -0.609130859375, -0.3515625, -0.093994140625, 0.16357421875, 0.421142578125, 0.6787109375, 0.936279296875, 1.19384765625, 1.451416015625, 1.708984375, 1.966552734375, 2.22412109375, 2.481689453125, 2.7392578125, 2.996826171875, 3.25439453125, 3.511962890625, 3.76953125, 4.027099609375, 4.28466796875, 4.542236328125, 4.7998046875, 5.057373046875, 5.31494140625, 5.572509765625, 5.830078125, 6.087646484375, 6.34521484375, 6.602783203125, 6.8603515625, 7.117919921875, 7.37548828125, 7.633056640625, 7.890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 11.0, 13.0, 30.0, 33.0, 46.0, 73.0, 111.0, 171.0, 225.0, 370.0, 446.0, 802.0, 1308.0, 1978.0, 3112.0, 4941.0, 8122.0, 13218.0, 21679.0, 36798.0, 63178.0, 110043.0, 183275.0, 1268947.0, 156714.0, 91325.0, 52123.0, 30317.0, 18089.0, 10980.0, 6965.0, 4225.0, 2635.0, 1653.0, 1053.0, 668.0, 479.0, 334.0, 195.0, 132.0, 106.0, 64.0, 42.0, 36.0, 25.0, 9.0, 6.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.189453125, -1.1514892578125, -1.113525390625, -1.0755615234375, -1.03759765625, -0.9996337890625, -0.961669921875, -0.9237060546875, -0.8857421875, -0.8477783203125, -0.809814453125, -0.7718505859375, -0.73388671875, -0.6959228515625, -0.657958984375, -0.6199951171875, -0.58203125, -0.5440673828125, -0.506103515625, -0.4681396484375, -0.43017578125, -0.3922119140625, -0.354248046875, -0.3162841796875, -0.2783203125, -0.2403564453125, -0.202392578125, -0.1644287109375, -0.12646484375, -0.0885009765625, -0.050537109375, -0.0125732421875, 0.025390625, 0.0633544921875, 0.101318359375, 0.1392822265625, 0.17724609375, 0.2152099609375, 0.253173828125, 0.2911376953125, 0.3291015625, 0.3670654296875, 0.405029296875, 0.4429931640625, 0.48095703125, 0.5189208984375, 0.556884765625, 0.5948486328125, 0.6328125, 0.6707763671875, 0.708740234375, 0.7467041015625, 0.78466796875, 0.8226318359375, 0.860595703125, 0.8985595703125, 0.9365234375, 0.9744873046875, 1.012451171875, 1.0504150390625, 1.08837890625, 1.1263427734375, 1.164306640625, 1.2022705078125, 1.240234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 11.0, 8.0, 5.0, 17.0, 17.0, 24.0, 34.0, 43.0, 49.0, 73.0, 120.0, 191.0, 128.0, 69.0, 47.0, 43.0, 17.0, 25.0, 15.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.040712833404541016, -0.03928089141845703, -0.03784894943237305, -0.03641700744628906, -0.03498506546020508, -0.033553123474121094, -0.03212118148803711, -0.030689239501953125, -0.02925729751586914, -0.027825355529785156, -0.026393413543701172, -0.024961471557617188, -0.023529529571533203, -0.02209758758544922, -0.020665645599365234, -0.01923370361328125, -0.017801761627197266, -0.01636981964111328, -0.014937877655029297, -0.013505935668945312, -0.012073993682861328, -0.010642051696777344, -0.00921010971069336, -0.007778167724609375, -0.006346225738525391, -0.004914283752441406, -0.003482341766357422, -0.0020503997802734375, -0.0006184577941894531, 0.0008134841918945312, 0.0022454261779785156, 0.0036773681640625, 0.005109310150146484, 0.006541252136230469, 0.007973194122314453, 0.009405136108398438, 0.010837078094482422, 0.012269020080566406, 0.01370096206665039, 0.015132904052734375, 0.01656484603881836, 0.017996788024902344, 0.019428730010986328, 0.020860671997070312, 0.022292613983154297, 0.02372455596923828, 0.025156497955322266, 0.02658843994140625, 0.028020381927490234, 0.02945232391357422, 0.030884265899658203, 0.03231620788574219, 0.03374814987182617, 0.035180091857910156, 0.03661203384399414, 0.038043975830078125, 0.03947591781616211, 0.040907859802246094, 0.04233980178833008, 0.04377174377441406, 0.04520368576049805, 0.04663562774658203, 0.048067569732666016, 0.04949951171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 10.0, 9.0, 16.0, 20.0, 41.0, 55.0, 90.0, 182.0, 767.0, 18342.0, 1021624.0, 6430.0, 505.0, 161.0, 81.0, 57.0, 38.0, 29.0, 13.0, 17.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.05078125, -1.0202255249023438, -0.9896697998046875, -0.9591140747070312, -0.928558349609375, -0.8980026245117188, -0.8674468994140625, -0.8368911743164062, -0.80633544921875, -0.7757797241210938, -0.7452239990234375, -0.7146682739257812, -0.684112548828125, -0.6535568237304688, -0.6230010986328125, -0.5924453735351562, -0.5618896484375, -0.5313339233398438, -0.5007781982421875, -0.47022247314453125, -0.439666748046875, -0.40911102294921875, -0.3785552978515625, -0.34799957275390625, -0.31744384765625, -0.28688812255859375, -0.2563323974609375, -0.22577667236328125, -0.195220947265625, -0.16466522216796875, -0.1341094970703125, -0.10355377197265625, -0.072998046875, -0.04244232177734375, -0.0118865966796875, 0.01866912841796875, 0.049224853515625, 0.07978057861328125, 0.1103363037109375, 0.14089202880859375, 0.17144775390625, 0.20200347900390625, 0.2325592041015625, 0.26311492919921875, 0.293670654296875, 0.32422637939453125, 0.3547821044921875, 0.38533782958984375, 0.4158935546875, 0.44644927978515625, 0.4770050048828125, 0.5075607299804688, 0.538116455078125, 0.5686721801757812, 0.5992279052734375, 0.6297836303710938, 0.66033935546875, 0.6908950805664062, 0.7214508056640625, 0.7520065307617188, 0.782562255859375, 0.8131179809570312, 0.8436737060546875, 0.8742294311523438, 0.90478515625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 25.0, 114.0, 479.0, 285.0, 62.0, 17.0, 15.0, 7.0], "bins": [-0.5228639245033264, -0.5139737129211426, -0.505083441734314, -0.4961932301521301, -0.4873030185699463, -0.47841277718544006, -0.4695225656032562, -0.46063232421875, -0.45174211263656616, -0.44285187125205994, -0.4339616596698761, -0.4250714182853699, -0.41618120670318604, -0.4072909653186798, -0.39840075373649597, -0.38951051235198975, -0.3806202709674835, -0.3717300295829773, -0.36283981800079346, -0.35394957661628723, -0.3450593650341034, -0.33616912364959717, -0.32727891206741333, -0.3183886706829071, -0.3094984292984009, -0.30060818791389465, -0.2917179763317108, -0.2828277349472046, -0.27393752336502075, -0.2650472819805145, -0.2561570703983307, -0.24726682901382446, -0.23837663233280182, -0.2294864058494568, -0.22059617936611176, -0.21170595288276672, -0.2028157114982605, -0.19392549991607666, -0.18503525853157043, -0.1761450320482254, -0.16725480556488037, -0.15836457908153534, -0.1494743525981903, -0.14058412611484528, -0.13169389963150024, -0.12280366569757462, -0.11391343176364899, -0.10502320528030396, -0.09613297879695892, -0.08724275231361389, -0.07835252583026886, -0.06946229189634323, -0.0605720654129982, -0.05168183892965317, -0.04279160872101784, -0.03390137851238251, -0.025011155754327774, -0.016120927408337593, -0.007230699062347412, 0.0016595292836427689, 0.01054975762963295, 0.01943998411297798, 0.028330214321613312, 0.03722044453024864, 0.046110671013593674]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 13.0, 3.0, 13.0, 16.0, 13.0, 21.0, 12.0, 13.0, 24.0, 25.0, 24.0, 34.0, 36.0, 41.0, 39.0, 39.0, 50.0, 40.0, 53.0, 45.0, 35.0, 40.0, 45.0, 42.0, 38.0, 31.0, 38.0, 24.0, 30.0, 11.0, 17.0, 19.0, 16.0, 10.0, 7.0, 12.0, 8.0, 10.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04622715711593628, -0.044882070273160934, -0.04353698343038559, -0.042191896587610245, -0.0408468097448349, -0.039501722902059555, -0.03815663605928421, -0.036811549216508865, -0.03546646237373352, -0.034121375530958176, -0.03277628868818283, -0.031431201845407486, -0.03008611500263214, -0.028741028159856796, -0.02739594131708145, -0.026050854474306107, -0.02470576763153076, -0.023360680788755417, -0.022015593945980072, -0.020670507103204727, -0.019325420260429382, -0.017980333417654037, -0.016635246574878693, -0.015290159732103348, -0.013945072889328003, -0.012599986046552658, -0.011254899203777313, -0.009909812361001968, -0.008564725518226624, -0.007219638675451279, -0.005874551832675934, -0.004529464989900589, -0.003184378147125244, -0.0018392913043498993, -0.0004942044615745544, 0.0008508823812007904, 0.0021959692239761353, 0.00354105606675148, 0.004886142909526825, 0.00623122975230217, 0.007576316595077515, 0.00892140343785286, 0.010266490280628204, 0.01161157712340355, 0.012956663966178894, 0.014301750808954239, 0.015646837651729584, 0.01699192449450493, 0.018337011337280273, 0.01968209818005562, 0.021027185022830963, 0.022372271865606308, 0.023717358708381653, 0.025062445551156998, 0.026407532393932343, 0.027752619236707687, 0.029097706079483032, 0.030442792922258377, 0.03178787976503372, 0.03313296660780907, 0.03447805345058441, 0.035823140293359756, 0.0371682271361351, 0.038513313978910446, 0.03985840082168579]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 17.0, 16.0, 12.0, 23.0, 13.0, 21.0, 24.0, 24.0, 24.0, 36.0, 33.0, 39.0, 43.0, 38.0, 46.0, 50.0, 62.0, 48.0, 48.0, 37.0, 52.0, 44.0, 35.0, 31.0, 30.0, 23.0, 22.0, 25.0, 18.0, 13.0, 4.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.617431640625, -10.21142578125, -9.805419921875, -9.3994140625, -8.993408203125, -8.58740234375, -8.181396484375, -7.775390625, -7.369384765625, -6.96337890625, -6.557373046875, -6.1513671875, -5.745361328125, -5.33935546875, -4.933349609375, -4.52734375, -4.121337890625, -3.71533203125, -3.309326171875, -2.9033203125, -2.497314453125, -2.09130859375, -1.685302734375, -1.279296875, -0.873291015625, -0.46728515625, -0.061279296875, 0.3447265625, 0.750732421875, 1.15673828125, 1.562744140625, 1.96875, 2.374755859375, 2.78076171875, 3.186767578125, 3.5927734375, 3.998779296875, 4.40478515625, 4.810791015625, 5.216796875, 5.622802734375, 6.02880859375, 6.434814453125, 6.8408203125, 7.246826171875, 7.65283203125, 8.058837890625, 8.46484375, 8.870849609375, 9.27685546875, 9.682861328125, 10.0888671875, 10.494873046875, 10.90087890625, 11.306884765625, 11.712890625, 12.118896484375, 12.52490234375, 12.930908203125, 13.3369140625, 13.742919921875, 14.14892578125, 14.554931640625, 14.9609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 3.0, 6.0, 13.0, 13.0, 15.0, 21.0, 34.0, 71.0, 101.0, 122.0, 199.0, 312.0, 541.0, 927.0, 1461.0, 2658.0, 4800.0, 9231.0, 20126.0, 57004.0, 495301.0, 368560.0, 49167.0, 18292.0, 8753.0, 4603.0, 2566.0, 1442.0, 814.0, 504.0, 316.0, 193.0, 128.0, 70.0, 50.0, 38.0, 21.0, 17.0, 21.0, 10.0, 3.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.0625, -23.284912109375, -22.50732421875, -21.729736328125, -20.9521484375, -20.174560546875, -19.39697265625, -18.619384765625, -17.841796875, -17.064208984375, -16.28662109375, -15.509033203125, -14.7314453125, -13.953857421875, -13.17626953125, -12.398681640625, -11.62109375, -10.843505859375, -10.06591796875, -9.288330078125, -8.5107421875, -7.733154296875, -6.95556640625, -6.177978515625, -5.400390625, -4.622802734375, -3.84521484375, -3.067626953125, -2.2900390625, -1.512451171875, -0.73486328125, 0.042724609375, 0.8203125, 1.597900390625, 2.37548828125, 3.153076171875, 3.9306640625, 4.708251953125, 5.48583984375, 6.263427734375, 7.041015625, 7.818603515625, 8.59619140625, 9.373779296875, 10.1513671875, 10.928955078125, 11.70654296875, 12.484130859375, 13.26171875, 14.039306640625, 14.81689453125, 15.594482421875, 16.3720703125, 17.149658203125, 17.92724609375, 18.704833984375, 19.482421875, 20.260009765625, 21.03759765625, 21.815185546875, 22.5927734375, 23.370361328125, 24.14794921875, 24.925537109375, 25.703125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 6.0, 21.0, 14.0, 18.0, 22.0, 31.0, 33.0, 48.0, 34.0, 31.0, 44.0, 61.0, 83.0, 122.0, 310.0, 1512.0, 164.0, 81.0, 55.0, 37.0, 47.0, 38.0, 30.0, 26.0, 21.0, 13.0, 28.0, 20.0, 15.0, 11.0, 15.0, 9.0, 9.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-42.59375, -41.3095703125, -40.025390625, -38.7412109375, -37.45703125, -36.1728515625, -34.888671875, -33.6044921875, -32.3203125, -31.0361328125, -29.751953125, -28.4677734375, -27.18359375, -25.8994140625, -24.615234375, -23.3310546875, -22.046875, -20.7626953125, -19.478515625, -18.1943359375, -16.91015625, -15.6259765625, -14.341796875, -13.0576171875, -11.7734375, -10.4892578125, -9.205078125, -7.9208984375, -6.63671875, -5.3525390625, -4.068359375, -2.7841796875, -1.5, -0.2158203125, 1.068359375, 2.3525390625, 3.63671875, 4.9208984375, 6.205078125, 7.4892578125, 8.7734375, 10.0576171875, 11.341796875, 12.6259765625, 13.91015625, 15.1943359375, 16.478515625, 17.7626953125, 19.046875, 20.3310546875, 21.615234375, 22.8994140625, 24.18359375, 25.4677734375, 26.751953125, 28.0361328125, 29.3203125, 30.6044921875, 31.888671875, 33.1728515625, 34.45703125, 35.7412109375, 37.025390625, 38.3095703125, 39.59375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 11.0, 12.0, 12.0, 18.0, 12.0, 32.0, 43.0, 41.0, 51.0, 82.0, 83.0, 130.0, 206.0, 363.0, 1502.0, 15700.0, 2848897.0, 269915.0, 6695.0, 878.0, 344.0, 164.0, 123.0, 81.0, 79.0, 54.0, 41.0, 26.0, 34.0, 13.0, 12.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.5, -84.357421875, -81.21484375, -78.072265625, -74.9296875, -71.787109375, -68.64453125, -65.501953125, -62.359375, -59.216796875, -56.07421875, -52.931640625, -49.7890625, -46.646484375, -43.50390625, -40.361328125, -37.21875, -34.076171875, -30.93359375, -27.791015625, -24.6484375, -21.505859375, -18.36328125, -15.220703125, -12.078125, -8.935546875, -5.79296875, -2.650390625, 0.4921875, 3.634765625, 6.77734375, 9.919921875, 13.0625, 16.205078125, 19.34765625, 22.490234375, 25.6328125, 28.775390625, 31.91796875, 35.060546875, 38.203125, 41.345703125, 44.48828125, 47.630859375, 50.7734375, 53.916015625, 57.05859375, 60.201171875, 63.34375, 66.486328125, 69.62890625, 72.771484375, 75.9140625, 79.056640625, 82.19921875, 85.341796875, 88.484375, 91.626953125, 94.76953125, 97.912109375, 101.0546875, 104.197265625, 107.33984375, 110.482421875, 113.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 17.0, 58.0, 238.0, 449.0, 183.0, 44.0, 16.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.0624694824219, -285.7979736328125, -278.5334777832031, -271.2690124511719, -264.0045166015625, -256.7400207519531, -249.47552490234375, -242.21102905273438, -234.94654846191406, -227.6820526123047, -220.41757202148438, -213.153076171875, -205.88858032226562, -198.6240997314453, -191.35960388183594, -184.09512329101562, -176.83062744140625, -169.56613159179688, -162.30165100097656, -155.0371551513672, -147.77267456054688, -140.5081787109375, -133.24368286132812, -125.97919464111328, -118.71470642089844, -111.4502182006836, -104.18572998046875, -96.92123413085938, -89.65674591064453, -82.39225769042969, -75.12776184082031, -67.86327362060547, -60.59877014160156, -53.33428192138672, -46.06978988647461, -38.8052978515625, -31.540809631347656, -24.276321411132812, -17.011829376220703, -9.747337341308594, -2.48284912109375, 4.781641006469727, 12.046131134033203, 19.31062126159668, 26.575111389160156, 33.839599609375, 41.10409164428711, 48.36858367919922, 55.63307189941406, 62.897560119628906, 70.16204833984375, 77.42654418945312, 84.69103240966797, 91.95552062988281, 99.22001647949219, 106.48450469970703, 113.74899291992188, 121.01348114013672, 128.27796936035156, 135.54246520996094, 142.80694580078125, 150.07144165039062, 157.3359375, 164.60043334960938, 171.8649139404297]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 3.0, 11.0, 10.0, 14.0, 10.0, 10.0, 18.0, 19.0, 31.0, 28.0, 31.0, 26.0, 31.0, 38.0, 37.0, 41.0, 36.0, 50.0, 40.0, 45.0, 42.0, 46.0, 52.0, 45.0, 37.0, 32.0, 33.0, 32.0, 16.0, 9.0, 19.0, 17.0, 10.0, 10.0, 13.0, 5.0, 7.0, 8.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.7728271484375, -100.11311340332031, -96.45339965820312, -92.79368591308594, -89.13397216796875, -85.47425842285156, -81.8145523071289, -78.15483856201172, -74.49512481689453, -70.83541107177734, -67.17569732666016, -63.515987396240234, -59.85627365112305, -56.19655990600586, -52.53684997558594, -48.87713623046875, -45.21742248535156, -41.557708740234375, -37.89799499511719, -34.238285064697266, -30.578571319580078, -26.91885757446289, -23.259145736694336, -19.59943389892578, -15.939720153808594, -12.280007362365723, -8.620294570922852, -4.9605817794799805, -1.3008689880371094, 2.358844757080078, 6.018556594848633, 9.678268432617188, 13.337982177734375, 16.997695922851562, 20.657407760620117, 24.317119598388672, 27.97683334350586, 31.636547088623047, 35.29625701904297, 38.955970764160156, 42.615684509277344, 46.27539825439453, 49.93511199951172, 53.59482192993164, 57.25453567504883, 60.914249420166016, 64.57395935058594, 68.23367309570312, 71.89338684082031, 75.5531005859375, 79.21281433105469, 82.87252807617188, 86.53224182128906, 90.19195556640625, 93.8516616821289, 97.5113754272461, 101.17108917236328, 104.83080291748047, 108.49051666259766, 112.15023040771484, 115.8099365234375, 119.46965026855469, 123.12936401367188, 126.78907775878906, 130.44879150390625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 16.0, 18.0, 17.0, 26.0, 23.0, 30.0, 28.0, 26.0, 30.0, 44.0, 38.0, 49.0, 54.0, 48.0, 55.0, 51.0, 48.0, 43.0, 46.0, 43.0, 32.0, 34.0, 39.0, 22.0, 21.0, 18.0, 18.0, 5.0, 15.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.224365234375, -10.77685546875, -10.329345703125, -9.8818359375, -9.434326171875, -8.98681640625, -8.539306640625, -8.091796875, -7.644287109375, -7.19677734375, -6.749267578125, -6.3017578125, -5.854248046875, -5.40673828125, -4.959228515625, -4.51171875, -4.064208984375, -3.61669921875, -3.169189453125, -2.7216796875, -2.274169921875, -1.82666015625, -1.379150390625, -0.931640625, -0.484130859375, -0.03662109375, 0.410888671875, 0.8583984375, 1.305908203125, 1.75341796875, 2.200927734375, 2.6484375, 3.095947265625, 3.54345703125, 3.990966796875, 4.4384765625, 4.885986328125, 5.33349609375, 5.781005859375, 6.228515625, 6.676025390625, 7.12353515625, 7.571044921875, 8.0185546875, 8.466064453125, 8.91357421875, 9.361083984375, 9.80859375, 10.256103515625, 10.70361328125, 11.151123046875, 11.5986328125, 12.046142578125, 12.49365234375, 12.941162109375, 13.388671875, 13.836181640625, 14.28369140625, 14.731201171875, 15.1787109375, 15.626220703125, 16.07373046875, 16.521240234375, 16.96875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 9.0, 17.0, 14.0, 17.0, 9.0, 27.0, 21.0, 31.0, 36.0, 37.0, 93.0, 229.0, 781.0, 2750.0, 12495.0, 163052.0, 3651671.0, 343241.0, 15198.0, 3029.0, 845.0, 295.0, 108.0, 69.0, 45.0, 34.0, 21.0, 25.0, 16.0, 16.0, 10.0, 10.0, 7.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.9375, -39.3369140625, -37.736328125, -36.1357421875, -34.53515625, -32.9345703125, -31.333984375, -29.7333984375, -28.1328125, -26.5322265625, -24.931640625, -23.3310546875, -21.73046875, -20.1298828125, -18.529296875, -16.9287109375, -15.328125, -13.7275390625, -12.126953125, -10.5263671875, -8.92578125, -7.3251953125, -5.724609375, -4.1240234375, -2.5234375, -0.9228515625, 0.677734375, 2.2783203125, 3.87890625, 5.4794921875, 7.080078125, 8.6806640625, 10.28125, 11.8818359375, 13.482421875, 15.0830078125, 16.68359375, 18.2841796875, 19.884765625, 21.4853515625, 23.0859375, 24.6865234375, 26.287109375, 27.8876953125, 29.48828125, 31.0888671875, 32.689453125, 34.2900390625, 35.890625, 37.4912109375, 39.091796875, 40.6923828125, 42.29296875, 43.8935546875, 45.494140625, 47.0947265625, 48.6953125, 50.2958984375, 51.896484375, 53.4970703125, 55.09765625, 56.6982421875, 58.298828125, 59.8994140625, 61.5]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 7.0, 5.0, 14.0, 18.0, 33.0, 29.0, 36.0, 57.0, 102.0, 103.0, 186.0, 270.0, 413.0, 606.0, 661.0, 518.0, 337.0, 194.0, 136.0, 92.0, 48.0, 46.0, 35.0, 30.0, 18.0, 10.0, 14.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.375, -22.54541015625, -21.7158203125, -20.88623046875, -20.056640625, -19.22705078125, -18.3974609375, -17.56787109375, -16.73828125, -15.90869140625, -15.0791015625, -14.24951171875, -13.419921875, -12.59033203125, -11.7607421875, -10.93115234375, -10.1015625, -9.27197265625, -8.4423828125, -7.61279296875, -6.783203125, -5.95361328125, -5.1240234375, -4.29443359375, -3.46484375, -2.63525390625, -1.8056640625, -0.97607421875, -0.146484375, 0.68310546875, 1.5126953125, 2.34228515625, 3.171875, 4.00146484375, 4.8310546875, 5.66064453125, 6.490234375, 7.31982421875, 8.1494140625, 8.97900390625, 9.80859375, 10.63818359375, 11.4677734375, 12.29736328125, 13.126953125, 13.95654296875, 14.7861328125, 15.61572265625, 16.4453125, 17.27490234375, 18.1044921875, 18.93408203125, 19.763671875, 20.59326171875, 21.4228515625, 22.25244140625, 23.08203125, 23.91162109375, 24.7412109375, 25.57080078125, 26.400390625, 27.22998046875, 28.0595703125, 28.88916015625, 29.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 7.0, 11.0, 15.0, 25.0, 28.0, 35.0, 58.0, 79.0, 119.0, 282.0, 763.0, 3381.0, 37675.0, 3582988.0, 552556.0, 13286.0, 1808.0, 493.0, 228.0, 138.0, 97.0, 41.0, 41.0, 30.0, 21.0, 16.0, 5.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-102.0625, -99.212890625, -96.36328125, -93.513671875, -90.6640625, -87.814453125, -84.96484375, -82.115234375, -79.265625, -76.416015625, -73.56640625, -70.716796875, -67.8671875, -65.017578125, -62.16796875, -59.318359375, -56.46875, -53.619140625, -50.76953125, -47.919921875, -45.0703125, -42.220703125, -39.37109375, -36.521484375, -33.671875, -30.822265625, -27.97265625, -25.123046875, -22.2734375, -19.423828125, -16.57421875, -13.724609375, -10.875, -8.025390625, -5.17578125, -2.326171875, 0.5234375, 3.373046875, 6.22265625, 9.072265625, 11.921875, 14.771484375, 17.62109375, 20.470703125, 23.3203125, 26.169921875, 29.01953125, 31.869140625, 34.71875, 37.568359375, 40.41796875, 43.267578125, 46.1171875, 48.966796875, 51.81640625, 54.666015625, 57.515625, 60.365234375, 63.21484375, 66.064453125, 68.9140625, 71.763671875, 74.61328125, 77.462890625, 80.3125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 35.0, 244.0, 410.0, 251.0, 51.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-554.8233642578125, -541.4363403320312, -528.04931640625, -514.6622314453125, -501.27520751953125, -487.88818359375, -474.50115966796875, -461.1141052246094, -447.72705078125, -434.34002685546875, -420.9529724121094, -407.5659484863281, -394.17889404296875, -380.7918701171875, -367.40484619140625, -354.0177917480469, -340.6307678222656, -327.2437438964844, -313.856689453125, -300.46966552734375, -287.0826110839844, -273.6955871582031, -260.30853271484375, -246.9215087890625, -233.5344696044922, -220.14743041992188, -206.76039123535156, -193.37335205078125, -179.986328125, -166.59927368164062, -153.21224975585938, -139.82521057128906, -126.43820190429688, -113.05116271972656, -99.66412353515625, -86.27709197998047, -72.89005279541016, -59.503013610839844, -46.11598205566406, -32.72894287109375, -19.341903686523438, -5.954866409301758, 7.432170867919922, 20.81920623779297, 34.20624542236328, 47.593284606933594, 60.980316162109375, 74.36735534667969, 87.75439453125, 101.14143371582031, 114.52847290039062, 127.9155044555664, 141.30255126953125, 154.6895751953125, 168.0766143798828, 181.46365356445312, 194.85069274902344, 208.23773193359375, 221.62477111816406, 235.01181030273438, 248.39883422851562, 261.785888671875, 275.17291259765625, 288.5599365234375, 301.9469909667969]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 11.0, 12.0, 10.0, 14.0, 21.0, 17.0, 19.0, 24.0, 32.0, 32.0, 43.0, 37.0, 40.0, 44.0, 39.0, 42.0, 48.0, 46.0, 45.0, 45.0, 42.0, 42.0, 34.0, 28.0, 37.0, 22.0, 31.0, 31.0, 24.0, 16.0, 8.0, 6.0, 11.0, 9.0, 13.0, 3.0, 7.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-90.00277709960938, -87.25083923339844, -84.49890899658203, -81.7469711303711, -78.99504089355469, -76.24310302734375, -73.49116516113281, -70.73922729492188, -67.98729705810547, -65.23535919189453, -62.483428955078125, -59.73149108886719, -56.979557037353516, -54.227622985839844, -51.475685119628906, -48.723751068115234, -45.97181701660156, -43.21988296508789, -40.46794891357422, -37.71601104736328, -34.96407699584961, -32.21214294433594, -29.460206985473633, -26.708271026611328, -23.956336975097656, -21.204402923583984, -18.45246696472168, -15.700531959533691, -12.948596954345703, -10.196661949157715, -7.444726943969727, -4.692790985107422, -1.94085693359375, 0.8110780715942383, 3.5630130767822266, 6.314948081970215, 9.066883087158203, 11.818818092346191, 14.57075309753418, 17.322689056396484, 20.074623107910156, 22.826557159423828, 25.578493118286133, 28.330429077148438, 31.08236312866211, 33.83429718017578, 36.58623504638672, 39.33816909790039, 42.09010314941406, 44.842037200927734, 47.593971252441406, 50.345909118652344, 53.097843170166016, 55.84977722167969, 58.601715087890625, 61.3536491394043, 64.10558319091797, 66.8575210571289, 69.60945129394531, 72.36138916015625, 75.11332702636719, 77.8652572631836, 80.61719512939453, 83.36912536621094, 86.12106323242188]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 8.0, 7.0, 8.0, 7.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 22.0, 30.0, 36.0, 48.0, 54.0, 49.0, 53.0, 62.0, 42.0, 37.0, 44.0, 52.0, 46.0, 38.0, 30.0, 44.0, 29.0, 32.0, 22.0, 18.0, 14.0, 10.0, 7.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.737060546875, -11.28662109375, -10.836181640625, -10.3857421875, -9.935302734375, -9.48486328125, -9.034423828125, -8.583984375, -8.133544921875, -7.68310546875, -7.232666015625, -6.7822265625, -6.331787109375, -5.88134765625, -5.430908203125, -4.98046875, -4.530029296875, -4.07958984375, -3.629150390625, -3.1787109375, -2.728271484375, -2.27783203125, -1.827392578125, -1.376953125, -0.926513671875, -0.47607421875, -0.025634765625, 0.4248046875, 0.875244140625, 1.32568359375, 1.776123046875, 2.2265625, 2.677001953125, 3.12744140625, 3.577880859375, 4.0283203125, 4.478759765625, 4.92919921875, 5.379638671875, 5.830078125, 6.280517578125, 6.73095703125, 7.181396484375, 7.6318359375, 8.082275390625, 8.53271484375, 8.983154296875, 9.43359375, 9.884033203125, 10.33447265625, 10.784912109375, 11.2353515625, 11.685791015625, 12.13623046875, 12.586669921875, 13.037109375, 13.487548828125, 13.93798828125, 14.388427734375, 14.8388671875, 15.289306640625, 15.73974609375, 16.190185546875, 16.640625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 13.0, 7.0, 12.0, 23.0, 48.0, 54.0, 85.0, 112.0, 214.0, 322.0, 514.0, 764.0, 1300.0, 2190.0, 3781.0, 6592.0, 11624.0, 21431.0, 39385.0, 74952.0, 143035.0, 239643.0, 225743.0, 129665.0, 66680.0, 35449.0, 19510.0, 10676.0, 5913.0, 3527.0, 2059.0, 1212.0, 736.0, 479.0, 253.0, 203.0, 121.0, 74.0, 52.0, 34.0, 19.0, 16.0, 10.0, 10.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.658203125, -2.57745361328125, -2.4967041015625, -2.41595458984375, -2.335205078125, -2.25445556640625, -2.1737060546875, -2.09295654296875, -2.01220703125, -1.93145751953125, -1.8507080078125, -1.76995849609375, -1.689208984375, -1.60845947265625, -1.5277099609375, -1.44696044921875, -1.3662109375, -1.28546142578125, -1.2047119140625, -1.12396240234375, -1.043212890625, -0.96246337890625, -0.8817138671875, -0.80096435546875, -0.72021484375, -0.63946533203125, -0.5587158203125, -0.47796630859375, -0.397216796875, -0.31646728515625, -0.2357177734375, -0.15496826171875, -0.07421875, 0.00653076171875, 0.0872802734375, 0.16802978515625, 0.248779296875, 0.32952880859375, 0.4102783203125, 0.49102783203125, 0.57177734375, 0.65252685546875, 0.7332763671875, 0.81402587890625, 0.894775390625, 0.97552490234375, 1.0562744140625, 1.13702392578125, 1.2177734375, 1.29852294921875, 1.3792724609375, 1.46002197265625, 1.540771484375, 1.62152099609375, 1.7022705078125, 1.78302001953125, 1.86376953125, 1.94451904296875, 2.0252685546875, 2.10601806640625, 2.186767578125, 2.26751708984375, 2.3482666015625, 2.42901611328125, 2.509765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 4.0, 7.0, 5.0, 16.0, 15.0, 14.0, 11.0, 15.0, 22.0, 30.0, 34.0, 23.0, 31.0, 35.0, 26.0, 34.0, 42.0, 28.0, 42.0, 1070.0, 40.0, 42.0, 40.0, 35.0, 31.0, 42.0, 23.0, 28.0, 26.0, 25.0, 24.0, 20.0, 16.0, 22.0, 21.0, 16.0, 17.0, 13.0, 11.0, 11.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3990478515625, -7.141845703125, -6.8846435546875, -6.62744140625, -6.3702392578125, -6.113037109375, -5.8558349609375, -5.5986328125, -5.3414306640625, -5.084228515625, -4.8270263671875, -4.56982421875, -4.3126220703125, -4.055419921875, -3.7982177734375, -3.541015625, -3.2838134765625, -3.026611328125, -2.7694091796875, -2.51220703125, -2.2550048828125, -1.997802734375, -1.7406005859375, -1.4833984375, -1.2261962890625, -0.968994140625, -0.7117919921875, -0.45458984375, -0.1973876953125, 0.059814453125, 0.3170166015625, 0.57421875, 0.8314208984375, 1.088623046875, 1.3458251953125, 1.60302734375, 1.8602294921875, 2.117431640625, 2.3746337890625, 2.6318359375, 2.8890380859375, 3.146240234375, 3.4034423828125, 3.66064453125, 3.9178466796875, 4.175048828125, 4.4322509765625, 4.689453125, 4.9466552734375, 5.203857421875, 5.4610595703125, 5.71826171875, 5.9754638671875, 6.232666015625, 6.4898681640625, 6.7470703125, 7.0042724609375, 7.261474609375, 7.5186767578125, 7.77587890625, 8.0330810546875, 8.290283203125, 8.5474853515625, 8.8046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 12.0, 30.0, 46.0, 50.0, 76.0, 111.0, 130.0, 221.0, 314.0, 487.0, 702.0, 1028.0, 1432.0, 2110.0, 3094.0, 4664.0, 7057.0, 10803.0, 16575.0, 25582.0, 40351.0, 65532.0, 105350.0, 159400.0, 1238153.0, 149836.0, 97796.0, 60218.0, 37288.0, 23492.0, 14917.0, 9987.0, 6714.0, 4382.0, 2887.0, 1983.0, 1306.0, 890.0, 669.0, 454.0, 289.0, 231.0, 145.0, 96.0, 75.0, 41.0, 33.0, 20.0, 15.0, 17.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.1005859375, -1.0666351318359375, -1.032684326171875, -0.9987335205078125, -0.96478271484375, -0.9308319091796875, -0.896881103515625, -0.8629302978515625, -0.8289794921875, -0.7950286865234375, -0.761077880859375, -0.7271270751953125, -0.69317626953125, -0.6592254638671875, -0.625274658203125, -0.5913238525390625, -0.557373046875, -0.5234222412109375, -0.489471435546875, -0.4555206298828125, -0.42156982421875, -0.3876190185546875, -0.353668212890625, -0.3197174072265625, -0.2857666015625, -0.2518157958984375, -0.217864990234375, -0.1839141845703125, -0.14996337890625, -0.1160125732421875, -0.082061767578125, -0.0481109619140625, -0.01416015625, 0.0197906494140625, 0.053741455078125, 0.0876922607421875, 0.12164306640625, 0.1555938720703125, 0.189544677734375, 0.2234954833984375, 0.2574462890625, 0.2913970947265625, 0.325347900390625, 0.3592987060546875, 0.39324951171875, 0.4272003173828125, 0.461151123046875, 0.4951019287109375, 0.529052734375, 0.5630035400390625, 0.596954345703125, 0.6309051513671875, 0.66485595703125, 0.6988067626953125, 0.732757568359375, 0.7667083740234375, 0.8006591796875, 0.8346099853515625, 0.868560791015625, 0.9025115966796875, 0.93646240234375, 0.9704132080078125, 1.004364013671875, 1.0383148193359375, 1.072265625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 13.0, 6.0, 8.0, 12.0, 14.0, 9.0, 15.0, 24.0, 18.0, 31.0, 18.0, 35.0, 33.0, 29.0, 35.0, 34.0, 29.0, 43.0, 63.0, 46.0, 51.0, 38.0, 41.0, 40.0, 33.0, 31.0, 29.0, 32.0, 27.0, 24.0, 24.0, 13.0, 17.0, 16.0, 12.0, 11.0, 14.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0149078369140625, -0.014421701431274414, -0.013935565948486328, -0.013449430465698242, -0.012963294982910156, -0.01247715950012207, -0.011991024017333984, -0.011504888534545898, -0.011018753051757812, -0.010532617568969727, -0.01004648208618164, -0.009560346603393555, -0.009074211120605469, -0.008588075637817383, -0.008101940155029297, -0.007615804672241211, -0.007129669189453125, -0.006643533706665039, -0.006157398223876953, -0.005671262741088867, -0.005185127258300781, -0.004698991775512695, -0.004212856292724609, -0.0037267208099365234, -0.0032405853271484375, -0.0027544498443603516, -0.0022683143615722656, -0.0017821788787841797, -0.0012960433959960938, -0.0008099079132080078, -0.0003237724304199219, 0.00016236305236816406, 0.00064849853515625, 0.001134634017944336, 0.0016207695007324219, 0.002106904983520508, 0.0025930404663085938, 0.0030791759490966797, 0.0035653114318847656, 0.0040514469146728516, 0.0045375823974609375, 0.0050237178802490234, 0.005509853363037109, 0.005995988845825195, 0.006482124328613281, 0.006968259811401367, 0.007454395294189453, 0.007940530776977539, 0.008426666259765625, 0.008912801742553711, 0.009398937225341797, 0.009885072708129883, 0.010371208190917969, 0.010857343673706055, 0.01134347915649414, 0.011829614639282227, 0.012315750122070312, 0.012801885604858398, 0.013288021087646484, 0.01377415657043457, 0.014260292053222656, 0.014746427536010742, 0.015232563018798828, 0.015718698501586914, 0.016204833984375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 12.0, 10.0, 7.0, 15.0, 15.0, 26.0, 28.0, 25.0, 37.0, 51.0, 62.0, 104.0, 151.0, 282.0, 1096.0, 8388.0, 141246.0, 851897.0, 40426.0, 3346.0, 588.0, 215.0, 118.0, 78.0, 62.0, 57.0, 27.0, 26.0, 21.0, 30.0, 20.0, 14.0, 13.0, 7.0, 9.0, 3.0, 6.0, 7.0, 1.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.365478515625, -0.3545036315917969, -0.34352874755859375, -0.3325538635253906, -0.3215789794921875, -0.3106040954589844, -0.29962921142578125, -0.2886543273925781, -0.277679443359375, -0.2667045593261719, -0.25572967529296875, -0.24475479125976562, -0.2337799072265625, -0.22280502319335938, -0.21183013916015625, -0.20085525512695312, -0.18988037109375, -0.17890548706054688, -0.16793060302734375, -0.15695571899414062, -0.1459808349609375, -0.13500595092773438, -0.12403106689453125, -0.11305618286132812, -0.102081298828125, -0.09110641479492188, -0.08013153076171875, -0.06915664672851562, -0.0581817626953125, -0.047206878662109375, -0.03623199462890625, -0.025257110595703125, -0.0142822265625, -0.003307342529296875, 0.00766754150390625, 0.018642425537109375, 0.0296173095703125, 0.040592193603515625, 0.05156707763671875, 0.06254196166992188, 0.073516845703125, 0.08449172973632812, 0.09546661376953125, 0.10644149780273438, 0.1174163818359375, 0.12839126586914062, 0.13936614990234375, 0.15034103393554688, 0.16131591796875, 0.17229080200195312, 0.18326568603515625, 0.19424057006835938, 0.2052154541015625, 0.21619033813476562, 0.22716522216796875, 0.23814010620117188, 0.249114990234375, 0.2600898742675781, 0.27106475830078125, 0.2820396423339844, 0.2930145263671875, 0.3039894104003906, 0.31496429443359375, 0.3259391784667969, 0.3369140625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 25.0, 35.0, 65.0, 92.0, 167.0, 233.0, 127.0, 68.0, 41.0, 35.0, 22.0, 16.0, 7.0, 11.0, 5.0, 7.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11992428451776505, -0.1170882135629654, -0.11425214260816574, -0.11141607165336609, -0.10858000069856644, -0.10574392974376678, -0.10290785878896713, -0.10007178783416748, -0.09723571687936783, -0.09439964592456818, -0.09156357496976852, -0.08872750401496887, -0.08589143306016922, -0.08305536210536957, -0.08021929115056992, -0.07738322019577026, -0.07454714924097061, -0.07171107828617096, -0.06887500733137131, -0.06603893637657166, -0.063202865421772, -0.06036679446697235, -0.0575307235121727, -0.05469465255737305, -0.051858581602573395, -0.04902251064777374, -0.04618643969297409, -0.04335036873817444, -0.040514297783374786, -0.037678226828575134, -0.03484215587377548, -0.03200608491897583, -0.029170017689466476, -0.026333946734666824, -0.023497875779867172, -0.02066180482506752, -0.017825733870267868, -0.014989662915468216, -0.012153591960668564, -0.009317521005868912, -0.00648145005106926, -0.0036453790962696075, -0.0008093081414699554, 0.0020267628133296967, 0.004862833768129349, 0.007698904722929001, 0.010534975677728653, 0.013371046632528305, 0.016207117587327957, 0.01904318854212761, 0.02187925949692726, 0.024715330451726913, 0.027551401406526566, 0.030387472361326218, 0.03322354331612587, 0.03605961427092552, 0.038895685225725174, 0.041731756180524826, 0.04456782713532448, 0.04740389809012413, 0.05023996904492378, 0.053076039999723434, 0.05591211095452309, 0.05874818190932274, 0.06158425286412239]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 6.0, 1.0, 10.0, 5.0, 9.0, 10.0, 8.0, 21.0, 21.0, 17.0, 23.0, 24.0, 27.0, 33.0, 29.0, 30.0, 33.0, 47.0, 40.0, 26.0, 40.0, 37.0, 48.0, 46.0, 40.0, 28.0, 37.0, 32.0, 28.0, 26.0, 29.0, 31.0, 25.0, 23.0, 15.0, 11.0, 18.0, 13.0, 9.0, 12.0, 14.0, 10.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012537598609924316, -0.01213921420276165, -0.011740829795598984, -0.011342445388436317, -0.010944060981273651, -0.010545676574110985, -0.010147292166948318, -0.009748907759785652, -0.009350523352622986, -0.00895213894546032, -0.008553754538297653, -0.008155370131134987, -0.0077569857239723206, -0.007358601316809654, -0.006960216909646988, -0.006561832502484322, -0.006163448095321655, -0.005765063688158989, -0.005366679280996323, -0.004968294873833656, -0.00456991046667099, -0.004171526059508324, -0.0037731416523456573, -0.003374757245182991, -0.0029763728380203247, -0.0025779884308576584, -0.002179604023694992, -0.0017812196165323257, -0.0013828352093696594, -0.000984450802206993, -0.0005860663950443268, -0.00018768198788166046, 0.00021070241928100586, 0.0006090868264436722, 0.0010074712336063385, 0.0014058556407690048, 0.0018042400479316711, 0.0022026244550943375, 0.002601008862257004, 0.00299939326941967, 0.0033977776765823364, 0.0037961620837450027, 0.004194546490907669, 0.004592930898070335, 0.004991315305233002, 0.005389699712395668, 0.005788084119558334, 0.006186468526721001, 0.006584852933883667, 0.006983237341046333, 0.007381621748209, 0.007780006155371666, 0.008178390562534332, 0.008576774969696999, 0.008975159376859665, 0.009373543784022331, 0.009771928191184998, 0.010170312598347664, 0.01056869700551033, 0.010967081412672997, 0.011365465819835663, 0.01176385022699833, 0.012162234634160995, 0.012560619041323662, 0.012959003448486328]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 7.0, 7.0, 8.0, 7.0, 14.0, 18.0, 28.0, 19.0, 20.0, 28.0, 22.0, 30.0, 38.0, 48.0, 55.0, 47.0, 56.0, 60.0, 43.0, 34.0, 44.0, 53.0, 45.0, 38.0, 33.0, 42.0, 29.0, 31.0, 25.0, 15.0, 17.0, 9.0, 5.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.7291259765625, -11.278564453125, -10.8280029296875, -10.37744140625, -9.9268798828125, -9.476318359375, -9.0257568359375, -8.5751953125, -8.1246337890625, -7.674072265625, -7.2235107421875, -6.77294921875, -6.3223876953125, -5.871826171875, -5.4212646484375, -4.970703125, -4.5201416015625, -4.069580078125, -3.6190185546875, -3.16845703125, -2.7178955078125, -2.267333984375, -1.8167724609375, -1.3662109375, -0.9156494140625, -0.465087890625, -0.0145263671875, 0.43603515625, 0.8865966796875, 1.337158203125, 1.7877197265625, 2.23828125, 2.6888427734375, 3.139404296875, 3.5899658203125, 4.04052734375, 4.4910888671875, 4.941650390625, 5.3922119140625, 5.8427734375, 6.2933349609375, 6.743896484375, 7.1944580078125, 7.64501953125, 8.0955810546875, 8.546142578125, 8.9967041015625, 9.447265625, 9.8978271484375, 10.348388671875, 10.7989501953125, 11.24951171875, 11.7000732421875, 12.150634765625, 12.6011962890625, 13.0517578125, 13.5023193359375, 13.952880859375, 14.4034423828125, 14.85400390625, 15.3045654296875, 15.755126953125, 16.2056884765625, 16.65625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 13.0, 13.0, 30.0, 24.0, 36.0, 55.0, 78.0, 150.0, 224.0, 331.0, 560.0, 954.0, 1488.0, 2520.0, 4442.0, 7916.0, 14818.0, 29212.0, 74887.0, 561929.0, 248244.0, 50378.0, 22709.0, 11940.0, 6427.0, 3624.0, 2236.0, 1235.0, 752.0, 478.0, 307.0, 182.0, 107.0, 83.0, 42.0, 40.0, 36.0, 17.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.640625, -18.015625, -17.390625, -16.765625, -16.140625, -15.515625, -14.890625, -14.265625, -13.640625, -13.015625, -12.390625, -11.765625, -11.140625, -10.515625, -9.890625, -9.265625, -8.640625, -8.015625, -7.390625, -6.765625, -6.140625, -5.515625, -4.890625, -4.265625, -3.640625, -3.015625, -2.390625, -1.765625, -1.140625, -0.515625, 0.109375, 0.734375, 1.359375, 1.984375, 2.609375, 3.234375, 3.859375, 4.484375, 5.109375, 5.734375, 6.359375, 6.984375, 7.609375, 8.234375, 8.859375, 9.484375, 10.109375, 10.734375, 11.359375, 11.984375, 12.609375, 13.234375, 13.859375, 14.484375, 15.109375, 15.734375, 16.359375, 16.984375, 17.609375, 18.234375, 18.859375, 19.484375, 20.109375, 20.734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 13.0, 14.0, 13.0, 8.0, 18.0, 26.0, 33.0, 34.0, 43.0, 50.0, 49.0, 66.0, 97.0, 236.0, 1721.0, 173.0, 84.0, 71.0, 45.0, 48.0, 37.0, 45.0, 28.0, 17.0, 18.0, 18.0, 8.0, 12.0, 11.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-63.4375, -61.865234375, -60.29296875, -58.720703125, -57.1484375, -55.576171875, -54.00390625, -52.431640625, -50.859375, -49.287109375, -47.71484375, -46.142578125, -44.5703125, -42.998046875, -41.42578125, -39.853515625, -38.28125, -36.708984375, -35.13671875, -33.564453125, -31.9921875, -30.419921875, -28.84765625, -27.275390625, -25.703125, -24.130859375, -22.55859375, -20.986328125, -19.4140625, -17.841796875, -16.26953125, -14.697265625, -13.125, -11.552734375, -9.98046875, -8.408203125, -6.8359375, -5.263671875, -3.69140625, -2.119140625, -0.546875, 1.025390625, 2.59765625, 4.169921875, 5.7421875, 7.314453125, 8.88671875, 10.458984375, 12.03125, 13.603515625, 15.17578125, 16.748046875, 18.3203125, 19.892578125, 21.46484375, 23.037109375, 24.609375, 26.181640625, 27.75390625, 29.326171875, 30.8984375, 32.470703125, 34.04296875, 35.615234375, 37.1875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 14.0, 10.0, 15.0, 26.0, 27.0, 46.0, 41.0, 79.0, 115.0, 158.0, 237.0, 390.0, 1676.0, 29969.0, 3073157.0, 36653.0, 1915.0, 362.0, 246.0, 153.0, 105.0, 72.0, 48.0, 32.0, 34.0, 30.0, 12.0, 11.0, 12.0, 12.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-121.5, -117.7646484375, -114.029296875, -110.2939453125, -106.55859375, -102.8232421875, -99.087890625, -95.3525390625, -91.6171875, -87.8818359375, -84.146484375, -80.4111328125, -76.67578125, -72.9404296875, -69.205078125, -65.4697265625, -61.734375, -57.9990234375, -54.263671875, -50.5283203125, -46.79296875, -43.0576171875, -39.322265625, -35.5869140625, -31.8515625, -28.1162109375, -24.380859375, -20.6455078125, -16.91015625, -13.1748046875, -9.439453125, -5.7041015625, -1.96875, 1.7666015625, 5.501953125, 9.2373046875, 12.97265625, 16.7080078125, 20.443359375, 24.1787109375, 27.9140625, 31.6494140625, 35.384765625, 39.1201171875, 42.85546875, 46.5908203125, 50.326171875, 54.0615234375, 57.796875, 61.5322265625, 65.267578125, 69.0029296875, 72.73828125, 76.4736328125, 80.208984375, 83.9443359375, 87.6796875, 91.4150390625, 95.150390625, 98.8857421875, 102.62109375, 106.3564453125, 110.091796875, 113.8271484375, 117.5625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 42.0, 611.0, 341.0, 22.0, 2.0], "bins": [-773.5540771484375, -760.8399047851562, -748.125732421875, -735.4114990234375, -722.6973266601562, -709.983154296875, -697.2689819335938, -684.5547485351562, -671.840576171875, -659.1264038085938, -646.4122314453125, -633.697998046875, -620.9838256835938, -608.2696533203125, -595.5554809570312, -582.8412475585938, -570.1270751953125, -557.4129028320312, -544.69873046875, -531.9844970703125, -519.2703247070312, -506.55615234375, -493.8419494628906, -481.1277770996094, -468.4136047363281, -455.6994323730469, -442.9852294921875, -430.27105712890625, -417.5568542480469, -404.8426818847656, -392.12847900390625, -379.414306640625, -366.70013427734375, -353.9859619140625, -341.2717590332031, -328.5575866699219, -315.8433837890625, -303.12921142578125, -290.4150085449219, -277.7008361816406, -264.98663330078125, -252.27244567871094, -239.55825805664062, -226.8440704345703, -214.1298828125, -201.4156951904297, -188.70150756835938, -175.98733520507812, -163.27313232421875, -150.55894470214844, -137.84475708007812, -125.13056945800781, -112.4163818359375, -99.70219421386719, -86.9880142211914, -74.2738265991211, -61.55963897705078, -48.84545135498047, -36.131263732910156, -23.41707992553711, -10.702892303466797, 2.0112953186035156, 14.725479125976562, 27.439666748046875, 40.15385437011719]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 7.0, 11.0, 10.0, 13.0, 17.0, 14.0, 22.0, 17.0, 26.0, 25.0, 23.0, 29.0, 28.0, 42.0, 37.0, 35.0, 40.0, 36.0, 42.0, 34.0, 40.0, 29.0, 41.0, 29.0, 27.0, 26.0, 26.0, 35.0, 30.0, 26.0, 24.0, 16.0, 16.0, 15.0, 14.0, 20.0, 12.0, 7.0, 7.0, 5.0, 2.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-83.64948272705078, -80.78413391113281, -77.91877746582031, -75.05342102050781, -72.18807220458984, -69.32272338867188, -66.45736694335938, -63.59201431274414, -60.726661682128906, -57.86130905151367, -54.99595642089844, -52.1306037902832, -49.26525115966797, -46.399898529052734, -43.5345458984375, -40.669193267822266, -37.80384063720703, -34.9384880065918, -32.07313537597656, -29.207782745361328, -26.342430114746094, -23.47707748413086, -20.611724853515625, -17.74637222290039, -14.881019592285156, -12.015666961669922, -9.150314331054688, -6.284961700439453, -3.4196090698242188, -0.5542564392089844, 2.31109619140625, 5.176448822021484, 8.041801452636719, 10.907154083251953, 13.772506713867188, 16.637859344482422, 19.503211975097656, 22.36856460571289, 25.233917236328125, 28.09926986694336, 30.964622497558594, 33.82997512817383, 36.69532775878906, 39.5606803894043, 42.42603302001953, 45.291385650634766, 48.15673828125, 51.022090911865234, 53.88744354248047, 56.7527961730957, 59.61814880371094, 62.48350143432617, 65.3488540649414, 68.21420288085938, 71.07955932617188, 73.94491577148438, 76.81026458740234, 79.67561340332031, 82.54096984863281, 85.40632629394531, 88.27167510986328, 91.13702392578125, 94.00238037109375, 96.86773681640625, 99.73308563232422]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 7.0, 14.0, 15.0, 16.0, 24.0, 18.0, 15.0, 23.0, 29.0, 33.0, 32.0, 39.0, 53.0, 54.0, 56.0, 48.0, 43.0, 34.0, 46.0, 44.0, 45.0, 40.0, 47.0, 35.0, 31.0, 32.0, 25.0, 19.0, 22.0, 12.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.953857421875, -11.48583984375, -11.017822265625, -10.5498046875, -10.081787109375, -9.61376953125, -9.145751953125, -8.677734375, -8.209716796875, -7.74169921875, -7.273681640625, -6.8056640625, -6.337646484375, -5.86962890625, -5.401611328125, -4.93359375, -4.465576171875, -3.99755859375, -3.529541015625, -3.0615234375, -2.593505859375, -2.12548828125, -1.657470703125, -1.189453125, -0.721435546875, -0.25341796875, 0.214599609375, 0.6826171875, 1.150634765625, 1.61865234375, 2.086669921875, 2.5546875, 3.022705078125, 3.49072265625, 3.958740234375, 4.4267578125, 4.894775390625, 5.36279296875, 5.830810546875, 6.298828125, 6.766845703125, 7.23486328125, 7.702880859375, 8.1708984375, 8.638916015625, 9.10693359375, 9.574951171875, 10.04296875, 10.510986328125, 10.97900390625, 11.447021484375, 11.9150390625, 12.383056640625, 12.85107421875, 13.319091796875, 13.787109375, 14.255126953125, 14.72314453125, 15.191162109375, 15.6591796875, 16.127197265625, 16.59521484375, 17.063232421875, 17.53125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 13.0, 11.0, 15.0, 25.0, 37.0, 38.0, 43.0, 51.0, 74.0, 116.0, 146.0, 236.0, 365.0, 762.0, 1624.0, 4371.0, 14934.0, 114533.0, 2306112.0, 1659254.0, 72781.0, 11620.0, 3712.0, 1504.0, 712.0, 354.0, 230.0, 171.0, 91.0, 81.0, 64.0, 51.0, 40.0, 24.0, 23.0, 12.0, 11.0, 8.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96875, -31.7880859375, -30.607421875, -29.4267578125, -28.24609375, -27.0654296875, -25.884765625, -24.7041015625, -23.5234375, -22.3427734375, -21.162109375, -19.9814453125, -18.80078125, -17.6201171875, -16.439453125, -15.2587890625, -14.078125, -12.8974609375, -11.716796875, -10.5361328125, -9.35546875, -8.1748046875, -6.994140625, -5.8134765625, -4.6328125, -3.4521484375, -2.271484375, -1.0908203125, 0.08984375, 1.2705078125, 2.451171875, 3.6318359375, 4.8125, 5.9931640625, 7.173828125, 8.3544921875, 9.53515625, 10.7158203125, 11.896484375, 13.0771484375, 14.2578125, 15.4384765625, 16.619140625, 17.7998046875, 18.98046875, 20.1611328125, 21.341796875, 22.5224609375, 23.703125, 24.8837890625, 26.064453125, 27.2451171875, 28.42578125, 29.6064453125, 30.787109375, 31.9677734375, 33.1484375, 34.3291015625, 35.509765625, 36.6904296875, 37.87109375, 39.0517578125, 40.232421875, 41.4130859375, 42.59375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 21.0, 12.0, 23.0, 23.0, 38.0, 59.0, 83.0, 123.0, 206.0, 362.0, 574.0, 776.0, 699.0, 411.0, 245.0, 141.0, 79.0, 54.0, 41.0, 19.0, 19.0, 19.0, 4.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -37.112548828125, -36.10009765625, -35.087646484375, -34.0751953125, -33.062744140625, -32.05029296875, -31.037841796875, -30.025390625, -29.012939453125, -28.00048828125, -26.988037109375, -25.9755859375, -24.963134765625, -23.95068359375, -22.938232421875, -21.92578125, -20.913330078125, -19.90087890625, -18.888427734375, -17.8759765625, -16.863525390625, -15.85107421875, -14.838623046875, -13.826171875, -12.813720703125, -11.80126953125, -10.788818359375, -9.7763671875, -8.763916015625, -7.75146484375, -6.739013671875, -5.7265625, -4.714111328125, -3.70166015625, -2.689208984375, -1.6767578125, -0.664306640625, 0.34814453125, 1.360595703125, 2.373046875, 3.385498046875, 4.39794921875, 5.410400390625, 6.4228515625, 7.435302734375, 8.44775390625, 9.460205078125, 10.47265625, 11.485107421875, 12.49755859375, 13.510009765625, 14.5224609375, 15.534912109375, 16.54736328125, 17.559814453125, 18.572265625, 19.584716796875, 20.59716796875, 21.609619140625, 22.6220703125, 23.634521484375, 24.64697265625, 25.659423828125, 26.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 23.0, 24.0, 37.0, 60.0, 127.0, 207.0, 516.0, 2037.0, 29133.0, 3876939.0, 277267.0, 6101.0, 966.0, 310.0, 185.0, 104.0, 63.0, 41.0, 23.0, 22.0, 22.0, 17.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.0625, -89.5830078125, -86.103515625, -82.6240234375, -79.14453125, -75.6650390625, -72.185546875, -68.7060546875, -65.2265625, -61.7470703125, -58.267578125, -54.7880859375, -51.30859375, -47.8291015625, -44.349609375, -40.8701171875, -37.390625, -33.9111328125, -30.431640625, -26.9521484375, -23.47265625, -19.9931640625, -16.513671875, -13.0341796875, -9.5546875, -6.0751953125, -2.595703125, 0.8837890625, 4.36328125, 7.8427734375, 11.322265625, 14.8017578125, 18.28125, 21.7607421875, 25.240234375, 28.7197265625, 32.19921875, 35.6787109375, 39.158203125, 42.6376953125, 46.1171875, 49.5966796875, 53.076171875, 56.5556640625, 60.03515625, 63.5146484375, 66.994140625, 70.4736328125, 73.953125, 77.4326171875, 80.912109375, 84.3916015625, 87.87109375, 91.3505859375, 94.830078125, 98.3095703125, 101.7890625, 105.2685546875, 108.748046875, 112.2275390625, 115.70703125, 119.1865234375, 122.666015625, 126.1455078125, 129.625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 26.0, 26.0, 42.0, 51.0, 97.0, 131.0, 130.0, 134.0, 122.0, 90.0, 55.0, 27.0, 19.0, 11.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.36597442626953, -105.58758544921875, -101.80918884277344, -98.03079986572266, -94.25241088867188, -90.47401428222656, -86.69562530517578, -82.917236328125, -79.13883972167969, -75.3604507446289, -71.5820541381836, -67.80366516113281, -64.02527618408203, -60.246883392333984, -56.46849060058594, -52.690101623535156, -48.911712646484375, -45.13331985473633, -41.35493087768555, -37.5765380859375, -33.79814910888672, -30.019756317138672, -26.241363525390625, -22.46297264099121, -18.684581756591797, -14.906190872192383, -11.127799034118652, -7.349407196044922, -3.571016311645508, 0.20737457275390625, 3.985767364501953, 7.764158248901367, 11.54254150390625, 15.320932388305664, 19.099323272705078, 22.877716064453125, 26.65610694885254, 30.434497833251953, 34.212890625, 37.99127960205078, 41.76967239379883, 45.548065185546875, 49.326454162597656, 53.1048469543457, 56.88323974609375, 60.66162872314453, 64.44001770019531, 68.21841430664062, 71.9968032836914, 75.77519226074219, 79.5535888671875, 83.33197784423828, 87.11036682128906, 90.88876342773438, 94.66715240478516, 98.44554138183594, 102.22393798828125, 106.00232696533203, 109.78072357177734, 113.55911254882812, 117.3375015258789, 121.11589050292969, 124.894287109375, 128.6726837158203, 132.45106506347656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 3.0, 8.0, 8.0, 8.0, 7.0, 18.0, 11.0, 21.0, 13.0, 14.0, 17.0, 20.0, 32.0, 20.0, 29.0, 23.0, 34.0, 36.0, 30.0, 22.0, 26.0, 54.0, 33.0, 42.0, 32.0, 41.0, 34.0, 43.0, 35.0, 34.0, 31.0, 16.0, 20.0, 24.0, 12.0, 19.0, 15.0, 21.0, 13.0, 16.0, 6.0, 9.0, 9.0, 6.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-60.43287658691406, -58.43415069580078, -56.4354248046875, -54.43669891357422, -52.43797302246094, -50.439247131347656, -48.44052505493164, -46.44179916381836, -44.44307327270508, -42.4443473815918, -40.445621490478516, -38.446895599365234, -36.44817352294922, -34.44944763183594, -32.450721740722656, -30.451995849609375, -28.453269958496094, -26.454544067382812, -24.45581817626953, -22.457094192504883, -20.4583683013916, -18.45964241027832, -16.460918426513672, -14.46219253540039, -12.46346664428711, -10.464740753173828, -8.466015815734863, -6.46729040145874, -4.468564987182617, -2.469839096069336, -0.4711141586303711, 1.5276107788085938, 3.526336669921875, 5.525062084197998, 7.523787498474121, 9.522512435913086, 11.521238327026367, 13.519964218139648, 15.518689155578613, 17.517414093017578, 19.51613998413086, 21.51486587524414, 23.513591766357422, 25.51231575012207, 27.51104164123535, 29.509767532348633, 31.50849151611328, 33.50721740722656, 35.505943298339844, 37.504669189453125, 39.503395080566406, 41.50212097167969, 43.50084686279297, 45.49957275390625, 47.498294830322266, 49.49702072143555, 51.49574661254883, 53.49447250366211, 55.49319839477539, 57.49192428588867, 59.49064636230469, 61.48937225341797, 63.48809814453125, 65.48682403564453, 67.48554992675781]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 5.0, 17.0, 13.0, 21.0, 21.0, 24.0, 27.0, 20.0, 43.0, 48.0, 38.0, 39.0, 56.0, 53.0, 40.0, 45.0, 45.0, 38.0, 49.0, 40.0, 54.0, 33.0, 27.0, 18.0, 29.0, 30.0, 22.0, 14.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.25146484375, -10.8154296875, -10.37939453125, -9.943359375, -9.50732421875, -9.0712890625, -8.63525390625, -8.19921875, -7.76318359375, -7.3271484375, -6.89111328125, -6.455078125, -6.01904296875, -5.5830078125, -5.14697265625, -4.7109375, -4.27490234375, -3.8388671875, -3.40283203125, -2.966796875, -2.53076171875, -2.0947265625, -1.65869140625, -1.22265625, -0.78662109375, -0.3505859375, 0.08544921875, 0.521484375, 0.95751953125, 1.3935546875, 1.82958984375, 2.265625, 2.70166015625, 3.1376953125, 3.57373046875, 4.009765625, 4.44580078125, 4.8818359375, 5.31787109375, 5.75390625, 6.18994140625, 6.6259765625, 7.06201171875, 7.498046875, 7.93408203125, 8.3701171875, 8.80615234375, 9.2421875, 9.67822265625, 10.1142578125, 10.55029296875, 10.986328125, 11.42236328125, 11.8583984375, 12.29443359375, 12.73046875, 13.16650390625, 13.6025390625, 14.03857421875, 14.474609375, 14.91064453125, 15.3466796875, 15.78271484375, 16.21875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 10.0, 19.0, 26.0, 49.0, 75.0, 92.0, 132.0, 171.0, 299.0, 493.0, 640.0, 937.0, 1372.0, 2167.0, 3135.0, 4590.0, 7086.0, 10737.0, 17119.0, 26723.0, 43078.0, 70233.0, 112308.0, 166685.0, 188950.0, 143878.0, 92453.0, 57101.0, 35027.0, 22179.0, 13916.0, 8992.0, 5876.0, 3910.0, 2576.0, 1839.0, 1218.0, 796.0, 551.0, 346.0, 283.0, 166.0, 97.0, 77.0, 60.0, 24.0, 22.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0], "bins": [-1.9052734375, -1.8480377197265625, -1.790802001953125, -1.7335662841796875, -1.67633056640625, -1.6190948486328125, -1.561859130859375, -1.5046234130859375, -1.4473876953125, -1.3901519775390625, -1.332916259765625, -1.2756805419921875, -1.21844482421875, -1.1612091064453125, -1.103973388671875, -1.0467376708984375, -0.989501953125, -0.9322662353515625, -0.875030517578125, -0.8177947998046875, -0.76055908203125, -0.7033233642578125, -0.646087646484375, -0.5888519287109375, -0.5316162109375, -0.4743804931640625, -0.417144775390625, -0.3599090576171875, -0.30267333984375, -0.2454376220703125, -0.188201904296875, -0.1309661865234375, -0.07373046875, -0.0164947509765625, 0.040740966796875, 0.0979766845703125, 0.15521240234375, 0.2124481201171875, 0.269683837890625, 0.3269195556640625, 0.3841552734375, 0.4413909912109375, 0.498626708984375, 0.5558624267578125, 0.61309814453125, 0.6703338623046875, 0.727569580078125, 0.7848052978515625, 0.842041015625, 0.8992767333984375, 0.956512451171875, 1.0137481689453125, 1.07098388671875, 1.1282196044921875, 1.185455322265625, 1.2426910400390625, 1.2999267578125, 1.3571624755859375, 1.414398193359375, 1.4716339111328125, 1.52886962890625, 1.5861053466796875, 1.643341064453125, 1.7005767822265625, 1.7578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 11.0, 16.0, 26.0, 21.0, 20.0, 24.0, 39.0, 30.0, 29.0, 43.0, 32.0, 33.0, 46.0, 30.0, 1058.0, 45.0, 35.0, 37.0, 41.0, 34.0, 35.0, 33.0, 34.0, 29.0, 26.0, 16.0, 24.0, 21.0, 17.0, 14.0, 11.0, 7.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.0377197265625, -7.770751953125, -7.5037841796875, -7.23681640625, -6.9698486328125, -6.702880859375, -6.4359130859375, -6.1689453125, -5.9019775390625, -5.635009765625, -5.3680419921875, -5.10107421875, -4.8341064453125, -4.567138671875, -4.3001708984375, -4.033203125, -3.7662353515625, -3.499267578125, -3.2322998046875, -2.96533203125, -2.6983642578125, -2.431396484375, -2.1644287109375, -1.8974609375, -1.6304931640625, -1.363525390625, -1.0965576171875, -0.82958984375, -0.5626220703125, -0.295654296875, -0.0286865234375, 0.23828125, 0.5052490234375, 0.772216796875, 1.0391845703125, 1.30615234375, 1.5731201171875, 1.840087890625, 2.1070556640625, 2.3740234375, 2.6409912109375, 2.907958984375, 3.1749267578125, 3.44189453125, 3.7088623046875, 3.975830078125, 4.2427978515625, 4.509765625, 4.7767333984375, 5.043701171875, 5.3106689453125, 5.57763671875, 5.8446044921875, 6.111572265625, 6.3785400390625, 6.6455078125, 6.9124755859375, 7.179443359375, 7.4464111328125, 7.71337890625, 7.9803466796875, 8.247314453125, 8.5142822265625, 8.78125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 9.0, 14.0, 17.0, 38.0, 40.0, 81.0, 105.0, 131.0, 192.0, 294.0, 371.0, 596.0, 830.0, 1189.0, 1800.0, 2516.0, 3639.0, 5251.0, 7811.0, 11670.0, 17986.0, 27895.0, 43752.0, 69432.0, 108478.0, 161616.0, 1226939.0, 142930.0, 93822.0, 59648.0, 37764.0, 23713.0, 15315.0, 10052.0, 6588.0, 4555.0, 3104.0, 2083.0, 1488.0, 1017.0, 722.0, 502.0, 334.0, 232.0, 183.0, 108.0, 91.0, 58.0, 46.0, 32.0, 18.0, 12.0, 9.0, 9.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0514068603515625, -1.017852783203125, -0.9842987060546875, -0.95074462890625, -0.9171905517578125, -0.883636474609375, -0.8500823974609375, -0.8165283203125, -0.7829742431640625, -0.749420166015625, -0.7158660888671875, -0.68231201171875, -0.6487579345703125, -0.615203857421875, -0.5816497802734375, -0.548095703125, -0.5145416259765625, -0.480987548828125, -0.4474334716796875, -0.41387939453125, -0.3803253173828125, -0.346771240234375, -0.3132171630859375, -0.2796630859375, -0.2461090087890625, -0.212554931640625, -0.1790008544921875, -0.14544677734375, -0.1118927001953125, -0.078338623046875, -0.0447845458984375, -0.01123046875, 0.0223236083984375, 0.055877685546875, 0.0894317626953125, 0.12298583984375, 0.1565399169921875, 0.190093994140625, 0.2236480712890625, 0.2572021484375, 0.2907562255859375, 0.324310302734375, 0.3578643798828125, 0.39141845703125, 0.4249725341796875, 0.458526611328125, 0.4920806884765625, 0.525634765625, 0.5591888427734375, 0.592742919921875, 0.6262969970703125, 0.65985107421875, 0.6934051513671875, 0.726959228515625, 0.7605133056640625, 0.7940673828125, 0.8276214599609375, 0.861175537109375, 0.8947296142578125, 0.92828369140625, 0.9618377685546875, 0.995391845703125, 1.0289459228515625, 1.0625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 13.0, 9.0, 13.0, 8.0, 10.0, 17.0, 26.0, 34.0, 46.0, 84.0, 121.0, 201.0, 119.0, 68.0, 54.0, 36.0, 15.0, 15.0, 18.0, 16.0, 8.0, 5.0, 10.0, 4.0, 7.0, 0.0, 6.0, 3.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.038210391998291016, -0.03680896759033203, -0.03540754318237305, -0.03400611877441406, -0.03260469436645508, -0.031203269958496094, -0.02980184555053711, -0.028400421142578125, -0.02699899673461914, -0.025597572326660156, -0.024196147918701172, -0.022794723510742188, -0.021393299102783203, -0.01999187469482422, -0.018590450286865234, -0.01718902587890625, -0.015787601470947266, -0.014386177062988281, -0.012984752655029297, -0.011583328247070312, -0.010181903839111328, -0.008780479431152344, -0.007379055023193359, -0.005977630615234375, -0.004576206207275391, -0.0031747817993164062, -0.0017733573913574219, -0.0003719329833984375, 0.0010294914245605469, 0.0024309158325195312, 0.0038323402404785156, 0.0052337646484375, 0.006635189056396484, 0.008036613464355469, 0.009438037872314453, 0.010839462280273438, 0.012240886688232422, 0.013642311096191406, 0.01504373550415039, 0.016445159912109375, 0.01784658432006836, 0.019248008728027344, 0.020649433135986328, 0.022050857543945312, 0.023452281951904297, 0.02485370635986328, 0.026255130767822266, 0.02765655517578125, 0.029057979583740234, 0.03045940399169922, 0.0318608283996582, 0.03326225280761719, 0.03466367721557617, 0.036065101623535156, 0.03746652603149414, 0.038867950439453125, 0.04026937484741211, 0.041670799255371094, 0.04307222366333008, 0.04447364807128906, 0.04587507247924805, 0.04727649688720703, 0.048677921295166016, 0.050079345703125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 5.0, 8.0, 10.0, 11.0, 25.0, 22.0, 30.0, 34.0, 75.0, 135.0, 351.0, 3100.0, 1017358.0, 26285.0, 630.0, 176.0, 87.0, 53.0, 35.0, 18.0, 15.0, 15.0, 11.0, 14.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0745086669921875, -1.043548583984375, -1.0125885009765625, -0.98162841796875, -0.9506683349609375, -0.919708251953125, -0.8887481689453125, -0.8577880859375, -0.8268280029296875, -0.795867919921875, -0.7649078369140625, -0.73394775390625, -0.7029876708984375, -0.672027587890625, -0.6410675048828125, -0.610107421875, -0.5791473388671875, -0.548187255859375, -0.5172271728515625, -0.48626708984375, -0.4553070068359375, -0.424346923828125, -0.3933868408203125, -0.3624267578125, -0.3314666748046875, -0.300506591796875, -0.2695465087890625, -0.23858642578125, -0.2076263427734375, -0.176666259765625, -0.1457061767578125, -0.11474609375, -0.0837860107421875, -0.052825927734375, -0.0218658447265625, 0.00909423828125, 0.0400543212890625, 0.071014404296875, 0.1019744873046875, 0.1329345703125, 0.1638946533203125, 0.194854736328125, 0.2258148193359375, 0.25677490234375, 0.2877349853515625, 0.318695068359375, 0.3496551513671875, 0.380615234375, 0.4115753173828125, 0.442535400390625, 0.4734954833984375, 0.50445556640625, 0.5354156494140625, 0.566375732421875, 0.5973358154296875, 0.6282958984375, 0.6592559814453125, 0.690216064453125, 0.7211761474609375, 0.75213623046875, 0.7830963134765625, 0.814056396484375, 0.8450164794921875, 0.8759765625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 17.0, 49.0, 176.0, 395.0, 242.0, 77.0, 26.0, 16.0, 7.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.26095834374427795, -0.2561827600002289, -0.2514071464538574, -0.24663156270980835, -0.24185597896575928, -0.2370803952217102, -0.23230479657649994, -0.22752919793128967, -0.2227536141872406, -0.21797803044319153, -0.21320243179798126, -0.208426833152771, -0.20365124940872192, -0.19887566566467285, -0.19410006701946259, -0.18932446837425232, -0.18454888463020325, -0.17977330088615417, -0.1749977022409439, -0.17022210359573364, -0.16544651985168457, -0.1606709361076355, -0.15589533746242523, -0.15111973881721497, -0.1463441550731659, -0.14156857132911682, -0.13679297268390656, -0.1320173740386963, -0.12724179029464722, -0.12246619910001755, -0.11769060790538788, -0.11291501671075821, -0.10813944041728973, -0.10336384922266006, -0.0985882580280304, -0.09381266683340073, -0.08903707563877106, -0.08426148444414139, -0.07948589324951172, -0.07471030205488205, -0.06993471086025238, -0.06515911966562271, -0.06038352847099304, -0.05560793727636337, -0.050832346081733704, -0.046056754887104034, -0.041281163692474365, -0.036505572497844696, -0.03172997757792473, -0.02695438638329506, -0.02217879518866539, -0.01740320399403572, -0.012627612799406052, -0.007852021604776382, -0.0030764304101467133, 0.001699160784482956, 0.006474751979112625, 0.011250343173742294, 0.016025934368371964, 0.020801525563001633, 0.025577116757631302, 0.03035270795226097, 0.03512829914689064, 0.03990389034152031, 0.04467948153614998]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 9.0, 15.0, 20.0, 24.0, 18.0, 15.0, 22.0, 25.0, 36.0, 35.0, 34.0, 29.0, 42.0, 40.0, 36.0, 41.0, 37.0, 40.0, 33.0, 33.0, 41.0, 34.0, 35.0, 23.0, 25.0, 34.0, 32.0, 20.0, 26.0, 23.0, 15.0, 11.0, 6.0, 13.0, 12.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.027714073657989502, -0.026950374245643616, -0.02618667669594288, -0.02542297914624214, -0.024659279733896255, -0.02389558032155037, -0.023131882771849632, -0.022368185222148895, -0.02160448580980301, -0.020840786397457123, -0.020077088847756386, -0.01931339129805565, -0.018549691885709763, -0.017785992473363876, -0.01702229492366314, -0.016258597373962402, -0.015494897961616516, -0.014731199480593204, -0.013967500999569893, -0.013203802518546581, -0.01244010403752327, -0.011676405556499958, -0.010912707075476646, -0.010149008594453335, -0.009385310113430023, -0.008621611632406712, -0.0078579131513834, -0.007094214670360088, -0.006330516189336777, -0.005566817708313465, -0.0048031192272901535, -0.004039420746266842, -0.0032757222652435303, -0.0025120237842202187, -0.001748325303196907, -0.0009846268221735954, -0.0002209283411502838, 0.0005427701398730278, 0.0013064686208963394, 0.002070167101919651, 0.0028338655829429626, 0.0035975640639662743, 0.004361262544989586, 0.0051249610260128975, 0.005888659507036209, 0.006652357988059521, 0.007416056469082832, 0.008179754950106144, 0.008943453431129456, 0.009707151912152767, 0.010470850393176079, 0.01123454887419939, 0.011998247355222702, 0.012761945836246014, 0.013525644317269325, 0.014289342798292637, 0.015053041279315948, 0.015816740691661835, 0.01658043824136257, 0.01734413579106331, 0.018107835203409195, 0.01887153461575508, 0.019635232165455818, 0.020398929715156555, 0.02116262912750244]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 5.0, 17.0, 13.0, 21.0, 21.0, 24.0, 27.0, 20.0, 43.0, 48.0, 38.0, 39.0, 56.0, 53.0, 40.0, 45.0, 45.0, 38.0, 49.0, 40.0, 54.0, 33.0, 27.0, 18.0, 29.0, 30.0, 21.0, 15.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.25146484375, -10.8154296875, -10.37939453125, -9.943359375, -9.50732421875, -9.0712890625, -8.63525390625, -8.19921875, -7.76318359375, -7.3271484375, -6.89111328125, -6.455078125, -6.01904296875, -5.5830078125, -5.14697265625, -4.7109375, -4.27490234375, -3.8388671875, -3.40283203125, -2.966796875, -2.53076171875, -2.0947265625, -1.65869140625, -1.22265625, -0.78662109375, -0.3505859375, 0.08544921875, 0.521484375, 0.95751953125, 1.3935546875, 1.82958984375, 2.265625, 2.70166015625, 3.1376953125, 3.57373046875, 4.009765625, 4.44580078125, 4.8818359375, 5.31787109375, 5.75390625, 6.18994140625, 6.6259765625, 7.06201171875, 7.498046875, 7.93408203125, 8.3701171875, 8.80615234375, 9.2421875, 9.67822265625, 10.1142578125, 10.55029296875, 10.986328125, 11.42236328125, 11.8583984375, 12.29443359375, 12.73046875, 13.16650390625, 13.6025390625, 14.03857421875, 14.474609375, 14.91064453125, 15.3466796875, 15.78271484375, 16.21875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 10.0, 19.0, 19.0, 19.0, 41.0, 48.0, 68.0, 108.0, 117.0, 200.0, 267.0, 411.0, 676.0, 1007.0, 1657.0, 2588.0, 4539.0, 8701.0, 22300.0, 117306.0, 720497.0, 124412.0, 22640.0, 8902.0, 4614.0, 2645.0, 1577.0, 1073.0, 692.0, 423.0, 303.0, 194.0, 137.0, 94.0, 67.0, 47.0, 35.0, 28.0, 16.0, 11.0, 7.0, 9.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.296875, -16.72998046875, -16.1630859375, -15.59619140625, -15.029296875, -14.46240234375, -13.8955078125, -13.32861328125, -12.76171875, -12.19482421875, -11.6279296875, -11.06103515625, -10.494140625, -9.92724609375, -9.3603515625, -8.79345703125, -8.2265625, -7.65966796875, -7.0927734375, -6.52587890625, -5.958984375, -5.39208984375, -4.8251953125, -4.25830078125, -3.69140625, -3.12451171875, -2.5576171875, -1.99072265625, -1.423828125, -0.85693359375, -0.2900390625, 0.27685546875, 0.84375, 1.41064453125, 1.9775390625, 2.54443359375, 3.111328125, 3.67822265625, 4.2451171875, 4.81201171875, 5.37890625, 5.94580078125, 6.5126953125, 7.07958984375, 7.646484375, 8.21337890625, 8.7802734375, 9.34716796875, 9.9140625, 10.48095703125, 11.0478515625, 11.61474609375, 12.181640625, 12.74853515625, 13.3154296875, 13.88232421875, 14.44921875, 15.01611328125, 15.5830078125, 16.14990234375, 16.716796875, 17.28369140625, 17.8505859375, 18.41748046875, 18.984375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 10.0, 12.0, 16.0, 15.0, 18.0, 25.0, 25.0, 27.0, 46.0, 31.0, 43.0, 40.0, 59.0, 64.0, 91.0, 343.0, 1622.0, 95.0, 58.0, 43.0, 36.0, 33.0, 38.0, 41.0, 36.0, 27.0, 22.0, 15.0, 17.0, 24.0, 9.0, 11.0, 10.0, 12.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.03125, -37.736328125, -36.44140625, -35.146484375, -33.8515625, -32.556640625, -31.26171875, -29.966796875, -28.671875, -27.376953125, -26.08203125, -24.787109375, -23.4921875, -22.197265625, -20.90234375, -19.607421875, -18.3125, -17.017578125, -15.72265625, -14.427734375, -13.1328125, -11.837890625, -10.54296875, -9.248046875, -7.953125, -6.658203125, -5.36328125, -4.068359375, -2.7734375, -1.478515625, -0.18359375, 1.111328125, 2.40625, 3.701171875, 4.99609375, 6.291015625, 7.5859375, 8.880859375, 10.17578125, 11.470703125, 12.765625, 14.060546875, 15.35546875, 16.650390625, 17.9453125, 19.240234375, 20.53515625, 21.830078125, 23.125, 24.419921875, 25.71484375, 27.009765625, 28.3046875, 29.599609375, 30.89453125, 32.189453125, 33.484375, 34.779296875, 36.07421875, 37.369140625, 38.6640625, 39.958984375, 41.25390625, 42.548828125, 43.84375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 10.0, 18.0, 18.0, 23.0, 27.0, 22.0, 44.0, 62.0, 74.0, 116.0, 115.0, 175.0, 330.0, 692.0, 4004.0, 71816.0, 3047326.0, 17492.0, 1845.0, 515.0, 238.0, 160.0, 144.0, 95.0, 62.0, 50.0, 33.0, 29.0, 29.0, 23.0, 17.0, 14.0, 20.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-91.8125, -89.0556640625, -86.298828125, -83.5419921875, -80.78515625, -78.0283203125, -75.271484375, -72.5146484375, -69.7578125, -67.0009765625, -64.244140625, -61.4873046875, -58.73046875, -55.9736328125, -53.216796875, -50.4599609375, -47.703125, -44.9462890625, -42.189453125, -39.4326171875, -36.67578125, -33.9189453125, -31.162109375, -28.4052734375, -25.6484375, -22.8916015625, -20.134765625, -17.3779296875, -14.62109375, -11.8642578125, -9.107421875, -6.3505859375, -3.59375, -0.8369140625, 1.919921875, 4.6767578125, 7.43359375, 10.1904296875, 12.947265625, 15.7041015625, 18.4609375, 21.2177734375, 23.974609375, 26.7314453125, 29.48828125, 32.2451171875, 35.001953125, 37.7587890625, 40.515625, 43.2724609375, 46.029296875, 48.7861328125, 51.54296875, 54.2998046875, 57.056640625, 59.8134765625, 62.5703125, 65.3271484375, 68.083984375, 70.8408203125, 73.59765625, 76.3544921875, 79.111328125, 81.8681640625, 84.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 67.0, 253.0, 414.0, 203.0, 57.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.71463012695312, -210.3649139404297, -206.0152130126953, -201.66549682617188, -197.3157958984375, -192.96607971191406, -188.61636352539062, -184.26666259765625, -179.9169464111328, -175.56723022460938, -171.217529296875, -166.86781311035156, -162.5181121826172, -158.16839599609375, -153.81869506835938, -149.46897888183594, -145.1192626953125, -140.76954650878906, -136.4198455810547, -132.07012939453125, -127.72042083740234, -123.37071228027344, -119.02100372314453, -114.67129516601562, -110.32159423828125, -105.97188568115234, -101.62217712402344, -97.2724609375, -92.9227523803711, -88.57304382324219, -84.22333526611328, -79.87362670898438, -75.52389526367188, -71.17418670654297, -66.82447814941406, -62.47476577758789, -58.12505340576172, -53.77534484863281, -49.425636291503906, -45.075927734375, -40.726219177246094, -36.37651062011719, -32.026798248291016, -27.67708969116211, -23.32737922668457, -18.97766876220703, -14.627960205078125, -10.278249740600586, -5.928539276123047, -1.578829288482666, 2.770880699157715, 7.1205902099609375, 11.470300674438477, 15.820011138916016, 20.169719696044922, 24.51943016052246, 28.869140625, 33.218849182128906, 37.56856155395508, 41.918270111083984, 46.267982482910156, 50.61769104003906, 54.96739959716797, 59.317108154296875, 63.66682052612305]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 11.0, 12.0, 15.0, 13.0, 17.0, 11.0, 19.0, 22.0, 26.0, 26.0, 30.0, 33.0, 34.0, 37.0, 34.0, 29.0, 40.0, 39.0, 44.0, 39.0, 49.0, 39.0, 48.0, 33.0, 27.0, 29.0, 36.0, 32.0, 31.0, 22.0, 14.0, 20.0, 11.0, 9.0, 8.0, 15.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-94.56412506103516, -91.71785736083984, -88.87159729003906, -86.02532958984375, -83.17906951904297, -80.33280181884766, -77.48654174804688, -74.64027404785156, -71.79401397705078, -68.94774627685547, -66.10148620605469, -63.25522232055664, -60.408958435058594, -57.56269454956055, -54.7164306640625, -51.87016296386719, -49.02389907836914, -46.177635192871094, -43.33137130737305, -40.485107421875, -37.63884353637695, -34.792579650878906, -31.946313858032227, -29.10004997253418, -26.253786087036133, -23.407522201538086, -20.56125831604004, -17.71499252319336, -14.868729591369629, -12.022465705871582, -9.176200866699219, -6.329936981201172, -3.483673095703125, -0.637408971786499, 2.208855152130127, 5.055119514465332, 7.901383399963379, 10.747647285461426, 13.593912124633789, 16.440176010131836, 19.286439895629883, 22.13270378112793, 24.978967666625977, 27.825233459472656, 30.671497344970703, 33.51776123046875, 36.3640251159668, 39.210289001464844, 42.05655288696289, 44.90281677246094, 47.749080657958984, 50.59534454345703, 53.44160842895508, 56.287872314453125, 59.13414001464844, 61.98040008544922, 64.82666778564453, 67.67293548583984, 70.51919555664062, 73.36546325683594, 76.21172332763672, 79.05799102783203, 81.90425109863281, 84.75051879882812, 87.5967788696289]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 12.0, 6.0, 20.0, 11.0, 13.0, 17.0, 10.0, 24.0, 30.0, 30.0, 36.0, 30.0, 49.0, 48.0, 52.0, 44.0, 54.0, 36.0, 39.0, 47.0, 36.0, 38.0, 40.0, 44.0, 46.0, 20.0, 25.0, 23.0, 23.0, 16.0, 15.0, 11.0, 13.0, 2.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6112060546875, -11.167724609375, -10.7242431640625, -10.28076171875, -9.8372802734375, -9.393798828125, -8.9503173828125, -8.5068359375, -8.0633544921875, -7.619873046875, -7.1763916015625, -6.73291015625, -6.2894287109375, -5.845947265625, -5.4024658203125, -4.958984375, -4.5155029296875, -4.072021484375, -3.6285400390625, -3.18505859375, -2.7415771484375, -2.298095703125, -1.8546142578125, -1.4111328125, -0.9676513671875, -0.524169921875, -0.0806884765625, 0.36279296875, 0.8062744140625, 1.249755859375, 1.6932373046875, 2.13671875, 2.5802001953125, 3.023681640625, 3.4671630859375, 3.91064453125, 4.3541259765625, 4.797607421875, 5.2410888671875, 5.6845703125, 6.1280517578125, 6.571533203125, 7.0150146484375, 7.45849609375, 7.9019775390625, 8.345458984375, 8.7889404296875, 9.232421875, 9.6759033203125, 10.119384765625, 10.5628662109375, 11.00634765625, 11.4498291015625, 11.893310546875, 12.3367919921875, 12.7802734375, 13.2237548828125, 13.667236328125, 14.1107177734375, 14.55419921875, 14.9976806640625, 15.441162109375, 15.8846435546875, 16.328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 16.0, 16.0, 15.0, 26.0, 24.0, 29.0, 24.0, 36.0, 48.0, 53.0, 97.0, 160.0, 286.0, 655.0, 1527.0, 4379.0, 14364.0, 85653.0, 1590128.0, 2326199.0, 144290.0, 17590.0, 4933.0, 1881.0, 803.0, 362.0, 214.0, 114.0, 93.0, 54.0, 39.0, 40.0, 26.0, 19.0, 24.0, 13.0, 11.0, 10.0, 11.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.734375, -29.640380859375, -28.54638671875, -27.452392578125, -26.3583984375, -25.264404296875, -24.17041015625, -23.076416015625, -21.982421875, -20.888427734375, -19.79443359375, -18.700439453125, -17.6064453125, -16.512451171875, -15.41845703125, -14.324462890625, -13.23046875, -12.136474609375, -11.04248046875, -9.948486328125, -8.8544921875, -7.760498046875, -6.66650390625, -5.572509765625, -4.478515625, -3.384521484375, -2.29052734375, -1.196533203125, -0.1025390625, 0.991455078125, 2.08544921875, 3.179443359375, 4.2734375, 5.367431640625, 6.46142578125, 7.555419921875, 8.6494140625, 9.743408203125, 10.83740234375, 11.931396484375, 13.025390625, 14.119384765625, 15.21337890625, 16.307373046875, 17.4013671875, 18.495361328125, 19.58935546875, 20.683349609375, 21.77734375, 22.871337890625, 23.96533203125, 25.059326171875, 26.1533203125, 27.247314453125, 28.34130859375, 29.435302734375, 30.529296875, 31.623291015625, 32.71728515625, 33.811279296875, 34.9052734375, 35.999267578125, 37.09326171875, 38.187255859375, 39.28125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 3.0, 9.0, 17.0, 13.0, 26.0, 39.0, 46.0, 59.0, 74.0, 130.0, 188.0, 336.0, 539.0, 689.0, 650.0, 483.0, 247.0, 172.0, 90.0, 74.0, 42.0, 34.0, 22.0, 18.0, 15.0, 15.0, 7.0, 10.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.0, -35.071533203125, -34.14306640625, -33.214599609375, -32.2861328125, -31.357666015625, -30.42919921875, -29.500732421875, -28.572265625, -27.643798828125, -26.71533203125, -25.786865234375, -24.8583984375, -23.929931640625, -23.00146484375, -22.072998046875, -21.14453125, -20.216064453125, -19.28759765625, -18.359130859375, -17.4306640625, -16.502197265625, -15.57373046875, -14.645263671875, -13.716796875, -12.788330078125, -11.85986328125, -10.931396484375, -10.0029296875, -9.074462890625, -8.14599609375, -7.217529296875, -6.2890625, -5.360595703125, -4.43212890625, -3.503662109375, -2.5751953125, -1.646728515625, -0.71826171875, 0.210205078125, 1.138671875, 2.067138671875, 2.99560546875, 3.924072265625, 4.8525390625, 5.781005859375, 6.70947265625, 7.637939453125, 8.56640625, 9.494873046875, 10.42333984375, 11.351806640625, 12.2802734375, 13.208740234375, 14.13720703125, 15.065673828125, 15.994140625, 16.922607421875, 17.85107421875, 18.779541015625, 19.7080078125, 20.636474609375, 21.56494140625, 22.493408203125, 23.421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 7.0, 6.0, 13.0, 11.0, 11.0, 14.0, 26.0, 25.0, 40.0, 51.0, 86.0, 152.0, 282.0, 667.0, 7524.0, 2757185.0, 1420938.0, 5918.0, 623.0, 254.0, 142.0, 77.0, 69.0, 45.0, 33.0, 28.0, 12.0, 17.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5, -106.244140625, -101.98828125, -97.732421875, -93.4765625, -89.220703125, -84.96484375, -80.708984375, -76.453125, -72.197265625, -67.94140625, -63.685546875, -59.4296875, -55.173828125, -50.91796875, -46.662109375, -42.40625, -38.150390625, -33.89453125, -29.638671875, -25.3828125, -21.126953125, -16.87109375, -12.615234375, -8.359375, -4.103515625, 0.15234375, 4.408203125, 8.6640625, 12.919921875, 17.17578125, 21.431640625, 25.6875, 29.943359375, 34.19921875, 38.455078125, 42.7109375, 46.966796875, 51.22265625, 55.478515625, 59.734375, 63.990234375, 68.24609375, 72.501953125, 76.7578125, 81.013671875, 85.26953125, 89.525390625, 93.78125, 98.037109375, 102.29296875, 106.548828125, 110.8046875, 115.060546875, 119.31640625, 123.572265625, 127.828125, 132.083984375, 136.33984375, 140.595703125, 144.8515625, 149.107421875, 153.36328125, 157.619140625, 161.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 9.0, 35.0, 55.0, 119.0, 150.0, 181.0, 188.0, 122.0, 63.0, 37.0, 18.0, 15.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.97232055664062, -248.7565155029297, -243.54071044921875, -238.32489013671875, -233.1090850830078, -227.89328002929688, -222.67747497558594, -217.461669921875, -212.24586486816406, -207.03005981445312, -201.8142547607422, -196.59844970703125, -191.38262939453125, -186.1668243408203, -180.95101928710938, -175.73521423339844, -170.5194091796875, -165.30360412597656, -160.08779907226562, -154.87197875976562, -149.6561737060547, -144.44036865234375, -139.2245635986328, -134.00875854492188, -128.79293823242188, -123.57713317871094, -118.36132049560547, -113.14551544189453, -107.9297103881836, -102.71389770507812, -97.49809265136719, -92.28228759765625, -87.06649017333984, -81.8506851196289, -76.63487243652344, -71.4190673828125, -66.20326232910156, -60.98745346069336, -55.771644592285156, -50.55583953857422, -45.340030670166016, -40.12422180175781, -34.908416748046875, -29.692607879638672, -24.4768009185791, -19.26099395751953, -14.045185089111328, -8.82938003540039, -3.6135711669921875, 1.602236270904541, 6.8180437088012695, 12.033851623535156, 17.249658584594727, 22.465465545654297, 27.6812744140625, 32.89707946777344, 38.11288833618164, 43.328697204589844, 48.54450225830078, 53.760311126708984, 58.97611999511719, 64.19192504882812, 69.40773010253906, 74.62353515625, 79.83934783935547]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 8.0, 5.0, 13.0, 8.0, 22.0, 16.0, 24.0, 24.0, 17.0, 29.0, 26.0, 39.0, 27.0, 33.0, 39.0, 43.0, 35.0, 39.0, 48.0, 42.0, 52.0, 38.0, 47.0, 27.0, 44.0, 31.0, 35.0, 32.0, 29.0, 22.0, 17.0, 14.0, 17.0, 12.0, 8.0, 5.0, 9.0, 1.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-84.88372802734375, -82.41515350341797, -79.94657897949219, -77.4780044555664, -75.00942993164062, -72.54084777832031, -70.07227325439453, -67.60369873046875, -65.13512420654297, -62.66654968261719, -60.197975158691406, -57.72939682006836, -55.26082229614258, -52.7922477722168, -50.32366943359375, -47.85509490966797, -45.38652038574219, -42.917945861816406, -40.449371337890625, -37.98079299926758, -35.5122184753418, -33.043643951416016, -30.5750675201416, -28.106491088867188, -25.637916564941406, -23.169342041015625, -20.70076560974121, -18.232189178466797, -15.763614654541016, -13.295039176940918, -10.82646369934082, -8.357887268066406, -5.889320373535156, -3.4207448959350586, -0.9521694183349609, 1.5164060592651367, 3.9849815368652344, 6.453557014465332, 8.92213249206543, 11.390708923339844, 13.859283447265625, 16.327857971191406, 18.79643440246582, 21.265010833740234, 23.733585357666016, 26.202159881591797, 28.67073631286621, 31.139312744140625, 33.607887268066406, 36.07646179199219, 38.54503631591797, 41.013614654541016, 43.4821891784668, 45.95076370239258, 48.419342041015625, 50.887916564941406, 53.35649108886719, 55.82506561279297, 58.29364013671875, 60.7622184753418, 63.23079299926758, 65.69937133789062, 68.1679458618164, 70.63652038574219, 73.10509490966797]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 10.0, 24.0, 19.0, 23.0, 22.0, 25.0, 28.0, 31.0, 44.0, 51.0, 41.0, 47.0, 57.0, 46.0, 48.0, 69.0, 45.0, 29.0, 34.0, 35.0, 35.0, 38.0, 22.0, 28.0, 25.0, 15.0, 17.0, 13.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.142822265625, -13.68408203125, -13.225341796875, -12.7666015625, -12.307861328125, -11.84912109375, -11.390380859375, -10.931640625, -10.472900390625, -10.01416015625, -9.555419921875, -9.0966796875, -8.637939453125, -8.17919921875, -7.720458984375, -7.26171875, -6.802978515625, -6.34423828125, -5.885498046875, -5.4267578125, -4.968017578125, -4.50927734375, -4.050537109375, -3.591796875, -3.133056640625, -2.67431640625, -2.215576171875, -1.7568359375, -1.298095703125, -0.83935546875, -0.380615234375, 0.078125, 0.536865234375, 0.99560546875, 1.454345703125, 1.9130859375, 2.371826171875, 2.83056640625, 3.289306640625, 3.748046875, 4.206787109375, 4.66552734375, 5.124267578125, 5.5830078125, 6.041748046875, 6.50048828125, 6.959228515625, 7.41796875, 7.876708984375, 8.33544921875, 8.794189453125, 9.2529296875, 9.711669921875, 10.17041015625, 10.629150390625, 11.087890625, 11.546630859375, 12.00537109375, 12.464111328125, 12.9228515625, 13.381591796875, 13.84033203125, 14.299072265625, 14.7578125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 19.0, 24.0, 44.0, 70.0, 98.0, 123.0, 216.0, 332.0, 473.0, 672.0, 1074.0, 1455.0, 2224.0, 3465.0, 5223.0, 7811.0, 12215.0, 19323.0, 30590.0, 51114.0, 84252.0, 135904.0, 192265.0, 181601.0, 121685.0, 74015.0, 45063.0, 27471.0, 17391.0, 11053.0, 7232.0, 4698.0, 3177.0, 2042.0, 1325.0, 945.0, 585.0, 398.0, 292.0, 192.0, 125.0, 88.0, 61.0, 24.0, 32.0, 19.0, 10.0, 10.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.9482421875, -1.8871307373046875, -1.826019287109375, -1.7649078369140625, -1.70379638671875, -1.6426849365234375, -1.581573486328125, -1.5204620361328125, -1.4593505859375, -1.3982391357421875, -1.337127685546875, -1.2760162353515625, -1.21490478515625, -1.1537933349609375, -1.092681884765625, -1.0315704345703125, -0.970458984375, -0.9093475341796875, -0.848236083984375, -0.7871246337890625, -0.72601318359375, -0.6649017333984375, -0.603790283203125, -0.5426788330078125, -0.4815673828125, -0.4204559326171875, -0.359344482421875, -0.2982330322265625, -0.23712158203125, -0.1760101318359375, -0.114898681640625, -0.0537872314453125, 0.00732421875, 0.0684356689453125, 0.129547119140625, 0.1906585693359375, 0.25177001953125, 0.3128814697265625, 0.373992919921875, 0.4351043701171875, 0.4962158203125, 0.5573272705078125, 0.618438720703125, 0.6795501708984375, 0.74066162109375, 0.8017730712890625, 0.862884521484375, 0.9239959716796875, 0.985107421875, 1.0462188720703125, 1.107330322265625, 1.1684417724609375, 1.22955322265625, 1.2906646728515625, 1.351776123046875, 1.4128875732421875, 1.4739990234375, 1.5351104736328125, 1.596221923828125, 1.6573333740234375, 1.71844482421875, 1.7795562744140625, 1.840667724609375, 1.9017791748046875, 1.962890625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 0.0, 8.0, 11.0, 9.0, 7.0, 13.0, 17.0, 17.0, 18.0, 22.0, 19.0, 26.0, 35.0, 37.0, 35.0, 40.0, 44.0, 45.0, 38.0, 44.0, 36.0, 1071.0, 38.0, 35.0, 36.0, 39.0, 48.0, 29.0, 35.0, 28.0, 18.0, 25.0, 19.0, 14.0, 10.0, 10.0, 12.0, 7.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2945556640625, -8.995361328125, -8.6961669921875, -8.39697265625, -8.0977783203125, -7.798583984375, -7.4993896484375, -7.2001953125, -6.9010009765625, -6.601806640625, -6.3026123046875, -6.00341796875, -5.7042236328125, -5.405029296875, -5.1058349609375, -4.806640625, -4.5074462890625, -4.208251953125, -3.9090576171875, -3.60986328125, -3.3106689453125, -3.011474609375, -2.7122802734375, -2.4130859375, -2.1138916015625, -1.814697265625, -1.5155029296875, -1.21630859375, -0.9171142578125, -0.617919921875, -0.3187255859375, -0.01953125, 0.2796630859375, 0.578857421875, 0.8780517578125, 1.17724609375, 1.4764404296875, 1.775634765625, 2.0748291015625, 2.3740234375, 2.6732177734375, 2.972412109375, 3.2716064453125, 3.57080078125, 3.8699951171875, 4.169189453125, 4.4683837890625, 4.767578125, 5.0667724609375, 5.365966796875, 5.6651611328125, 5.96435546875, 6.2635498046875, 6.562744140625, 6.8619384765625, 7.1611328125, 7.4603271484375, 7.759521484375, 8.0587158203125, 8.35791015625, 8.6571044921875, 8.956298828125, 9.2554931640625, 9.5546875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 10.0, 7.0, 8.0, 25.0, 32.0, 58.0, 94.0, 167.0, 234.0, 355.0, 610.0, 974.0, 1618.0, 2829.0, 4432.0, 7715.0, 12720.0, 22229.0, 39757.0, 72526.0, 132103.0, 303981.0, 1179624.0, 139069.0, 75917.0, 42087.0, 23710.0, 13843.0, 8228.0, 4789.0, 2908.0, 1719.0, 1061.0, 660.0, 370.0, 258.0, 139.0, 95.0, 58.0, 41.0, 22.0, 24.0, 17.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.3458251953125, -1.301025390625, -1.2562255859375, -1.21142578125, -1.1666259765625, -1.121826171875, -1.0770263671875, -1.0322265625, -0.9874267578125, -0.942626953125, -0.8978271484375, -0.85302734375, -0.8082275390625, -0.763427734375, -0.7186279296875, -0.673828125, -0.6290283203125, -0.584228515625, -0.5394287109375, -0.49462890625, -0.4498291015625, -0.405029296875, -0.3602294921875, -0.3154296875, -0.2706298828125, -0.225830078125, -0.1810302734375, -0.13623046875, -0.0914306640625, -0.046630859375, -0.0018310546875, 0.04296875, 0.0877685546875, 0.132568359375, 0.1773681640625, 0.22216796875, 0.2669677734375, 0.311767578125, 0.3565673828125, 0.4013671875, 0.4461669921875, 0.490966796875, 0.5357666015625, 0.58056640625, 0.6253662109375, 0.670166015625, 0.7149658203125, 0.759765625, 0.8045654296875, 0.849365234375, 0.8941650390625, 0.93896484375, 0.9837646484375, 1.028564453125, 1.0733642578125, 1.1181640625, 1.1629638671875, 1.207763671875, 1.2525634765625, 1.29736328125, 1.3421630859375, 1.386962890625, 1.4317626953125, 1.4765625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 13.0, 8.0, 12.0, 12.0, 16.0, 11.0, 15.0, 30.0, 36.0, 59.0, 70.0, 94.0, 126.0, 108.0, 92.0, 64.0, 30.0, 25.0, 39.0, 12.0, 17.0, 16.0, 12.0, 13.0, 8.0, 7.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026132822036743164, -0.025288105010986328, -0.024443387985229492, -0.023598670959472656, -0.02275395393371582, -0.021909236907958984, -0.02106451988220215, -0.020219802856445312, -0.019375085830688477, -0.01853036880493164, -0.017685651779174805, -0.01684093475341797, -0.015996217727661133, -0.015151500701904297, -0.014306783676147461, -0.013462066650390625, -0.012617349624633789, -0.011772632598876953, -0.010927915573120117, -0.010083198547363281, -0.009238481521606445, -0.00839376449584961, -0.0075490474700927734, -0.0067043304443359375, -0.0058596134185791016, -0.005014896392822266, -0.00417017936706543, -0.0033254623413085938, -0.002480745315551758, -0.0016360282897949219, -0.0007913112640380859, 5.340576171875e-05, 0.0008981227874755859, 0.0017428398132324219, 0.002587556838989258, 0.0034322738647460938, 0.00427699089050293, 0.005121707916259766, 0.0059664249420166016, 0.0068111419677734375, 0.0076558589935302734, 0.00850057601928711, 0.009345293045043945, 0.010190010070800781, 0.011034727096557617, 0.011879444122314453, 0.012724161148071289, 0.013568878173828125, 0.014413595199584961, 0.015258312225341797, 0.016103029251098633, 0.01694774627685547, 0.017792463302612305, 0.01863718032836914, 0.019481897354125977, 0.020326614379882812, 0.02117133140563965, 0.022016048431396484, 0.02286076545715332, 0.023705482482910156, 0.024550199508666992, 0.025394916534423828, 0.026239633560180664, 0.0270843505859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 2.0, 5.0, 8.0, 9.0, 17.0, 17.0, 19.0, 29.0, 47.0, 70.0, 73.0, 146.0, 346.0, 2284.0, 605991.0, 436572.0, 2055.0, 334.0, 170.0, 101.0, 51.0, 34.0, 31.0, 18.0, 12.0, 17.0, 12.0, 15.0, 7.0, 8.0, 3.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.57421875, -0.5562667846679688, -0.5383148193359375, -0.5203628540039062, -0.502410888671875, -0.48445892333984375, -0.4665069580078125, -0.44855499267578125, -0.43060302734375, -0.41265106201171875, -0.3946990966796875, -0.37674713134765625, -0.358795166015625, -0.34084320068359375, -0.3228912353515625, -0.30493927001953125, -0.2869873046875, -0.26903533935546875, -0.2510833740234375, -0.23313140869140625, -0.215179443359375, -0.19722747802734375, -0.1792755126953125, -0.16132354736328125, -0.14337158203125, -0.12541961669921875, -0.1074676513671875, -0.08951568603515625, -0.071563720703125, -0.05361175537109375, -0.0356597900390625, -0.01770782470703125, 0.000244140625, 0.01819610595703125, 0.0361480712890625, 0.05410003662109375, 0.072052001953125, 0.09000396728515625, 0.1079559326171875, 0.12590789794921875, 0.14385986328125, 0.16181182861328125, 0.1797637939453125, 0.19771575927734375, 0.215667724609375, 0.23361968994140625, 0.2515716552734375, 0.26952362060546875, 0.2874755859375, 0.30542755126953125, 0.3233795166015625, 0.34133148193359375, 0.359283447265625, 0.37723541259765625, 0.3951873779296875, 0.41313934326171875, 0.43109130859375, 0.44904327392578125, 0.4669952392578125, 0.48494720458984375, 0.502899169921875, 0.5208511352539062, 0.5388031005859375, 0.5567550659179688, 0.57470703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 15.0, 37.0, 85.0, 289.0, 383.0, 111.0, 54.0, 17.0, 3.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09389685094356537, -0.08982937037944794, -0.0857618898153305, -0.08169440180063248, -0.07762692123651505, -0.07355944067239761, -0.06949195265769958, -0.06542447209358215, -0.06135699152946472, -0.05728951096534729, -0.05322202667593956, -0.04915454238653183, -0.0450870618224144, -0.04101958125829697, -0.036952096968889236, -0.032884612679481506, -0.028817132115364075, -0.024749649688601494, -0.020682167261838913, -0.016614684835076332, -0.012547202408313751, -0.00847971998155117, -0.0044122375547885895, -0.0003447551280260086, 0.0037227272987365723, 0.007790209725499153, 0.011857692152261734, 0.015925174579024315, 0.019992657005786896, 0.024060139432549477, 0.028127621859312057, 0.03219510614871979, 0.03626260161399841, 0.040330082178115845, 0.044397566467523575, 0.048465050756931305, 0.05253253132104874, 0.05660001188516617, 0.0606674961745739, 0.06473498046398163, 0.06880246102809906, 0.07286994159221649, 0.07693742215633392, 0.08100491017103195, 0.08507239073514938, 0.08913987129926682, 0.09320735931396484, 0.09727483987808228, 0.10134232044219971, 0.10540980100631714, 0.10947728157043457, 0.1135447695851326, 0.11761225014925003, 0.12167973071336746, 0.1257472187280655, 0.12981469929218292, 0.13388217985630035, 0.13794966042041779, 0.14201714098453522, 0.14608462154865265, 0.15015211701393127, 0.1542195975780487, 0.15828707814216614, 0.16235455870628357, 0.166422039270401]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 7.0, 9.0, 7.0, 5.0, 8.0, 13.0, 16.0, 12.0, 16.0, 23.0, 24.0, 19.0, 24.0, 33.0, 27.0, 19.0, 29.0, 36.0, 46.0, 53.0, 48.0, 31.0, 45.0, 42.0, 36.0, 28.0, 31.0, 29.0, 21.0, 25.0, 26.0, 31.0, 21.0, 28.0, 17.0, 11.0, 14.0, 14.0, 7.0, 17.0, 6.0, 5.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.020461082458496094, -0.019826708361506462, -0.01919233426451683, -0.0185579601675272, -0.017923586070537567, -0.017289211973547935, -0.016654837876558304, -0.016020463779568672, -0.01538608968257904, -0.014751715585589409, -0.014117341488599777, -0.013482967391610146, -0.012848593294620514, -0.012214219197630882, -0.01157984510064125, -0.010945471003651619, -0.010311096906661987, -0.009676722809672356, -0.009042348712682724, -0.008407974615693092, -0.007773600518703461, -0.007139226421713829, -0.006504852324724197, -0.005870478227734566, -0.005236104130744934, -0.004601730033755302, -0.003967355936765671, -0.003332981839776039, -0.0026986077427864075, -0.002064233645796776, -0.0014298595488071442, -0.0007954854518175125, -0.00016111135482788086, 0.0004732627421617508, 0.0011076368391513824, 0.001742010936141014, 0.0023763850331306458, 0.0030107591301202774, 0.003645133227109909, 0.004279507324099541, 0.004913881421089172, 0.005548255518078804, 0.006182629615068436, 0.006817003712058067, 0.007451377809047699, 0.00808575190603733, 0.008720126003026962, 0.009354500100016594, 0.009988874197006226, 0.010623248293995857, 0.011257622390985489, 0.01189199648797512, 0.012526370584964752, 0.013160744681954384, 0.013795118778944016, 0.014429492875933647, 0.015063866972923279, 0.01569824106991291, 0.016332615166902542, 0.016966989263892174, 0.017601363360881805, 0.018235737457871437, 0.01887011155486107, 0.0195044856518507, 0.020138859748840332]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 11.0, 23.0, 19.0, 23.0, 22.0, 25.0, 28.0, 31.0, 44.0, 51.0, 41.0, 47.0, 57.0, 46.0, 48.0, 69.0, 45.0, 29.0, 35.0, 34.0, 36.0, 37.0, 22.0, 28.0, 24.0, 16.0, 17.0, 13.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.142822265625, -13.68408203125, -13.225341796875, -12.7666015625, -12.307861328125, -11.84912109375, -11.390380859375, -10.931640625, -10.472900390625, -10.01416015625, -9.555419921875, -9.0966796875, -8.637939453125, -8.17919921875, -7.720458984375, -7.26171875, -6.802978515625, -6.34423828125, -5.885498046875, -5.4267578125, -4.968017578125, -4.50927734375, -4.050537109375, -3.591796875, -3.133056640625, -2.67431640625, -2.215576171875, -1.7568359375, -1.298095703125, -0.83935546875, -0.380615234375, 0.078125, 0.536865234375, 0.99560546875, 1.454345703125, 1.9130859375, 2.371826171875, 2.83056640625, 3.289306640625, 3.748046875, 4.206787109375, 4.66552734375, 5.124267578125, 5.5830078125, 6.041748046875, 6.50048828125, 6.959228515625, 7.41796875, 7.876708984375, 8.33544921875, 8.794189453125, 9.2529296875, 9.711669921875, 10.17041015625, 10.629150390625, 11.087890625, 11.546630859375, 12.00537109375, 12.464111328125, 12.9228515625, 13.381591796875, 13.84033203125, 14.299072265625, 14.7578125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 7.0, 21.0, 27.0, 41.0, 59.0, 72.0, 101.0, 133.0, 189.0, 260.0, 344.0, 499.0, 648.0, 858.0, 1183.0, 1641.0, 2365.0, 3407.0, 5235.0, 8035.0, 13841.0, 26391.0, 60084.0, 185242.0, 473087.0, 152171.0, 52511.0, 23526.0, 12828.0, 7644.0, 4792.0, 3186.0, 2234.0, 1553.0, 1146.0, 862.0, 653.0, 444.0, 349.0, 242.0, 165.0, 118.0, 115.0, 74.0, 50.0, 27.0, 32.0, 18.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 2.0, 2.0], "bins": [-10.4296875, -10.1080322265625, -9.786376953125, -9.4647216796875, -9.14306640625, -8.8214111328125, -8.499755859375, -8.1781005859375, -7.8564453125, -7.5347900390625, -7.213134765625, -6.8914794921875, -6.56982421875, -6.2481689453125, -5.926513671875, -5.6048583984375, -5.283203125, -4.9615478515625, -4.639892578125, -4.3182373046875, -3.99658203125, -3.6749267578125, -3.353271484375, -3.0316162109375, -2.7099609375, -2.3883056640625, -2.066650390625, -1.7449951171875, -1.42333984375, -1.1016845703125, -0.780029296875, -0.4583740234375, -0.13671875, 0.1849365234375, 0.506591796875, 0.8282470703125, 1.14990234375, 1.4715576171875, 1.793212890625, 2.1148681640625, 2.4365234375, 2.7581787109375, 3.079833984375, 3.4014892578125, 3.72314453125, 4.0447998046875, 4.366455078125, 4.6881103515625, 5.009765625, 5.3314208984375, 5.653076171875, 5.9747314453125, 6.29638671875, 6.6180419921875, 6.939697265625, 7.2613525390625, 7.5830078125, 7.9046630859375, 8.226318359375, 8.5479736328125, 8.86962890625, 9.1912841796875, 9.512939453125, 9.8345947265625, 10.15625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 10.0, 6.0, 12.0, 10.0, 21.0, 14.0, 20.0, 28.0, 23.0, 37.0, 38.0, 36.0, 52.0, 47.0, 51.0, 75.0, 128.0, 1713.0, 205.0, 80.0, 49.0, 38.0, 47.0, 35.0, 26.0, 26.0, 28.0, 26.0, 31.0, 21.0, 20.0, 21.0, 6.0, 5.0, 15.0, 8.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -35.11865234375, -33.7998046875, -32.48095703125, -31.162109375, -29.84326171875, -28.5244140625, -27.20556640625, -25.88671875, -24.56787109375, -23.2490234375, -21.93017578125, -20.611328125, -19.29248046875, -17.9736328125, -16.65478515625, -15.3359375, -14.01708984375, -12.6982421875, -11.37939453125, -10.060546875, -8.74169921875, -7.4228515625, -6.10400390625, -4.78515625, -3.46630859375, -2.1474609375, -0.82861328125, 0.490234375, 1.80908203125, 3.1279296875, 4.44677734375, 5.765625, 7.08447265625, 8.4033203125, 9.72216796875, 11.041015625, 12.35986328125, 13.6787109375, 14.99755859375, 16.31640625, 17.63525390625, 18.9541015625, 20.27294921875, 21.591796875, 22.91064453125, 24.2294921875, 25.54833984375, 26.8671875, 28.18603515625, 29.5048828125, 30.82373046875, 32.142578125, 33.46142578125, 34.7802734375, 36.09912109375, 37.41796875, 38.73681640625, 40.0556640625, 41.37451171875, 42.693359375, 44.01220703125, 45.3310546875, 46.64990234375, 47.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 15.0, 7.0, 12.0, 11.0, 7.0, 24.0, 24.0, 29.0, 34.0, 66.0, 56.0, 70.0, 97.0, 133.0, 161.0, 238.0, 423.0, 1588.0, 23523.0, 3064472.0, 50803.0, 2368.0, 510.0, 257.0, 174.0, 133.0, 102.0, 75.0, 65.0, 57.0, 32.0, 27.0, 32.0, 16.0, 12.0, 12.0, 8.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-113.0625, -109.97265625, -106.8828125, -103.79296875, -100.703125, -97.61328125, -94.5234375, -91.43359375, -88.34375, -85.25390625, -82.1640625, -79.07421875, -75.984375, -72.89453125, -69.8046875, -66.71484375, -63.625, -60.53515625, -57.4453125, -54.35546875, -51.265625, -48.17578125, -45.0859375, -41.99609375, -38.90625, -35.81640625, -32.7265625, -29.63671875, -26.546875, -23.45703125, -20.3671875, -17.27734375, -14.1875, -11.09765625, -8.0078125, -4.91796875, -1.828125, 1.26171875, 4.3515625, 7.44140625, 10.53125, 13.62109375, 16.7109375, 19.80078125, 22.890625, 25.98046875, 29.0703125, 32.16015625, 35.25, 38.33984375, 41.4296875, 44.51953125, 47.609375, 50.69921875, 53.7890625, 56.87890625, 59.96875, 63.05859375, 66.1484375, 69.23828125, 72.328125, 75.41796875, 78.5078125, 81.59765625, 84.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 260.0, 675.0, 66.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-573.7492065429688, -563.7349243164062, -553.7206420898438, -543.7064208984375, -533.692138671875, -523.6778564453125, -513.66357421875, -503.6492919921875, -493.6350402832031, -483.6207580566406, -473.60650634765625, -463.59222412109375, -453.57794189453125, -443.5636901855469, -433.5494079589844, -423.53515625, -413.5208740234375, -403.506591796875, -393.4923400878906, -383.4780578613281, -373.4637756347656, -363.44952392578125, -353.43524169921875, -343.42095947265625, -333.40667724609375, -323.39239501953125, -313.3781433105469, -303.3638610839844, -293.3495788574219, -283.3353271484375, -273.321044921875, -263.3067626953125, -253.29254150390625, -243.2782745361328, -233.2639923095703, -223.24972534179688, -213.23545837402344, -203.22119140625, -193.2069091796875, -183.19264221191406, -173.17835998535156, -163.16409301757812, -153.14981079101562, -143.1355438232422, -133.12127685546875, -123.10700225830078, -113.09272766113281, -103.07846069335938, -93.0641860961914, -83.04991149902344, -73.03564453125, -63.02136993408203, -53.00709915161133, -42.992828369140625, -32.978553771972656, -22.96428680419922, -12.95001220703125, -2.9357404708862305, 7.078531265258789, 17.092803955078125, 27.107074737548828, 37.12134552001953, 47.1356201171875, 57.14988708496094, 67.1641616821289]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 3.0, 5.0, 13.0, 8.0, 12.0, 15.0, 13.0, 17.0, 19.0, 18.0, 18.0, 28.0, 31.0, 29.0, 37.0, 32.0, 40.0, 37.0, 37.0, 36.0, 40.0, 27.0, 38.0, 28.0, 28.0, 39.0, 35.0, 36.0, 28.0, 29.0, 35.0, 24.0, 17.0, 25.0, 24.0, 15.0, 9.0, 21.0, 7.0, 8.0, 5.0, 5.0, 5.0, 7.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-84.82170104980469, -82.07544708251953, -79.32918548583984, -76.58293151855469, -73.836669921875, -71.09041595458984, -68.34415435791016, -65.597900390625, -62.85163879394531, -60.10538101196289, -57.35912322998047, -54.61286544799805, -51.866607666015625, -49.1203498840332, -46.37409210205078, -43.627838134765625, -40.8815803527832, -38.13532257080078, -35.38906478881836, -32.64280700683594, -29.896549224853516, -27.150291442871094, -24.404035568237305, -21.657777786254883, -18.91152000427246, -16.16526222229004, -13.419004440307617, -10.672747611999512, -7.92648983001709, -5.180232048034668, -2.4339752197265625, 0.3122825622558594, 3.0585403442382812, 5.804798126220703, 8.551055908203125, 11.29731273651123, 14.043570518493652, 16.78982925415039, 19.53608512878418, 22.2823429107666, 25.028600692749023, 27.774858474731445, 30.521116256713867, 33.267372131347656, 36.01362991333008, 38.7598876953125, 41.50614547729492, 44.252403259277344, 46.998661041259766, 49.74491882324219, 52.49117660522461, 55.23743438720703, 57.98369216918945, 60.729949951171875, 63.47620391845703, 66.22246551513672, 68.96871948242188, 71.71497344970703, 74.46123504638672, 77.20748901367188, 79.95375061035156, 82.70000457763672, 85.4462661743164, 88.19252014160156, 90.93878173828125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 5.0, 9.0, 8.0, 12.0, 10.0, 20.0, 25.0, 21.0, 23.0, 37.0, 26.0, 32.0, 43.0, 41.0, 34.0, 53.0, 44.0, 54.0, 48.0, 56.0, 43.0, 35.0, 31.0, 29.0, 25.0, 36.0, 29.0, 26.0, 34.0, 17.0, 21.0, 9.0, 13.0, 8.0, 10.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.78125, -14.33056640625, -13.8798828125, -13.42919921875, -12.978515625, -12.52783203125, -12.0771484375, -11.62646484375, -11.17578125, -10.72509765625, -10.2744140625, -9.82373046875, -9.373046875, -8.92236328125, -8.4716796875, -8.02099609375, -7.5703125, -7.11962890625, -6.6689453125, -6.21826171875, -5.767578125, -5.31689453125, -4.8662109375, -4.41552734375, -3.96484375, -3.51416015625, -3.0634765625, -2.61279296875, -2.162109375, -1.71142578125, -1.2607421875, -0.81005859375, -0.359375, 0.09130859375, 0.5419921875, 0.99267578125, 1.443359375, 1.89404296875, 2.3447265625, 2.79541015625, 3.24609375, 3.69677734375, 4.1474609375, 4.59814453125, 5.048828125, 5.49951171875, 5.9501953125, 6.40087890625, 6.8515625, 7.30224609375, 7.7529296875, 8.20361328125, 8.654296875, 9.10498046875, 9.5556640625, 10.00634765625, 10.45703125, 10.90771484375, 11.3583984375, 11.80908203125, 12.259765625, 12.71044921875, 13.1611328125, 13.61181640625, 14.0625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 5.0, 11.0, 7.0, 12.0, 20.0, 28.0, 30.0, 31.0, 62.0, 90.0, 175.0, 399.0, 930.0, 2828.0, 9052.0, 40863.0, 616064.0, 3136114.0, 349498.0, 27801.0, 6621.0, 2100.0, 751.0, 296.0, 160.0, 85.0, 62.0, 33.0, 28.0, 25.0, 20.0, 14.0, 12.0, 11.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.9375, -37.77197265625, -36.6064453125, -35.44091796875, -34.275390625, -33.10986328125, -31.9443359375, -30.77880859375, -29.61328125, -28.44775390625, -27.2822265625, -26.11669921875, -24.951171875, -23.78564453125, -22.6201171875, -21.45458984375, -20.2890625, -19.12353515625, -17.9580078125, -16.79248046875, -15.626953125, -14.46142578125, -13.2958984375, -12.13037109375, -10.96484375, -9.79931640625, -8.6337890625, -7.46826171875, -6.302734375, -5.13720703125, -3.9716796875, -2.80615234375, -1.640625, -0.47509765625, 0.6904296875, 1.85595703125, 3.021484375, 4.18701171875, 5.3525390625, 6.51806640625, 7.68359375, 8.84912109375, 10.0146484375, 11.18017578125, 12.345703125, 13.51123046875, 14.6767578125, 15.84228515625, 17.0078125, 18.17333984375, 19.3388671875, 20.50439453125, 21.669921875, 22.83544921875, 24.0009765625, 25.16650390625, 26.33203125, 27.49755859375, 28.6630859375, 29.82861328125, 30.994140625, 32.15966796875, 33.3251953125, 34.49072265625, 35.65625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 9.0, 7.0, 17.0, 28.0, 25.0, 33.0, 51.0, 76.0, 124.0, 192.0, 274.0, 458.0, 725.0, 779.0, 481.0, 288.0, 157.0, 109.0, 73.0, 45.0, 32.0, 19.0, 14.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.953125, -30.9560546875, -29.958984375, -28.9619140625, -27.96484375, -26.9677734375, -25.970703125, -24.9736328125, -23.9765625, -22.9794921875, -21.982421875, -20.9853515625, -19.98828125, -18.9912109375, -17.994140625, -16.9970703125, -16.0, -15.0029296875, -14.005859375, -13.0087890625, -12.01171875, -11.0146484375, -10.017578125, -9.0205078125, -8.0234375, -7.0263671875, -6.029296875, -5.0322265625, -4.03515625, -3.0380859375, -2.041015625, -1.0439453125, -0.046875, 0.9501953125, 1.947265625, 2.9443359375, 3.94140625, 4.9384765625, 5.935546875, 6.9326171875, 7.9296875, 8.9267578125, 9.923828125, 10.9208984375, 11.91796875, 12.9150390625, 13.912109375, 14.9091796875, 15.90625, 16.9033203125, 17.900390625, 18.8974609375, 19.89453125, 20.8916015625, 21.888671875, 22.8857421875, 23.8828125, 24.8798828125, 25.876953125, 26.8740234375, 27.87109375, 28.8681640625, 29.865234375, 30.8623046875, 31.859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 4.0, 10.0, 9.0, 10.0, 16.0, 25.0, 42.0, 61.0, 99.0, 166.0, 339.0, 1213.0, 21730.0, 4045399.0, 121289.0, 2711.0, 513.0, 220.0, 153.0, 79.0, 46.0, 37.0, 26.0, 23.0, 13.0, 14.0, 6.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.625, -141.02734375, -136.4296875, -131.83203125, -127.234375, -122.63671875, -118.0390625, -113.44140625, -108.84375, -104.24609375, -99.6484375, -95.05078125, -90.453125, -85.85546875, -81.2578125, -76.66015625, -72.0625, -67.46484375, -62.8671875, -58.26953125, -53.671875, -49.07421875, -44.4765625, -39.87890625, -35.28125, -30.68359375, -26.0859375, -21.48828125, -16.890625, -12.29296875, -7.6953125, -3.09765625, 1.5, 6.09765625, 10.6953125, 15.29296875, 19.890625, 24.48828125, 29.0859375, 33.68359375, 38.28125, 42.87890625, 47.4765625, 52.07421875, 56.671875, 61.26953125, 65.8671875, 70.46484375, 75.0625, 79.66015625, 84.2578125, 88.85546875, 93.453125, 98.05078125, 102.6484375, 107.24609375, 111.84375, 116.44140625, 121.0390625, 125.63671875, 130.234375, 134.83203125, 139.4296875, 144.02734375, 148.625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 7.0, 19.0, 33.0, 53.0, 107.0, 161.0, 203.0, 168.0, 119.0, 65.0, 36.0, 21.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.8119354248047, -185.6131134033203, -180.41429138183594, -175.21548461914062, -170.01666259765625, -164.81784057617188, -159.6190185546875, -154.42019653320312, -149.22137451171875, -144.02255249023438, -138.82373046875, -133.62490844726562, -128.4261016845703, -123.22727966308594, -118.02845764160156, -112.82963562011719, -107.63082122802734, -102.43199920654297, -97.23318481445312, -92.03436279296875, -86.83554077148438, -81.63671875, -76.43790435791016, -71.23908233642578, -66.04026794433594, -60.84144973754883, -55.64262771606445, -50.443809509277344, -45.24498748779297, -40.04616928100586, -34.84735107421875, -29.648529052734375, -24.44970703125, -19.250886917114258, -14.052067756652832, -8.853248596191406, -3.654428482055664, 1.5443916320800781, 6.7432098388671875, 11.942031860351562, 17.140850067138672, 22.339670181274414, 27.538490295410156, 32.737308502197266, 37.936126708984375, 43.13494873046875, 48.33376693725586, 53.532588958740234, 58.731407165527344, 63.93022537231445, 69.12904357910156, 74.32786560058594, 79.52668762207031, 84.72550964355469, 89.92432403564453, 95.1231460571289, 100.32196044921875, 105.52078247070312, 110.71959686279297, 115.91841888427734, 121.11724090576172, 126.31605529785156, 131.51487731933594, 136.7136993408203, 141.9125213623047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 7.0, 6.0, 7.0, 12.0, 17.0, 13.0, 21.0, 21.0, 18.0, 22.0, 30.0, 27.0, 37.0, 19.0, 25.0, 35.0, 35.0, 45.0, 42.0, 58.0, 35.0, 37.0, 35.0, 40.0, 32.0, 41.0, 44.0, 28.0, 22.0, 24.0, 23.0, 25.0, 12.0, 7.0, 12.0, 12.0, 11.0, 8.0, 9.0, 13.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.4686279296875, -76.06810760498047, -73.66758728027344, -71.26707458496094, -68.8665542602539, -66.46603393554688, -64.06552124023438, -61.665000915527344, -59.26448059082031, -56.86396026611328, -54.463443756103516, -52.06292724609375, -49.66240692138672, -47.26188659667969, -44.86137008666992, -42.460853576660156, -40.060333251953125, -37.659812927246094, -35.25929641723633, -32.85877990722656, -30.45825958251953, -28.057741165161133, -25.657222747802734, -23.256704330444336, -20.856185913085938, -18.45566749572754, -16.05514907836914, -13.654630661010742, -11.254112243652344, -8.853593826293945, -6.453075408935547, -4.052556991577148, -1.65203857421875, 0.7484798431396484, 3.148998260498047, 5.549516677856445, 7.950035095214844, 10.350553512573242, 12.75107192993164, 15.151590347290039, 17.552108764648438, 19.952627182006836, 22.353145599365234, 24.753664016723633, 27.15418243408203, 29.55470085144043, 31.955219268798828, 34.355735778808594, 36.756256103515625, 39.156776428222656, 41.55729293823242, 43.95780944824219, 46.35832977294922, 48.75885009765625, 51.159366607666016, 53.55988311767578, 55.96040344238281, 58.360923767089844, 60.76144027709961, 63.161956787109375, 65.5624771118164, 67.96299743652344, 70.36351013183594, 72.76403045654297, 75.16455078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 3.0, 7.0, 6.0, 9.0, 17.0, 11.0, 18.0, 17.0, 17.0, 21.0, 32.0, 28.0, 28.0, 28.0, 35.0, 47.0, 37.0, 41.0, 46.0, 41.0, 46.0, 52.0, 44.0, 36.0, 39.0, 34.0, 28.0, 32.0, 20.0, 29.0, 24.0, 20.0, 15.0, 18.0, 17.0, 14.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.9765625, -12.5673828125, -12.158203125, -11.7490234375, -11.33984375, -10.9306640625, -10.521484375, -10.1123046875, -9.703125, -9.2939453125, -8.884765625, -8.4755859375, -8.06640625, -7.6572265625, -7.248046875, -6.8388671875, -6.4296875, -6.0205078125, -5.611328125, -5.2021484375, -4.79296875, -4.3837890625, -3.974609375, -3.5654296875, -3.15625, -2.7470703125, -2.337890625, -1.9287109375, -1.51953125, -1.1103515625, -0.701171875, -0.2919921875, 0.1171875, 0.5263671875, 0.935546875, 1.3447265625, 1.75390625, 2.1630859375, 2.572265625, 2.9814453125, 3.390625, 3.7998046875, 4.208984375, 4.6181640625, 5.02734375, 5.4365234375, 5.845703125, 6.2548828125, 6.6640625, 7.0732421875, 7.482421875, 7.8916015625, 8.30078125, 8.7099609375, 9.119140625, 9.5283203125, 9.9375, 10.3466796875, 10.755859375, 11.1650390625, 11.57421875, 11.9833984375, 12.392578125, 12.8017578125, 13.2109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 15.0, 17.0, 33.0, 53.0, 77.0, 166.0, 200.0, 349.0, 478.0, 787.0, 1226.0, 2041.0, 3305.0, 5289.0, 8342.0, 13797.0, 22954.0, 39434.0, 68076.0, 119629.0, 194175.0, 217200.0, 146038.0, 84727.0, 48798.0, 28128.0, 16661.0, 9847.0, 6135.0, 3885.0, 2467.0, 1588.0, 948.0, 668.0, 389.0, 224.0, 162.0, 79.0, 73.0, 38.0, 27.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.16705322265625, -2.0997314453125, -2.03240966796875, -1.965087890625, -1.89776611328125, -1.8304443359375, -1.76312255859375, -1.69580078125, -1.62847900390625, -1.5611572265625, -1.49383544921875, -1.426513671875, -1.35919189453125, -1.2918701171875, -1.22454833984375, -1.1572265625, -1.08990478515625, -1.0225830078125, -0.95526123046875, -0.887939453125, -0.82061767578125, -0.7532958984375, -0.68597412109375, -0.61865234375, -0.55133056640625, -0.4840087890625, -0.41668701171875, -0.349365234375, -0.28204345703125, -0.2147216796875, -0.14739990234375, -0.080078125, -0.01275634765625, 0.0545654296875, 0.12188720703125, 0.189208984375, 0.25653076171875, 0.3238525390625, 0.39117431640625, 0.45849609375, 0.52581787109375, 0.5931396484375, 0.66046142578125, 0.727783203125, 0.79510498046875, 0.8624267578125, 0.92974853515625, 0.9970703125, 1.06439208984375, 1.1317138671875, 1.19903564453125, 1.266357421875, 1.33367919921875, 1.4010009765625, 1.46832275390625, 1.53564453125, 1.60296630859375, 1.6702880859375, 1.73760986328125, 1.804931640625, 1.87225341796875, 1.9395751953125, 2.00689697265625, 2.07421875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 6.0, 13.0, 13.0, 9.0, 22.0, 22.0, 26.0, 36.0, 30.0, 34.0, 31.0, 43.0, 50.0, 32.0, 42.0, 48.0, 52.0, 1078.0, 44.0, 40.0, 50.0, 35.0, 29.0, 45.0, 40.0, 22.0, 19.0, 16.0, 19.0, 20.0, 14.0, 11.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.065185546875, -10.73974609375, -10.414306640625, -10.0888671875, -9.763427734375, -9.43798828125, -9.112548828125, -8.787109375, -8.461669921875, -8.13623046875, -7.810791015625, -7.4853515625, -7.159912109375, -6.83447265625, -6.509033203125, -6.18359375, -5.858154296875, -5.53271484375, -5.207275390625, -4.8818359375, -4.556396484375, -4.23095703125, -3.905517578125, -3.580078125, -3.254638671875, -2.92919921875, -2.603759765625, -2.2783203125, -1.952880859375, -1.62744140625, -1.302001953125, -0.9765625, -0.651123046875, -0.32568359375, -0.000244140625, 0.3251953125, 0.650634765625, 0.97607421875, 1.301513671875, 1.626953125, 1.952392578125, 2.27783203125, 2.603271484375, 2.9287109375, 3.254150390625, 3.57958984375, 3.905029296875, 4.23046875, 4.555908203125, 4.88134765625, 5.206787109375, 5.5322265625, 5.857666015625, 6.18310546875, 6.508544921875, 6.833984375, 7.159423828125, 7.48486328125, 7.810302734375, 8.1357421875, 8.461181640625, 8.78662109375, 9.112060546875, 9.4375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 3.0, 11.0, 11.0, 23.0, 33.0, 48.0, 70.0, 87.0, 152.0, 228.0, 310.0, 500.0, 743.0, 1288.0, 2066.0, 3398.0, 5874.0, 9633.0, 16190.0, 27883.0, 48698.0, 85767.0, 148569.0, 1265239.0, 197673.0, 118913.0, 68412.0, 39405.0, 22666.0, 13288.0, 7808.0, 4615.0, 2735.0, 1700.0, 1089.0, 665.0, 461.0, 284.0, 187.0, 131.0, 72.0, 64.0, 36.0, 36.0, 11.0, 17.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.322265625, -1.279327392578125, -1.23638916015625, -1.193450927734375, -1.1505126953125, -1.107574462890625, -1.06463623046875, -1.021697998046875, -0.978759765625, -0.935821533203125, -0.89288330078125, -0.849945068359375, -0.8070068359375, -0.764068603515625, -0.72113037109375, -0.678192138671875, -0.63525390625, -0.592315673828125, -0.54937744140625, -0.506439208984375, -0.4635009765625, -0.420562744140625, -0.37762451171875, -0.334686279296875, -0.291748046875, -0.248809814453125, -0.20587158203125, -0.162933349609375, -0.1199951171875, -0.077056884765625, -0.03411865234375, 0.008819580078125, 0.0517578125, 0.094696044921875, 0.13763427734375, 0.180572509765625, 0.2235107421875, 0.266448974609375, 0.30938720703125, 0.352325439453125, 0.395263671875, 0.438201904296875, 0.48114013671875, 0.524078369140625, 0.5670166015625, 0.609954833984375, 0.65289306640625, 0.695831298828125, 0.73876953125, 0.781707763671875, 0.82464599609375, 0.867584228515625, 0.9105224609375, 0.953460693359375, 0.99639892578125, 1.039337158203125, 1.082275390625, 1.125213623046875, 1.16815185546875, 1.211090087890625, 1.2540283203125, 1.296966552734375, 1.33990478515625, 1.382843017578125, 1.42578125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 11.0, 13.0, 6.0, 12.0, 14.0, 17.0, 26.0, 36.0, 32.0, 48.0, 69.0, 87.0, 122.0, 115.0, 74.0, 60.0, 50.0, 39.0, 33.0, 29.0, 17.0, 14.0, 9.0, 12.0, 15.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02679443359375, -0.02590203285217285, -0.025009632110595703, -0.024117231369018555, -0.023224830627441406, -0.022332429885864258, -0.02144002914428711, -0.02054762840270996, -0.019655227661132812, -0.018762826919555664, -0.017870426177978516, -0.016978025436401367, -0.01608562469482422, -0.01519322395324707, -0.014300823211669922, -0.013408422470092773, -0.012516021728515625, -0.011623620986938477, -0.010731220245361328, -0.00983881950378418, -0.008946418762207031, -0.008054018020629883, -0.007161617279052734, -0.006269216537475586, -0.0053768157958984375, -0.004484415054321289, -0.0035920143127441406, -0.002699613571166992, -0.0018072128295898438, -0.0009148120880126953, -2.2411346435546875e-05, 0.0008699893951416016, 0.00176239013671875, 0.0026547908782958984, 0.003547191619873047, 0.004439592361450195, 0.005331993103027344, 0.006224393844604492, 0.007116794586181641, 0.008009195327758789, 0.008901596069335938, 0.009793996810913086, 0.010686397552490234, 0.011578798294067383, 0.012471199035644531, 0.01336359977722168, 0.014256000518798828, 0.015148401260375977, 0.016040802001953125, 0.016933202743530273, 0.017825603485107422, 0.01871800422668457, 0.01961040496826172, 0.020502805709838867, 0.021395206451416016, 0.022287607192993164, 0.023180007934570312, 0.02407240867614746, 0.02496480941772461, 0.025857210159301758, 0.026749610900878906, 0.027642011642456055, 0.028534412384033203, 0.02942681312561035, 0.0303192138671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 0.0, 7.0, 5.0, 14.0, 13.0, 15.0, 14.0, 17.0, 32.0, 51.0, 66.0, 83.0, 164.0, 354.0, 1210.0, 805891.0, 238863.0, 963.0, 323.0, 152.0, 84.0, 51.0, 47.0, 28.0, 24.0, 16.0, 7.0, 14.0, 13.0, 8.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.630279541015625, -0.61114501953125, -0.592010498046875, -0.5728759765625, -0.553741455078125, -0.53460693359375, -0.515472412109375, -0.496337890625, -0.477203369140625, -0.45806884765625, -0.438934326171875, -0.4197998046875, -0.400665283203125, -0.38153076171875, -0.362396240234375, -0.34326171875, -0.324127197265625, -0.30499267578125, -0.285858154296875, -0.2667236328125, -0.247589111328125, -0.22845458984375, -0.209320068359375, -0.190185546875, -0.171051025390625, -0.15191650390625, -0.132781982421875, -0.1136474609375, -0.094512939453125, -0.07537841796875, -0.056243896484375, -0.037109375, -0.017974853515625, 0.00115966796875, 0.020294189453125, 0.0394287109375, 0.058563232421875, 0.07769775390625, 0.096832275390625, 0.115966796875, 0.135101318359375, 0.15423583984375, 0.173370361328125, 0.1925048828125, 0.211639404296875, 0.23077392578125, 0.249908447265625, 0.26904296875, 0.288177490234375, 0.30731201171875, 0.326446533203125, 0.3455810546875, 0.364715576171875, 0.38385009765625, 0.402984619140625, 0.422119140625, 0.441253662109375, 0.46038818359375, 0.479522705078125, 0.4986572265625, 0.517791748046875, 0.53692626953125, 0.556060791015625, 0.5751953125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 80.0, 881.0, 47.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11109989881515503, -0.09796919673681259, -0.08483849465847015, -0.07170780003070831, -0.05857709422707558, -0.04544639587402344, -0.032315693795681, -0.019184991717338562, -0.006054289638996124, 0.007076411508023739, 0.020207112655043602, 0.03333781287074089, 0.04646851494908333, 0.05959921330213547, 0.0727299153804779, 0.08586061745882034, 0.09899131953716278, 0.11212202161550522, 0.12525272369384766, 0.1383834183216095, 0.15151412785053253, 0.16464482247829437, 0.1777755320072174, 0.19090622663497925, 0.2040369212627411, 0.21716761589050293, 0.23029832541942596, 0.2434290200471878, 0.25655972957611084, 0.2696904242038727, 0.2828211188316345, 0.29595184326171875, 0.3090825378894806, 0.32221323251724243, 0.3353439271450043, 0.3484746515750885, 0.36160534620285034, 0.3747360408306122, 0.387866735458374, 0.40099745988845825, 0.4141281545162201, 0.42725884914398193, 0.4403895437717438, 0.453520268201828, 0.46665096282958984, 0.4797816574573517, 0.4929123520851135, 0.5060430765151978, 0.5191737413406372, 0.5323044657707214, 0.5454351305961609, 0.5585658550262451, 0.5716965198516846, 0.5848272442817688, 0.597957968711853, 0.6110886335372925, 0.6242193579673767, 0.6373500823974609, 0.6504807472229004, 0.6636114716529846, 0.6767421364784241, 0.6898728609085083, 0.7030035853385925, 0.716134250164032, 0.7292649745941162]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 11.0, 9.0, 16.0, 15.0, 16.0, 19.0, 18.0, 26.0, 30.0, 32.0, 33.0, 31.0, 30.0, 35.0, 37.0, 38.0, 36.0, 42.0, 37.0, 34.0, 28.0, 38.0, 30.0, 42.0, 32.0, 45.0, 24.0, 25.0, 20.0, 24.0, 30.0, 25.0, 19.0, 13.0, 9.0, 6.0, 5.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.03635573387145996, -0.03531833365559578, -0.0342809334397316, -0.033243533223867416, -0.032206133008003235, -0.031168732792139053, -0.030131332576274872, -0.02909393236041069, -0.02805653214454651, -0.027019131928682327, -0.025981731712818146, -0.024944331496953964, -0.023906931281089783, -0.0228695310652256, -0.02183213084936142, -0.020794730633497238, -0.019757330417633057, -0.018719930201768875, -0.017682529985904694, -0.016645129770040512, -0.01560772955417633, -0.014570329338312149, -0.013532929122447968, -0.012495528906583786, -0.011458128690719604, -0.010420728474855423, -0.009383328258991241, -0.00834592804312706, -0.007308527827262878, -0.006271127611398697, -0.005233727395534515, -0.004196327179670334, -0.0031589269638061523, -0.002121526747941971, -0.0010841265320777893, -4.672631621360779e-05, 0.0009906738996505737, 0.0020280741155147552, 0.0030654743313789368, 0.004102874547243118, 0.0051402747631073, 0.006177674978971481, 0.007215075194835663, 0.008252475410699844, 0.009289875626564026, 0.010327275842428207, 0.011364676058292389, 0.01240207627415657, 0.013439476490020752, 0.014476876705884933, 0.015514276921749115, 0.016551677137613297, 0.017589077353477478, 0.01862647756934166, 0.01966387778520584, 0.020701278001070023, 0.021738678216934204, 0.022776078432798386, 0.023813478648662567, 0.02485087886452675, 0.02588827908039093, 0.02692567929625511, 0.027963079512119293, 0.029000479727983475, 0.030037879943847656]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 3.0, 7.0, 6.0, 9.0, 17.0, 11.0, 18.0, 17.0, 17.0, 21.0, 32.0, 28.0, 28.0, 28.0, 35.0, 47.0, 36.0, 42.0, 46.0, 40.0, 44.0, 54.0, 45.0, 36.0, 39.0, 34.0, 28.0, 31.0, 20.0, 30.0, 24.0, 20.0, 15.0, 18.0, 17.0, 14.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.9765625, -12.5675048828125, -12.158447265625, -11.7493896484375, -11.34033203125, -10.9312744140625, -10.522216796875, -10.1131591796875, -9.7041015625, -9.2950439453125, -8.885986328125, -8.4769287109375, -8.06787109375, -7.6588134765625, -7.249755859375, -6.8406982421875, -6.431640625, -6.0225830078125, -5.613525390625, -5.2044677734375, -4.79541015625, -4.3863525390625, -3.977294921875, -3.5682373046875, -3.1591796875, -2.7501220703125, -2.341064453125, -1.9320068359375, -1.52294921875, -1.1138916015625, -0.704833984375, -0.2957763671875, 0.11328125, 0.5223388671875, 0.931396484375, 1.3404541015625, 1.74951171875, 2.1585693359375, 2.567626953125, 2.9766845703125, 3.3857421875, 3.7947998046875, 4.203857421875, 4.6129150390625, 5.02197265625, 5.4310302734375, 5.840087890625, 6.2491455078125, 6.658203125, 7.0672607421875, 7.476318359375, 7.8853759765625, 8.29443359375, 8.7034912109375, 9.112548828125, 9.5216064453125, 9.9306640625, 10.3397216796875, 10.748779296875, 11.1578369140625, 11.56689453125, 11.9759521484375, 12.385009765625, 12.7940673828125, 13.203125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 6.0, 5.0, 16.0, 16.0, 24.0, 13.0, 27.0, 51.0, 46.0, 88.0, 104.0, 147.0, 187.0, 261.0, 375.0, 551.0, 810.0, 1205.0, 1695.0, 2640.0, 4193.0, 6804.0, 11869.0, 23197.0, 53304.0, 167322.0, 509087.0, 159798.0, 51557.0, 22585.0, 11604.0, 6692.0, 4108.0, 2560.0, 1730.0, 1181.0, 806.0, 565.0, 350.0, 250.0, 202.0, 144.0, 97.0, 85.0, 38.0, 41.0, 36.0, 21.0, 21.0, 12.0, 5.0, 8.0, 5.0, 6.0, 2.0, 4.0, 1.0, 5.0], "bins": [-13.6796875, -13.258544921875, -12.83740234375, -12.416259765625, -11.9951171875, -11.573974609375, -11.15283203125, -10.731689453125, -10.310546875, -9.889404296875, -9.46826171875, -9.047119140625, -8.6259765625, -8.204833984375, -7.78369140625, -7.362548828125, -6.94140625, -6.520263671875, -6.09912109375, -5.677978515625, -5.2568359375, -4.835693359375, -4.41455078125, -3.993408203125, -3.572265625, -3.151123046875, -2.72998046875, -2.308837890625, -1.8876953125, -1.466552734375, -1.04541015625, -0.624267578125, -0.203125, 0.218017578125, 0.63916015625, 1.060302734375, 1.4814453125, 1.902587890625, 2.32373046875, 2.744873046875, 3.166015625, 3.587158203125, 4.00830078125, 4.429443359375, 4.8505859375, 5.271728515625, 5.69287109375, 6.114013671875, 6.53515625, 6.956298828125, 7.37744140625, 7.798583984375, 8.2197265625, 8.640869140625, 9.06201171875, 9.483154296875, 9.904296875, 10.325439453125, 10.74658203125, 11.167724609375, 11.5888671875, 12.010009765625, 12.43115234375, 12.852294921875, 13.2734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 6.0, 3.0, 10.0, 8.0, 6.0, 10.0, 16.0, 22.0, 22.0, 18.0, 24.0, 12.0, 36.0, 32.0, 44.0, 40.0, 43.0, 70.0, 100.0, 206.0, 1619.0, 188.0, 91.0, 63.0, 47.0, 42.0, 34.0, 45.0, 22.0, 27.0, 31.0, 28.0, 12.0, 17.0, 15.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.81689453125, -40.6025390625, -39.38818359375, -38.173828125, -36.95947265625, -35.7451171875, -34.53076171875, -33.31640625, -32.10205078125, -30.8876953125, -29.67333984375, -28.458984375, -27.24462890625, -26.0302734375, -24.81591796875, -23.6015625, -22.38720703125, -21.1728515625, -19.95849609375, -18.744140625, -17.52978515625, -16.3154296875, -15.10107421875, -13.88671875, -12.67236328125, -11.4580078125, -10.24365234375, -9.029296875, -7.81494140625, -6.6005859375, -5.38623046875, -4.171875, -2.95751953125, -1.7431640625, -0.52880859375, 0.685546875, 1.89990234375, 3.1142578125, 4.32861328125, 5.54296875, 6.75732421875, 7.9716796875, 9.18603515625, 10.400390625, 11.61474609375, 12.8291015625, 14.04345703125, 15.2578125, 16.47216796875, 17.6865234375, 18.90087890625, 20.115234375, 21.32958984375, 22.5439453125, 23.75830078125, 24.97265625, 26.18701171875, 27.4013671875, 28.61572265625, 29.830078125, 31.04443359375, 32.2587890625, 33.47314453125, 34.6875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 7.0, 8.0, 9.0, 9.0, 11.0, 23.0, 17.0, 29.0, 45.0, 68.0, 86.0, 117.0, 209.0, 320.0, 717.0, 2810.0, 41517.0, 3064573.0, 30974.0, 2517.0, 704.0, 310.0, 175.0, 106.0, 84.0, 61.0, 47.0, 34.0, 23.0, 21.0, 20.0, 12.0, 11.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-120.9375, -117.52734375, -114.1171875, -110.70703125, -107.296875, -103.88671875, -100.4765625, -97.06640625, -93.65625, -90.24609375, -86.8359375, -83.42578125, -80.015625, -76.60546875, -73.1953125, -69.78515625, -66.375, -62.96484375, -59.5546875, -56.14453125, -52.734375, -49.32421875, -45.9140625, -42.50390625, -39.09375, -35.68359375, -32.2734375, -28.86328125, -25.453125, -22.04296875, -18.6328125, -15.22265625, -11.8125, -8.40234375, -4.9921875, -1.58203125, 1.828125, 5.23828125, 8.6484375, 12.05859375, 15.46875, 18.87890625, 22.2890625, 25.69921875, 29.109375, 32.51953125, 35.9296875, 39.33984375, 42.75, 46.16015625, 49.5703125, 52.98046875, 56.390625, 59.80078125, 63.2109375, 66.62109375, 70.03125, 73.44140625, 76.8515625, 80.26171875, 83.671875, 87.08203125, 90.4921875, 93.90234375, 97.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 61.0, 434.0, 452.0, 54.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-414.2214660644531, -405.9256896972656, -397.6299133300781, -389.3341369628906, -381.0383605957031, -372.74261474609375, -364.44683837890625, -356.15106201171875, -347.85528564453125, -339.55950927734375, -331.26373291015625, -322.96795654296875, -314.67218017578125, -306.37640380859375, -298.08062744140625, -289.7848815917969, -281.48907470703125, -273.19329833984375, -264.89752197265625, -256.60174560546875, -248.3059844970703, -240.0102081298828, -231.7144317626953, -223.4186553955078, -215.12289428710938, -206.82711791992188, -198.53134155273438, -190.23556518554688, -181.93980407714844, -173.64402770996094, -165.34825134277344, -157.05247497558594, -148.75669860839844, -140.46092224121094, -132.16514587402344, -123.86937713623047, -115.5736083984375, -107.27783203125, -98.9820556640625, -90.686279296875, -82.39051055908203, -74.09473419189453, -65.79896545410156, -57.50318908691406, -49.20741653442383, -40.911643981933594, -32.615867614746094, -24.32009506225586, -16.024322509765625, -7.728549003601074, 0.5672245025634766, 8.862998962402344, 17.158771514892578, 25.454544067382812, 33.75032043457031, 42.04609298706055, 50.34186553955078, 58.637638092041016, 66.93341064453125, 75.22918701171875, 83.52496337890625, 91.82073211669922, 100.11650848388672, 108.41227722167969, 116.70805358886719]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 10.0, 12.0, 12.0, 14.0, 19.0, 13.0, 24.0, 23.0, 35.0, 34.0, 29.0, 35.0, 35.0, 38.0, 37.0, 38.0, 51.0, 45.0, 45.0, 41.0, 42.0, 34.0, 39.0, 40.0, 42.0, 45.0, 29.0, 28.0, 16.0, 25.0, 17.0, 11.0, 16.0, 5.0, 1.0, 2.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-105.38029479980469, -102.15509796142578, -98.92989349365234, -95.70469665527344, -92.4794921875, -89.2542953491211, -86.02909851074219, -82.80389404296875, -79.57869720458984, -76.35350036621094, -73.1282958984375, -69.9030990600586, -66.67789459228516, -63.45269775390625, -60.22749710083008, -57.002296447753906, -53.777095794677734, -50.55189514160156, -47.32669448852539, -44.10149383544922, -40.87629699707031, -37.65109634399414, -34.42589569091797, -31.20069694519043, -27.975496292114258, -24.750295639038086, -21.525096893310547, -18.299896240234375, -15.07469654083252, -11.849496841430664, -8.624296188354492, -5.399097442626953, -2.1738967895507812, 1.0513031482696533, 4.276503086090088, 7.501703262329102, 10.726902961730957, 13.952102661132812, 17.177303314208984, 20.402502059936523, 23.627702713012695, 26.852903366088867, 30.078102111816406, 33.30330276489258, 36.52850341796875, 39.753700256347656, 42.978904724121094, 46.2041015625, 49.42930221557617, 52.654502868652344, 55.879703521728516, 59.10490417480469, 62.330101013183594, 65.5552978515625, 68.78050231933594, 72.00569915771484, 75.23090362548828, 78.45610046386719, 81.68130493164062, 84.90650177001953, 88.13170623779297, 91.35690307617188, 94.58210754394531, 97.80730438232422, 101.03250122070312]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 13.0, 18.0, 21.0, 18.0, 26.0, 30.0, 20.0, 26.0, 38.0, 43.0, 41.0, 39.0, 37.0, 32.0, 40.0, 54.0, 51.0, 40.0, 42.0, 38.0, 27.0, 26.0, 25.0, 29.0, 24.0, 21.0, 29.0, 18.0, 14.0, 17.0, 10.0, 13.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.46875, -13.0440673828125, -12.619384765625, -12.1947021484375, -11.77001953125, -11.3453369140625, -10.920654296875, -10.4959716796875, -10.0712890625, -9.6466064453125, -9.221923828125, -8.7972412109375, -8.37255859375, -7.9478759765625, -7.523193359375, -7.0985107421875, -6.673828125, -6.2491455078125, -5.824462890625, -5.3997802734375, -4.97509765625, -4.5504150390625, -4.125732421875, -3.7010498046875, -3.2763671875, -2.8516845703125, -2.427001953125, -2.0023193359375, -1.57763671875, -1.1529541015625, -0.728271484375, -0.3035888671875, 0.12109375, 0.5457763671875, 0.970458984375, 1.3951416015625, 1.81982421875, 2.2445068359375, 2.669189453125, 3.0938720703125, 3.5185546875, 3.9432373046875, 4.367919921875, 4.7926025390625, 5.21728515625, 5.6419677734375, 6.066650390625, 6.4913330078125, 6.916015625, 7.3406982421875, 7.765380859375, 8.1900634765625, 8.61474609375, 9.0394287109375, 9.464111328125, 9.8887939453125, 10.3134765625, 10.7381591796875, 11.162841796875, 11.5875244140625, 12.01220703125, 12.4368896484375, 12.861572265625, 13.2862548828125, 13.7109375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 4.0, 11.0, 7.0, 14.0, 13.0, 26.0, 28.0, 32.0, 37.0, 60.0, 100.0, 225.0, 497.0, 1337.0, 3918.0, 16251.0, 190363.0, 3485395.0, 464503.0, 23695.0, 4881.0, 1574.0, 658.0, 244.0, 112.0, 64.0, 37.0, 23.0, 40.0, 21.0, 14.0, 8.0, 16.0, 11.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.25, -47.69189453125, -46.1337890625, -44.57568359375, -43.017578125, -41.45947265625, -39.9013671875, -38.34326171875, -36.78515625, -35.22705078125, -33.6689453125, -32.11083984375, -30.552734375, -28.99462890625, -27.4365234375, -25.87841796875, -24.3203125, -22.76220703125, -21.2041015625, -19.64599609375, -18.087890625, -16.52978515625, -14.9716796875, -13.41357421875, -11.85546875, -10.29736328125, -8.7392578125, -7.18115234375, -5.623046875, -4.06494140625, -2.5068359375, -0.94873046875, 0.609375, 2.16748046875, 3.7255859375, 5.28369140625, 6.841796875, 8.39990234375, 9.9580078125, 11.51611328125, 13.07421875, 14.63232421875, 16.1904296875, 17.74853515625, 19.306640625, 20.86474609375, 22.4228515625, 23.98095703125, 25.5390625, 27.09716796875, 28.6552734375, 30.21337890625, 31.771484375, 33.32958984375, 34.8876953125, 36.44580078125, 38.00390625, 39.56201171875, 41.1201171875, 42.67822265625, 44.236328125, 45.79443359375, 47.3525390625, 48.91064453125, 50.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 15.0, 17.0, 28.0, 38.0, 66.0, 117.0, 178.0, 394.0, 850.0, 1050.0, 649.0, 301.0, 143.0, 86.0, 46.0, 37.0, 22.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -25.75048828125, -24.3447265625, -22.93896484375, -21.533203125, -20.12744140625, -18.7216796875, -17.31591796875, -15.91015625, -14.50439453125, -13.0986328125, -11.69287109375, -10.287109375, -8.88134765625, -7.4755859375, -6.06982421875, -4.6640625, -3.25830078125, -1.8525390625, -0.44677734375, 0.958984375, 2.36474609375, 3.7705078125, 5.17626953125, 6.58203125, 7.98779296875, 9.3935546875, 10.79931640625, 12.205078125, 13.61083984375, 15.0166015625, 16.42236328125, 17.828125, 19.23388671875, 20.6396484375, 22.04541015625, 23.451171875, 24.85693359375, 26.2626953125, 27.66845703125, 29.07421875, 30.47998046875, 31.8857421875, 33.29150390625, 34.697265625, 36.10302734375, 37.5087890625, 38.91455078125, 40.3203125, 41.72607421875, 43.1318359375, 44.53759765625, 45.943359375, 47.34912109375, 48.7548828125, 50.16064453125, 51.56640625, 52.97216796875, 54.3779296875, 55.78369140625, 57.189453125, 58.59521484375, 60.0009765625, 61.40673828125, 62.8125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 11.0, 13.0, 20.0, 32.0, 60.0, 104.0, 249.0, 646.0, 4331.0, 4061637.0, 124892.0, 1441.0, 448.0, 179.0, 90.0, 43.0, 31.0, 15.0, 20.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-329.75, -322.38671875, -315.0234375, -307.66015625, -300.296875, -292.93359375, -285.5703125, -278.20703125, -270.84375, -263.48046875, -256.1171875, -248.75390625, -241.390625, -234.02734375, -226.6640625, -219.30078125, -211.9375, -204.57421875, -197.2109375, -189.84765625, -182.484375, -175.12109375, -167.7578125, -160.39453125, -153.03125, -145.66796875, -138.3046875, -130.94140625, -123.578125, -116.21484375, -108.8515625, -101.48828125, -94.125, -86.76171875, -79.3984375, -72.03515625, -64.671875, -57.30859375, -49.9453125, -42.58203125, -35.21875, -27.85546875, -20.4921875, -13.12890625, -5.765625, 1.59765625, 8.9609375, 16.32421875, 23.6875, 31.05078125, 38.4140625, 45.77734375, 53.140625, 60.50390625, 67.8671875, 75.23046875, 82.59375, 89.95703125, 97.3203125, 104.68359375, 112.046875, 119.41015625, 126.7734375, 134.13671875, 141.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 40.0, 94.0, 197.0, 285.0, 202.0, 113.0, 38.0, 24.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-355.6307067871094, -347.6522521972656, -339.6737976074219, -331.6953430175781, -323.7169189453125, -315.73846435546875, -307.760009765625, -299.78155517578125, -291.8031005859375, -283.82464599609375, -275.84619140625, -267.86773681640625, -259.8892822265625, -251.9108428955078, -243.93240356445312, -235.95394897460938, -227.97549438476562, -219.99703979492188, -212.01858520507812, -204.04014587402344, -196.0616912841797, -188.08323669433594, -180.10479736328125, -172.1263427734375, -164.14788818359375, -156.16943359375, -148.19097900390625, -140.21253967285156, -132.2340850830078, -124.25563049316406, -116.27718353271484, -108.29873657226562, -100.32029724121094, -92.34184265136719, -84.36339569091797, -76.38494873046875, -68.406494140625, -60.428043365478516, -52.44959259033203, -44.47114181518555, -36.49269104003906, -28.514240264892578, -20.535789489746094, -12.55733871459961, -4.578887939453125, 3.3995628356933594, 11.378013610839844, 19.356464385986328, 27.334915161132812, 35.3133659362793, 43.29181671142578, 51.270267486572266, 59.24871826171875, 67.2271728515625, 75.20561981201172, 83.18406677246094, 91.16252136230469, 99.14097595214844, 107.11942291259766, 115.09786987304688, 123.07632446289062, 131.05477905273438, 139.03323364257812, 147.0116729736328, 154.99012756347656]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 11.0, 11.0, 18.0, 20.0, 11.0, 26.0, 30.0, 32.0, 25.0, 26.0, 29.0, 33.0, 32.0, 39.0, 47.0, 40.0, 37.0, 47.0, 44.0, 48.0, 29.0, 35.0, 40.0, 29.0, 21.0, 33.0, 19.0, 21.0, 17.0, 14.0, 19.0, 11.0, 10.0, 12.0, 10.0, 5.0, 9.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.02896118164062, -75.58889770507812, -73.1488265991211, -70.70875549316406, -68.26869201660156, -65.82862854003906, -63.38855743408203, -60.948490142822266, -58.5084228515625, -56.068355560302734, -53.62828826904297, -51.1882209777832, -48.74815368652344, -46.30808639526367, -43.868019104003906, -41.42795181274414, -38.987884521484375, -36.54781723022461, -34.107749938964844, -31.667682647705078, -29.227615356445312, -26.787548065185547, -24.34748077392578, -21.907413482666016, -19.46734619140625, -17.027278900146484, -14.587211608886719, -12.147144317626953, -9.707077026367188, -7.267009735107422, -4.826942443847656, -2.3868751525878906, 0.053192138671875, 2.4932594299316406, 4.933326721191406, 7.373394012451172, 9.813461303710938, 12.253528594970703, 14.693595886230469, 17.133663177490234, 19.57373046875, 22.013797760009766, 24.45386505126953, 26.893932342529297, 29.333999633789062, 31.774066925048828, 34.214134216308594, 36.65420150756836, 39.094268798828125, 41.53433609008789, 43.974403381347656, 46.41447067260742, 48.85453796386719, 51.29460525512695, 53.73467254638672, 56.174739837646484, 58.61480712890625, 61.054874420166016, 63.49494171142578, 65.93501281738281, 68.37507629394531, 70.81513977050781, 73.25521087646484, 75.69528198242188, 78.13534545898438]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 6.0, 4.0, 6.0, 9.0, 15.0, 12.0, 12.0, 20.0, 20.0, 26.0, 24.0, 27.0, 28.0, 41.0, 34.0, 42.0, 43.0, 38.0, 41.0, 52.0, 43.0, 37.0, 37.0, 44.0, 32.0, 27.0, 47.0, 31.0, 27.0, 19.0, 19.0, 15.0, 22.0, 12.0, 11.0, 15.0, 10.0, 6.0, 9.0, 13.0, 0.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.265625, -12.83447265625, -12.4033203125, -11.97216796875, -11.541015625, -11.10986328125, -10.6787109375, -10.24755859375, -9.81640625, -9.38525390625, -8.9541015625, -8.52294921875, -8.091796875, -7.66064453125, -7.2294921875, -6.79833984375, -6.3671875, -5.93603515625, -5.5048828125, -5.07373046875, -4.642578125, -4.21142578125, -3.7802734375, -3.34912109375, -2.91796875, -2.48681640625, -2.0556640625, -1.62451171875, -1.193359375, -0.76220703125, -0.3310546875, 0.10009765625, 0.53125, 0.96240234375, 1.3935546875, 1.82470703125, 2.255859375, 2.68701171875, 3.1181640625, 3.54931640625, 3.98046875, 4.41162109375, 4.8427734375, 5.27392578125, 5.705078125, 6.13623046875, 6.5673828125, 6.99853515625, 7.4296875, 7.86083984375, 8.2919921875, 8.72314453125, 9.154296875, 9.58544921875, 10.0166015625, 10.44775390625, 10.87890625, 11.31005859375, 11.7412109375, 12.17236328125, 12.603515625, 13.03466796875, 13.4658203125, 13.89697265625, 14.328125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 7.0, 16.0, 14.0, 16.0, 30.0, 57.0, 47.0, 65.0, 98.0, 115.0, 208.0, 298.0, 419.0, 560.0, 815.0, 1073.0, 1652.0, 2395.0, 3436.0, 5203.0, 7661.0, 11775.0, 18419.0, 29264.0, 47035.0, 77668.0, 123369.0, 175577.0, 181923.0, 133307.0, 83893.0, 52063.0, 31786.0, 19458.0, 12816.0, 8256.0, 5576.0, 3738.0, 2581.0, 1785.0, 1186.0, 824.0, 608.0, 438.0, 310.0, 214.0, 138.0, 104.0, 63.0, 70.0, 48.0, 24.0, 22.0, 19.0, 14.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.9541015625, -1.8932037353515625, -1.832305908203125, -1.7714080810546875, -1.71051025390625, -1.6496124267578125, -1.588714599609375, -1.5278167724609375, -1.4669189453125, -1.4060211181640625, -1.345123291015625, -1.2842254638671875, -1.22332763671875, -1.1624298095703125, -1.101531982421875, -1.0406341552734375, -0.979736328125, -0.9188385009765625, -0.857940673828125, -0.7970428466796875, -0.73614501953125, -0.6752471923828125, -0.614349365234375, -0.5534515380859375, -0.4925537109375, -0.4316558837890625, -0.370758056640625, -0.3098602294921875, -0.24896240234375, -0.1880645751953125, -0.127166748046875, -0.0662689208984375, -0.00537109375, 0.0555267333984375, 0.116424560546875, 0.1773223876953125, 0.23822021484375, 0.2991180419921875, 0.360015869140625, 0.4209136962890625, 0.4818115234375, 0.5427093505859375, 0.603607177734375, 0.6645050048828125, 0.72540283203125, 0.7863006591796875, 0.847198486328125, 0.9080963134765625, 0.968994140625, 1.0298919677734375, 1.090789794921875, 1.1516876220703125, 1.21258544921875, 1.2734832763671875, 1.334381103515625, 1.3952789306640625, 1.4561767578125, 1.5170745849609375, 1.577972412109375, 1.6388702392578125, 1.69976806640625, 1.7606658935546875, 1.821563720703125, 1.8824615478515625, 1.943359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 9.0, 17.0, 15.0, 15.0, 29.0, 19.0, 17.0, 29.0, 24.0, 35.0, 31.0, 32.0, 34.0, 41.0, 28.0, 32.0, 1074.0, 43.0, 37.0, 37.0, 30.0, 23.0, 38.0, 35.0, 27.0, 21.0, 27.0, 26.0, 18.0, 12.0, 20.0, 15.0, 14.0, 11.0, 11.0, 9.0, 10.0, 6.0, 7.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.58203125, -7.30828857421875, -7.0345458984375, -6.76080322265625, -6.487060546875, -6.21331787109375, -5.9395751953125, -5.66583251953125, -5.39208984375, -5.11834716796875, -4.8446044921875, -4.57086181640625, -4.297119140625, -4.02337646484375, -3.7496337890625, -3.47589111328125, -3.2021484375, -2.92840576171875, -2.6546630859375, -2.38092041015625, -2.107177734375, -1.83343505859375, -1.5596923828125, -1.28594970703125, -1.01220703125, -0.73846435546875, -0.4647216796875, -0.19097900390625, 0.082763671875, 0.35650634765625, 0.6302490234375, 0.90399169921875, 1.177734375, 1.45147705078125, 1.7252197265625, 1.99896240234375, 2.272705078125, 2.54644775390625, 2.8201904296875, 3.09393310546875, 3.36767578125, 3.64141845703125, 3.9151611328125, 4.18890380859375, 4.462646484375, 4.73638916015625, 5.0101318359375, 5.28387451171875, 5.5576171875, 5.83135986328125, 6.1051025390625, 6.37884521484375, 6.652587890625, 6.92633056640625, 7.2000732421875, 7.47381591796875, 7.74755859375, 8.02130126953125, 8.2950439453125, 8.56878662109375, 8.842529296875, 9.11627197265625, 9.3900146484375, 9.66375732421875, 9.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 3.0, 4.0, 8.0, 14.0, 14.0, 24.0, 37.0, 58.0, 81.0, 90.0, 144.0, 203.0, 297.0, 420.0, 612.0, 878.0, 1225.0, 1790.0, 2556.0, 3815.0, 5557.0, 7992.0, 12076.0, 17665.0, 26861.0, 40769.0, 62201.0, 95199.0, 141202.0, 1223723.0, 149959.0, 102561.0, 67737.0, 43880.0, 28613.0, 18808.0, 12767.0, 8593.0, 5778.0, 4042.0, 2711.0, 1912.0, 1271.0, 916.0, 619.0, 424.0, 307.0, 219.0, 157.0, 113.0, 67.0, 43.0, 29.0, 23.0, 26.0, 15.0, 12.0, 7.0, 8.0, 1.0, 3.0], "bins": [-1.171875, -1.1359100341796875, -1.099945068359375, -1.0639801025390625, -1.02801513671875, -0.9920501708984375, -0.956085205078125, -0.9201202392578125, -0.8841552734375, -0.8481903076171875, -0.812225341796875, -0.7762603759765625, -0.74029541015625, -0.7043304443359375, -0.668365478515625, -0.6324005126953125, -0.596435546875, -0.5604705810546875, -0.524505615234375, -0.4885406494140625, -0.45257568359375, -0.4166107177734375, -0.380645751953125, -0.3446807861328125, -0.3087158203125, -0.2727508544921875, -0.236785888671875, -0.2008209228515625, -0.16485595703125, -0.1288909912109375, -0.092926025390625, -0.0569610595703125, -0.02099609375, 0.0149688720703125, 0.050933837890625, 0.0868988037109375, 0.12286376953125, 0.1588287353515625, 0.194793701171875, 0.2307586669921875, 0.2667236328125, 0.3026885986328125, 0.338653564453125, 0.3746185302734375, 0.41058349609375, 0.4465484619140625, 0.482513427734375, 0.5184783935546875, 0.554443359375, 0.5904083251953125, 0.626373291015625, 0.6623382568359375, 0.69830322265625, 0.7342681884765625, 0.770233154296875, 0.8061981201171875, 0.8421630859375, 0.8781280517578125, 0.914093017578125, 0.9500579833984375, 0.98602294921875, 1.0219879150390625, 1.057952880859375, 1.0939178466796875, 1.1298828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 2.0, 4.0, 3.0, 4.0, 7.0, 14.0, 22.0, 15.0, 16.0, 26.0, 31.0, 29.0, 31.0, 49.0, 53.0, 69.0, 90.0, 97.0, 72.0, 54.0, 47.0, 39.0, 22.0, 20.0, 19.0, 24.0, 16.0, 15.0, 16.0, 14.0, 16.0, 12.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02337646484375, -0.022624969482421875, -0.02187347412109375, -0.021121978759765625, -0.0203704833984375, -0.019618988037109375, -0.01886749267578125, -0.018115997314453125, -0.017364501953125, -0.016613006591796875, -0.01586151123046875, -0.015110015869140625, -0.0143585205078125, -0.013607025146484375, -0.01285552978515625, -0.012104034423828125, -0.0113525390625, -0.010601043701171875, -0.00984954833984375, -0.009098052978515625, -0.0083465576171875, -0.007595062255859375, -0.00684356689453125, -0.006092071533203125, -0.005340576171875, -0.004589080810546875, -0.00383758544921875, -0.003086090087890625, -0.0023345947265625, -0.001583099365234375, -0.00083160400390625, -8.0108642578125e-05, 0.00067138671875, 0.001422882080078125, 0.00217437744140625, 0.002925872802734375, 0.0036773681640625, 0.004428863525390625, 0.00518035888671875, 0.005931854248046875, 0.006683349609375, 0.007434844970703125, 0.00818634033203125, 0.008937835693359375, 0.0096893310546875, 0.010440826416015625, 0.01119232177734375, 0.011943817138671875, 0.0126953125, 0.013446807861328125, 0.01419830322265625, 0.014949798583984375, 0.0157012939453125, 0.016452789306640625, 0.01720428466796875, 0.017955780029296875, 0.018707275390625, 0.019458770751953125, 0.02021026611328125, 0.020961761474609375, 0.0217132568359375, 0.022464752197265625, 0.02321624755859375, 0.023967742919921875, 0.02471923828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 11.0, 4.0, 10.0, 17.0, 22.0, 20.0, 23.0, 27.0, 35.0, 57.0, 43.0, 70.0, 82.0, 150.0, 313.0, 743.0, 13045.0, 981130.0, 50563.0, 1190.0, 337.0, 204.0, 121.0, 75.0, 66.0, 37.0, 24.0, 29.0, 16.0, 21.0, 10.0, 9.0, 6.0, 4.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51318359375, -0.49745941162109375, -0.4817352294921875, -0.46601104736328125, -0.450286865234375, -0.43456268310546875, -0.4188385009765625, -0.40311431884765625, -0.38739013671875, -0.37166595458984375, -0.3559417724609375, -0.34021759033203125, -0.324493408203125, -0.30876922607421875, -0.2930450439453125, -0.27732086181640625, -0.2615966796875, -0.24587249755859375, -0.2301483154296875, -0.21442413330078125, -0.198699951171875, -0.18297576904296875, -0.1672515869140625, -0.15152740478515625, -0.13580322265625, -0.12007904052734375, -0.1043548583984375, -0.08863067626953125, -0.072906494140625, -0.05718231201171875, -0.0414581298828125, -0.02573394775390625, -0.010009765625, 0.00571441650390625, 0.0214385986328125, 0.03716278076171875, 0.052886962890625, 0.06861114501953125, 0.0843353271484375, 0.10005950927734375, 0.11578369140625, 0.13150787353515625, 0.1472320556640625, 0.16295623779296875, 0.178680419921875, 0.19440460205078125, 0.2101287841796875, 0.22585296630859375, 0.2415771484375, 0.25730133056640625, 0.2730255126953125, 0.28874969482421875, 0.304473876953125, 0.32019805908203125, 0.3359222412109375, 0.35164642333984375, 0.36737060546875, 0.38309478759765625, 0.3988189697265625, 0.41454315185546875, 0.430267333984375, 0.44599151611328125, 0.4617156982421875, 0.47743988037109375, 0.4931640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 74.0, 878.0, 60.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1237386167049408, -0.10448823124170303, -0.08523784577846527, -0.06598746031522751, -0.046737074851989746, -0.027486689388751984, -0.008236303925514221, 0.011014074087142944, 0.030264467000961304, 0.049514852464199066, 0.06876523792743683, 0.08801562339067459, 0.10726600885391235, 0.1265164017677307, 0.14576677978038788, 0.16501715779304504, 0.1842675507068634, 0.20351794362068176, 0.22276832163333893, 0.2420186996459961, 0.26126909255981445, 0.2805194854736328, 0.29976987838745117, 0.31902024149894714, 0.3382706344127655, 0.35752102732658386, 0.37677139043807983, 0.3960217833518982, 0.41527217626571655, 0.4345225691795349, 0.45377296209335327, 0.47302332520484924, 0.4922736883163452, 0.5115240812301636, 0.5307744741439819, 0.5500248670578003, 0.5692752599716187, 0.5885255932807922, 0.6077759861946106, 0.627026379108429, 0.6462767720222473, 0.6655271649360657, 0.684777557849884, 0.7040279507637024, 0.723278284072876, 0.7425286769866943, 0.7617790699005127, 0.781029462814331, 0.8002798557281494, 0.8195302486419678, 0.8387806415557861, 0.8580310344696045, 0.8772814273834229, 0.8965317606925964, 0.9157821536064148, 0.9350325465202332, 0.9542829394340515, 0.9735333323478699, 0.9927837252616882, 1.0120340585708618, 1.0312844514846802, 1.0505348443984985, 1.069785237312317, 1.0890356302261353, 1.1082860231399536]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 8.0, 8.0, 12.0, 10.0, 8.0, 15.0, 15.0, 19.0, 26.0, 25.0, 34.0, 30.0, 34.0, 36.0, 39.0, 50.0, 44.0, 37.0, 43.0, 42.0, 43.0, 39.0, 31.0, 47.0, 40.0, 34.0, 30.0, 30.0, 27.0, 27.0, 23.0, 18.0, 17.0, 10.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.05608034133911133, -0.05455788969993591, -0.0530354380607605, -0.051512982696294785, -0.04999053105711937, -0.048468079417943954, -0.04694562405347824, -0.045423172414302826, -0.04390072077512741, -0.042378269135951996, -0.04085581749677658, -0.03933336213231087, -0.03781091049313545, -0.03628845885396004, -0.034766003489494324, -0.03324355185031891, -0.031721100211143494, -0.03019864857196808, -0.028676195070147514, -0.02715374156832695, -0.025631289929151535, -0.02410883828997612, -0.022586384788155556, -0.02106393128633499, -0.019541479647159576, -0.01801902800798416, -0.016496574506163597, -0.014974121935665607, -0.013451669365167618, -0.011929216794669628, -0.010406764224171638, -0.008884311653673649, -0.007361859083175659, -0.0058394065126776695, -0.00431695394217968, -0.00279450137168169, -0.0012720488011837006, 0.0002504037693142891, 0.0017728563398122787, 0.0032953089103102684, 0.004817761480808258, 0.006340214051306248, 0.007862666621804237, 0.009385119192302227, 0.010907571762800217, 0.012430024333298206, 0.013952476903796196, 0.015474929474294186, 0.016997382044792175, 0.01851983368396759, 0.020042287185788155, 0.02156474068760872, 0.023087192326784134, 0.02460964396595955, 0.026132097467780113, 0.027654550969600677, 0.029177002608776093, 0.030699454247951508, 0.03222190588712692, 0.033744361251592636, 0.03526681289076805, 0.036789264529943466, 0.03831171989440918, 0.039834171533584595, 0.04135662317276001]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 6.0, 4.0, 6.0, 9.0, 15.0, 12.0, 12.0, 20.0, 20.0, 26.0, 24.0, 27.0, 28.0, 40.0, 35.0, 41.0, 43.0, 39.0, 41.0, 52.0, 42.0, 35.0, 40.0, 44.0, 32.0, 27.0, 47.0, 31.0, 27.0, 19.0, 19.0, 15.0, 22.0, 12.0, 11.0, 15.0, 10.0, 6.0, 8.0, 13.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.265625, -12.8345947265625, -12.403564453125, -11.9725341796875, -11.54150390625, -11.1104736328125, -10.679443359375, -10.2484130859375, -9.8173828125, -9.3863525390625, -8.955322265625, -8.5242919921875, -8.09326171875, -7.6622314453125, -7.231201171875, -6.8001708984375, -6.369140625, -5.9381103515625, -5.507080078125, -5.0760498046875, -4.64501953125, -4.2139892578125, -3.782958984375, -3.3519287109375, -2.9208984375, -2.4898681640625, -2.058837890625, -1.6278076171875, -1.19677734375, -0.7657470703125, -0.334716796875, 0.0963134765625, 0.52734375, 0.9583740234375, 1.389404296875, 1.8204345703125, 2.25146484375, 2.6824951171875, 3.113525390625, 3.5445556640625, 3.9755859375, 4.4066162109375, 4.837646484375, 5.2686767578125, 5.69970703125, 6.1307373046875, 6.561767578125, 6.9927978515625, 7.423828125, 7.8548583984375, 8.285888671875, 8.7169189453125, 9.14794921875, 9.5789794921875, 10.010009765625, 10.4410400390625, 10.8720703125, 11.3031005859375, 11.734130859375, 12.1651611328125, 12.59619140625, 13.0272216796875, 13.458251953125, 13.8892822265625, 14.3203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 9.0, 9.0, 12.0, 24.0, 31.0, 33.0, 59.0, 70.0, 102.0, 151.0, 254.0, 367.0, 629.0, 1105.0, 2096.0, 4636.0, 13537.0, 61674.0, 677438.0, 238463.0, 31887.0, 8535.0, 3418.0, 1650.0, 813.0, 510.0, 331.0, 188.0, 130.0, 86.0, 62.0, 62.0, 35.0, 22.0, 22.0, 15.0, 14.0, 11.0, 14.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-22.15625, -21.43701171875, -20.7177734375, -19.99853515625, -19.279296875, -18.56005859375, -17.8408203125, -17.12158203125, -16.40234375, -15.68310546875, -14.9638671875, -14.24462890625, -13.525390625, -12.80615234375, -12.0869140625, -11.36767578125, -10.6484375, -9.92919921875, -9.2099609375, -8.49072265625, -7.771484375, -7.05224609375, -6.3330078125, -5.61376953125, -4.89453125, -4.17529296875, -3.4560546875, -2.73681640625, -2.017578125, -1.29833984375, -0.5791015625, 0.14013671875, 0.859375, 1.57861328125, 2.2978515625, 3.01708984375, 3.736328125, 4.45556640625, 5.1748046875, 5.89404296875, 6.61328125, 7.33251953125, 8.0517578125, 8.77099609375, 9.490234375, 10.20947265625, 10.9287109375, 11.64794921875, 12.3671875, 13.08642578125, 13.8056640625, 14.52490234375, 15.244140625, 15.96337890625, 16.6826171875, 17.40185546875, 18.12109375, 18.84033203125, 19.5595703125, 20.27880859375, 20.998046875, 21.71728515625, 22.4365234375, 23.15576171875, 23.875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 14.0, 7.0, 16.0, 20.0, 21.0, 23.0, 18.0, 18.0, 28.0, 33.0, 43.0, 53.0, 54.0, 60.0, 153.0, 1821.0, 167.0, 67.0, 49.0, 49.0, 43.0, 45.0, 39.0, 17.0, 25.0, 23.0, 24.0, 22.0, 20.0, 10.0, 17.0, 10.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.20166015625, -37.7783203125, -36.35498046875, -34.931640625, -33.50830078125, -32.0849609375, -30.66162109375, -29.23828125, -27.81494140625, -26.3916015625, -24.96826171875, -23.544921875, -22.12158203125, -20.6982421875, -19.27490234375, -17.8515625, -16.42822265625, -15.0048828125, -13.58154296875, -12.158203125, -10.73486328125, -9.3115234375, -7.88818359375, -6.46484375, -5.04150390625, -3.6181640625, -2.19482421875, -0.771484375, 0.65185546875, 2.0751953125, 3.49853515625, 4.921875, 6.34521484375, 7.7685546875, 9.19189453125, 10.615234375, 12.03857421875, 13.4619140625, 14.88525390625, 16.30859375, 17.73193359375, 19.1552734375, 20.57861328125, 22.001953125, 23.42529296875, 24.8486328125, 26.27197265625, 27.6953125, 29.11865234375, 30.5419921875, 31.96533203125, 33.388671875, 34.81201171875, 36.2353515625, 37.65869140625, 39.08203125, 40.50537109375, 41.9287109375, 43.35205078125, 44.775390625, 46.19873046875, 47.6220703125, 49.04541015625, 50.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 8.0, 7.0, 4.0, 15.0, 18.0, 21.0, 28.0, 38.0, 34.0, 42.0, 68.0, 118.0, 202.0, 476.0, 2261.0, 2741268.0, 398352.0, 1824.0, 407.0, 186.0, 84.0, 61.0, 39.0, 24.0, 32.0, 29.0, 16.0, 15.0, 6.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.75, -138.607421875, -133.46484375, -128.322265625, -123.1796875, -118.037109375, -112.89453125, -107.751953125, -102.609375, -97.466796875, -92.32421875, -87.181640625, -82.0390625, -76.896484375, -71.75390625, -66.611328125, -61.46875, -56.326171875, -51.18359375, -46.041015625, -40.8984375, -35.755859375, -30.61328125, -25.470703125, -20.328125, -15.185546875, -10.04296875, -4.900390625, 0.2421875, 5.384765625, 10.52734375, 15.669921875, 20.8125, 25.955078125, 31.09765625, 36.240234375, 41.3828125, 46.525390625, 51.66796875, 56.810546875, 61.953125, 67.095703125, 72.23828125, 77.380859375, 82.5234375, 87.666015625, 92.80859375, 97.951171875, 103.09375, 108.236328125, 113.37890625, 118.521484375, 123.6640625, 128.806640625, 133.94921875, 139.091796875, 144.234375, 149.376953125, 154.51953125, 159.662109375, 164.8046875, 169.947265625, 175.08984375, 180.232421875, 185.375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 266.0, 726.0, 24.0], "bins": [-812.8474731445312, -799.777587890625, -786.707763671875, -773.6378784179688, -760.5680541992188, -747.4981689453125, -734.4283447265625, -721.3584594726562, -708.28857421875, -695.2186889648438, -682.1488647460938, -669.0789794921875, -656.0091552734375, -642.9392700195312, -629.869384765625, -616.799560546875, -603.729736328125, -590.6598510742188, -577.5900268554688, -564.5201416015625, -551.4503173828125, -538.3804321289062, -525.310546875, -512.24072265625, -499.17083740234375, -486.1009826660156, -473.0311279296875, -459.96124267578125, -446.8913879394531, -433.821533203125, -420.7516784667969, -407.68182373046875, -394.6119384765625, -381.5420837402344, -368.47222900390625, -355.40234375, -342.3324890136719, -329.26263427734375, -316.1927795410156, -303.1229248046875, -290.05303955078125, -276.9831848144531, -263.913330078125, -250.8434600830078, -237.77359008789062, -224.7037353515625, -211.63388061523438, -198.56402587890625, -185.49415588378906, -172.42430114746094, -159.35443115234375, -146.28457641601562, -133.2147216796875, -120.14485168457031, -107.07499694824219, -94.00513458251953, -80.93527221679688, -67.86540985107422, -54.79555130004883, -41.72569274902344, -28.65583038330078, -15.585968017578125, -2.51611328125, 10.553749084472656, 23.62360954284668]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 5.0, 4.0, 11.0, 4.0, 8.0, 21.0, 20.0, 19.0, 19.0, 23.0, 21.0, 37.0, 38.0, 31.0, 31.0, 37.0, 40.0, 43.0, 43.0, 36.0, 52.0, 30.0, 41.0, 32.0, 35.0, 29.0, 30.0, 28.0, 19.0, 26.0, 22.0, 25.0, 23.0, 19.0, 13.0, 14.0, 6.0, 12.0, 7.0, 7.0, 9.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-117.62258911132812, -114.00001525878906, -110.37743377685547, -106.75485229492188, -103.13227844238281, -99.50970458984375, -95.88712310791016, -92.26454162597656, -88.6419677734375, -85.01939392089844, -81.39681243896484, -77.77423095703125, -74.15165710449219, -70.52908325195312, -66.90650177001953, -63.2839241027832, -59.661346435546875, -56.03876876831055, -52.41619110107422, -48.79361343383789, -45.17103576660156, -41.548458099365234, -37.925880432128906, -34.30330276489258, -30.68072509765625, -27.058147430419922, -23.435569763183594, -19.812992095947266, -16.190414428710938, -12.56783676147461, -8.945259094238281, -5.322681427001953, -1.700103759765625, 1.9224739074707031, 5.545051574707031, 9.16762924194336, 12.790206909179688, 16.412784576416016, 20.035362243652344, 23.657939910888672, 27.280517578125, 30.903095245361328, 34.525672912597656, 38.148250579833984, 41.77082824707031, 45.39340591430664, 49.01598358154297, 52.6385612487793, 56.261138916015625, 59.88371658325195, 63.50629425048828, 67.12887573242188, 70.75144958496094, 74.3740234375, 77.9966049194336, 81.61918640136719, 85.24176025390625, 88.86433410644531, 92.4869155883789, 96.1094970703125, 99.73207092285156, 103.35464477539062, 106.97722625732422, 110.59980773925781, 114.22238159179688]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 4.0, 7.0, 8.0, 14.0, 18.0, 13.0, 20.0, 24.0, 27.0, 26.0, 27.0, 19.0, 48.0, 29.0, 34.0, 50.0, 47.0, 46.0, 42.0, 33.0, 41.0, 40.0, 46.0, 39.0, 36.0, 38.0, 29.0, 24.0, 17.0, 18.0, 23.0, 17.0, 15.0, 11.0, 11.0, 7.0, 2.0, 7.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.265625, -14.7945556640625, -14.323486328125, -13.8524169921875, -13.38134765625, -12.9102783203125, -12.439208984375, -11.9681396484375, -11.4970703125, -11.0260009765625, -10.554931640625, -10.0838623046875, -9.61279296875, -9.1417236328125, -8.670654296875, -8.1995849609375, -7.728515625, -7.2574462890625, -6.786376953125, -6.3153076171875, -5.84423828125, -5.3731689453125, -4.902099609375, -4.4310302734375, -3.9599609375, -3.4888916015625, -3.017822265625, -2.5467529296875, -2.07568359375, -1.6046142578125, -1.133544921875, -0.6624755859375, -0.19140625, 0.2796630859375, 0.750732421875, 1.2218017578125, 1.69287109375, 2.1639404296875, 2.635009765625, 3.1060791015625, 3.5771484375, 4.0482177734375, 4.519287109375, 4.9903564453125, 5.46142578125, 5.9324951171875, 6.403564453125, 6.8746337890625, 7.345703125, 7.8167724609375, 8.287841796875, 8.7589111328125, 9.22998046875, 9.7010498046875, 10.172119140625, 10.6431884765625, 11.1142578125, 11.5853271484375, 12.056396484375, 12.5274658203125, 12.99853515625, 13.4696044921875, 13.940673828125, 14.4117431640625, 14.8828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 8.0, 12.0, 26.0, 30.0, 42.0, 45.0, 80.0, 92.0, 120.0, 184.0, 263.0, 375.0, 561.0, 868.0, 1228.0, 2032.0, 3380.0, 5855.0, 10889.0, 22317.0, 59918.0, 198926.0, 727049.0, 1686282.0, 1018639.0, 305334.0, 88247.0, 30476.0, 13331.0, 7002.0, 3998.0, 2329.0, 1437.0, 938.0, 554.0, 445.0, 286.0, 197.0, 135.0, 92.0, 80.0, 34.0, 40.0, 31.0, 16.0, 19.0, 15.0, 10.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.40625, -17.859375, -17.3125, -16.765625, -16.21875, -15.671875, -15.125, -14.578125, -14.03125, -13.484375, -12.9375, -12.390625, -11.84375, -11.296875, -10.75, -10.203125, -9.65625, -9.109375, -8.5625, -8.015625, -7.46875, -6.921875, -6.375, -5.828125, -5.28125, -4.734375, -4.1875, -3.640625, -3.09375, -2.546875, -2.0, -1.453125, -0.90625, -0.359375, 0.1875, 0.734375, 1.28125, 1.828125, 2.375, 2.921875, 3.46875, 4.015625, 4.5625, 5.109375, 5.65625, 6.203125, 6.75, 7.296875, 7.84375, 8.390625, 8.9375, 9.484375, 10.03125, 10.578125, 11.125, 11.671875, 12.21875, 12.765625, 13.3125, 13.859375, 14.40625, 14.953125, 15.5, 16.046875, 16.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 9.0, 12.0, 9.0, 14.0, 18.0, 19.0, 22.0, 30.0, 36.0, 65.0, 64.0, 105.0, 126.0, 235.0, 317.0, 526.0, 670.0, 565.0, 436.0, 247.0, 161.0, 131.0, 74.0, 52.0, 32.0, 26.0, 14.0, 13.0, 9.0, 10.0, 11.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.765625, -29.825927734375, -28.88623046875, -27.946533203125, -27.0068359375, -26.067138671875, -25.12744140625, -24.187744140625, -23.248046875, -22.308349609375, -21.36865234375, -20.428955078125, -19.4892578125, -18.549560546875, -17.60986328125, -16.670166015625, -15.73046875, -14.790771484375, -13.85107421875, -12.911376953125, -11.9716796875, -11.031982421875, -10.09228515625, -9.152587890625, -8.212890625, -7.273193359375, -6.33349609375, -5.393798828125, -4.4541015625, -3.514404296875, -2.57470703125, -1.635009765625, -0.6953125, 0.244384765625, 1.18408203125, 2.123779296875, 3.0634765625, 4.003173828125, 4.94287109375, 5.882568359375, 6.822265625, 7.761962890625, 8.70166015625, 9.641357421875, 10.5810546875, 11.520751953125, 12.46044921875, 13.400146484375, 14.33984375, 15.279541015625, 16.21923828125, 17.158935546875, 18.0986328125, 19.038330078125, 19.97802734375, 20.917724609375, 21.857421875, 22.797119140625, 23.73681640625, 24.676513671875, 25.6162109375, 26.555908203125, 27.49560546875, 28.435302734375, 29.375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 16.0, 17.0, 26.0, 42.0, 61.0, 110.0, 199.0, 405.0, 1106.0, 6001.0, 112583.0, 3969315.0, 96469.0, 5717.0, 1116.0, 443.0, 206.0, 113.0, 73.0, 61.0, 39.0, 29.0, 23.0, 21.0, 14.0, 11.0, 11.0, 3.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.625, -110.126953125, -106.62890625, -103.130859375, -99.6328125, -96.134765625, -92.63671875, -89.138671875, -85.640625, -82.142578125, -78.64453125, -75.146484375, -71.6484375, -68.150390625, -64.65234375, -61.154296875, -57.65625, -54.158203125, -50.66015625, -47.162109375, -43.6640625, -40.166015625, -36.66796875, -33.169921875, -29.671875, -26.173828125, -22.67578125, -19.177734375, -15.6796875, -12.181640625, -8.68359375, -5.185546875, -1.6875, 1.810546875, 5.30859375, 8.806640625, 12.3046875, 15.802734375, 19.30078125, 22.798828125, 26.296875, 29.794921875, 33.29296875, 36.791015625, 40.2890625, 43.787109375, 47.28515625, 50.783203125, 54.28125, 57.779296875, 61.27734375, 64.775390625, 68.2734375, 71.771484375, 75.26953125, 78.767578125, 82.265625, 85.763671875, 89.26171875, 92.759765625, 96.2578125, 99.755859375, 103.25390625, 106.751953125, 110.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 26.0, 433.0, 523.0, 29.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1150.5728759765625, -1125.6065673828125, -1100.640380859375, -1075.674072265625, -1050.707763671875, -1025.7415771484375, -1000.7752685546875, -975.8089599609375, -950.8427124023438, -925.87646484375, -900.91015625, -875.9439086914062, -850.9776611328125, -826.0113525390625, -801.0451049804688, -776.078857421875, -751.112548828125, -726.1463012695312, -701.1799926757812, -676.2137451171875, -651.2474365234375, -626.2811889648438, -601.31494140625, -576.3486328125, -551.3823852539062, -526.4161376953125, -501.4498291015625, -476.48358154296875, -451.5173034667969, -426.551025390625, -401.58477783203125, -376.6184997558594, -351.65228271484375, -326.6860046386719, -301.7197265625, -276.75347900390625, -251.78720092773438, -226.8209228515625, -201.8546600341797, -176.88839721679688, -151.922119140625, -126.95584869384766, -101.98957824707031, -77.02330780029297, -52.057037353515625, -27.09076690673828, -2.1244964599609375, 22.841766357421875, 47.80804443359375, 72.7743148803711, 97.74058532714844, 122.70685577392578, 147.67312622070312, 172.639404296875, 197.6056671142578, 222.57192993164062, 247.5382080078125, 272.5044860839844, 297.47076416015625, 322.43701171875, 347.4032897949219, 372.36956787109375, 397.3358154296875, 422.3020935058594, 447.26837158203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 15.0, 17.0, 18.0, 9.0, 24.0, 29.0, 32.0, 25.0, 37.0, 46.0, 36.0, 47.0, 60.0, 53.0, 53.0, 58.0, 48.0, 49.0, 42.0, 49.0, 37.0, 29.0, 24.0, 28.0, 21.0, 16.0, 18.0, 21.0, 7.0, 11.0, 1.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.77984619140625, -95.31404113769531, -91.8482437133789, -88.38243865966797, -84.91664123535156, -81.45083618164062, -77.98503112792969, -74.51922607421875, -71.05342864990234, -67.5876235961914, -64.121826171875, -60.65602111816406, -57.19021987915039, -53.72441864013672, -50.25861358642578, -46.79281234741211, -43.32701110839844, -39.861209869384766, -36.395408630371094, -32.929603576660156, -29.463802337646484, -25.998001098632812, -22.532197952270508, -19.066394805908203, -15.600593566894531, -12.134791374206543, -8.668989181518555, -5.203186988830566, -1.7373847961425781, 1.7284164428710938, 5.194219589233398, 8.660022735595703, 12.125823974609375, 15.591626167297363, 19.05742835998535, 22.523231506347656, 25.989032745361328, 29.454833984375, 32.92063903808594, 36.38644027709961, 39.85224151611328, 43.31804275512695, 46.783843994140625, 50.24964904785156, 53.715450286865234, 57.181251525878906, 60.647056579589844, 64.11285400390625, 67.57865905761719, 71.04446411132812, 74.51026153564453, 77.97606658935547, 81.44186401367188, 84.90766906738281, 88.37347412109375, 91.83927917480469, 95.3050765991211, 98.77088165283203, 102.23667907714844, 105.70248413085938, 109.16828918457031, 112.63408660888672, 116.09989166259766, 119.56568908691406, 123.031494140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 13.0, 17.0, 12.0, 11.0, 22.0, 20.0, 24.0, 36.0, 35.0, 31.0, 54.0, 44.0, 55.0, 50.0, 53.0, 55.0, 52.0, 32.0, 32.0, 51.0, 41.0, 35.0, 22.0, 29.0, 24.0, 30.0, 19.0, 13.0, 16.0, 11.0, 5.0, 5.0, 8.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.7037353515625, -13.196533203125, -12.6893310546875, -12.18212890625, -11.6749267578125, -11.167724609375, -10.6605224609375, -10.1533203125, -9.6461181640625, -9.138916015625, -8.6317138671875, -8.12451171875, -7.6173095703125, -7.110107421875, -6.6029052734375, -6.095703125, -5.5885009765625, -5.081298828125, -4.5740966796875, -4.06689453125, -3.5596923828125, -3.052490234375, -2.5452880859375, -2.0380859375, -1.5308837890625, -1.023681640625, -0.5164794921875, -0.00927734375, 0.4979248046875, 1.005126953125, 1.5123291015625, 2.01953125, 2.5267333984375, 3.033935546875, 3.5411376953125, 4.04833984375, 4.5555419921875, 5.062744140625, 5.5699462890625, 6.0771484375, 6.5843505859375, 7.091552734375, 7.5987548828125, 8.10595703125, 8.6131591796875, 9.120361328125, 9.6275634765625, 10.134765625, 10.6419677734375, 11.149169921875, 11.6563720703125, 12.16357421875, 12.6707763671875, 13.177978515625, 13.6851806640625, 14.1923828125, 14.6995849609375, 15.206787109375, 15.7139892578125, 16.22119140625, 16.7283935546875, 17.235595703125, 17.7427978515625, 18.25]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 14.0, 23.0, 27.0, 43.0, 55.0, 107.0, 169.0, 265.0, 406.0, 616.0, 851.0, 1424.0, 2191.0, 3434.0, 5567.0, 8972.0, 14853.0, 24761.0, 41263.0, 69968.0, 117109.0, 186663.0, 209607.0, 144082.0, 86403.0, 51134.0, 30630.0, 18339.0, 11171.0, 6719.0, 4169.0, 2611.0, 1720.0, 1111.0, 707.0, 482.0, 323.0, 210.0, 115.0, 86.0, 51.0, 35.0, 23.0, 8.0, 11.0, 4.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.07958984375, -2.0107421875, -1.94189453125, -1.873046875, -1.80419921875, -1.7353515625, -1.66650390625, -1.59765625, -1.52880859375, -1.4599609375, -1.39111328125, -1.322265625, -1.25341796875, -1.1845703125, -1.11572265625, -1.046875, -0.97802734375, -0.9091796875, -0.84033203125, -0.771484375, -0.70263671875, -0.6337890625, -0.56494140625, -0.49609375, -0.42724609375, -0.3583984375, -0.28955078125, -0.220703125, -0.15185546875, -0.0830078125, -0.01416015625, 0.0546875, 0.12353515625, 0.1923828125, 0.26123046875, 0.330078125, 0.39892578125, 0.4677734375, 0.53662109375, 0.60546875, 0.67431640625, 0.7431640625, 0.81201171875, 0.880859375, 0.94970703125, 1.0185546875, 1.08740234375, 1.15625, 1.22509765625, 1.2939453125, 1.36279296875, 1.431640625, 1.50048828125, 1.5693359375, 1.63818359375, 1.70703125, 1.77587890625, 1.8447265625, 1.91357421875, 1.982421875, 2.05126953125, 2.1201171875, 2.18896484375, 2.2578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 5.0, 14.0, 11.0, 13.0, 12.0, 23.0, 20.0, 25.0, 31.0, 33.0, 33.0, 30.0, 26.0, 35.0, 41.0, 36.0, 39.0, 1054.0, 53.0, 43.0, 48.0, 28.0, 42.0, 35.0, 23.0, 33.0, 31.0, 24.0, 18.0, 20.0, 14.0, 17.0, 17.0, 13.0, 3.0, 8.0, 13.0, 5.0, 6.0, 5.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.634765625, -9.34765625, -9.060546875, -8.7734375, -8.486328125, -8.19921875, -7.912109375, -7.625, -7.337890625, -7.05078125, -6.763671875, -6.4765625, -6.189453125, -5.90234375, -5.615234375, -5.328125, -5.041015625, -4.75390625, -4.466796875, -4.1796875, -3.892578125, -3.60546875, -3.318359375, -3.03125, -2.744140625, -2.45703125, -2.169921875, -1.8828125, -1.595703125, -1.30859375, -1.021484375, -0.734375, -0.447265625, -0.16015625, 0.126953125, 0.4140625, 0.701171875, 0.98828125, 1.275390625, 1.5625, 1.849609375, 2.13671875, 2.423828125, 2.7109375, 2.998046875, 3.28515625, 3.572265625, 3.859375, 4.146484375, 4.43359375, 4.720703125, 5.0078125, 5.294921875, 5.58203125, 5.869140625, 6.15625, 6.443359375, 6.73046875, 7.017578125, 7.3046875, 7.591796875, 7.87890625, 8.166015625, 8.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 5.0, 12.0, 7.0, 19.0, 20.0, 23.0, 43.0, 67.0, 81.0, 105.0, 208.0, 266.0, 409.0, 554.0, 882.0, 1328.0, 1923.0, 3022.0, 4393.0, 6857.0, 10556.0, 16352.0, 26342.0, 42460.0, 69051.0, 110669.0, 167418.0, 1239147.0, 145560.0, 93444.0, 57842.0, 35542.0, 22284.0, 13977.0, 8907.0, 5825.0, 3834.0, 2489.0, 1668.0, 1128.0, 776.0, 497.0, 363.0, 247.0, 158.0, 132.0, 81.0, 56.0, 35.0, 23.0, 22.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2548828125, -1.214813232421875, -1.17474365234375, -1.134674072265625, -1.0946044921875, -1.054534912109375, -1.01446533203125, -0.974395751953125, -0.934326171875, -0.894256591796875, -0.85418701171875, -0.814117431640625, -0.7740478515625, -0.733978271484375, -0.69390869140625, -0.653839111328125, -0.61376953125, -0.573699951171875, -0.53363037109375, -0.493560791015625, -0.4534912109375, -0.413421630859375, -0.37335205078125, -0.333282470703125, -0.293212890625, -0.253143310546875, -0.21307373046875, -0.173004150390625, -0.1329345703125, -0.092864990234375, -0.05279541015625, -0.012725830078125, 0.02734375, 0.067413330078125, 0.10748291015625, 0.147552490234375, 0.1876220703125, 0.227691650390625, 0.26776123046875, 0.307830810546875, 0.347900390625, 0.387969970703125, 0.42803955078125, 0.468109130859375, 0.5081787109375, 0.548248291015625, 0.58831787109375, 0.628387451171875, 0.66845703125, 0.708526611328125, 0.74859619140625, 0.788665771484375, 0.8287353515625, 0.868804931640625, 0.90887451171875, 0.948944091796875, 0.989013671875, 1.029083251953125, 1.06915283203125, 1.109222412109375, 1.1492919921875, 1.189361572265625, 1.22943115234375, 1.269500732421875, 1.3095703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 2.0, 9.0, 10.0, 6.0, 11.0, 5.0, 8.0, 9.0, 20.0, 16.0, 33.0, 41.0, 47.0, 68.0, 80.0, 91.0, 132.0, 85.0, 64.0, 56.0, 48.0, 25.0, 27.0, 26.0, 13.0, 19.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.044281005859375, -0.043055057525634766, -0.04182910919189453, -0.0406031608581543, -0.03937721252441406, -0.03815126419067383, -0.036925315856933594, -0.03569936752319336, -0.034473419189453125, -0.03324747085571289, -0.032021522521972656, -0.030795574188232422, -0.029569625854492188, -0.028343677520751953, -0.02711772918701172, -0.025891780853271484, -0.02466583251953125, -0.023439884185791016, -0.02221393585205078, -0.020987987518310547, -0.019762039184570312, -0.018536090850830078, -0.017310142517089844, -0.01608419418334961, -0.014858245849609375, -0.01363229751586914, -0.012406349182128906, -0.011180400848388672, -0.009954452514648438, -0.008728504180908203, -0.007502555847167969, -0.006276607513427734, -0.0050506591796875, -0.0038247108459472656, -0.0025987625122070312, -0.0013728141784667969, -0.0001468658447265625, 0.0010790824890136719, 0.0023050308227539062, 0.0035309791564941406, 0.004756927490234375, 0.005982875823974609, 0.007208824157714844, 0.008434772491455078, 0.009660720825195312, 0.010886669158935547, 0.012112617492675781, 0.013338565826416016, 0.01456451416015625, 0.015790462493896484, 0.01701641082763672, 0.018242359161376953, 0.019468307495117188, 0.020694255828857422, 0.021920204162597656, 0.02314615249633789, 0.024372100830078125, 0.02559804916381836, 0.026823997497558594, 0.028049945831298828, 0.029275894165039062, 0.030501842498779297, 0.03172779083251953, 0.032953739166259766, 0.0341796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 15.0, 9.0, 26.0, 23.0, 32.0, 52.0, 87.0, 131.0, 208.0, 437.0, 3663.0, 1036305.0, 6359.0, 521.0, 242.0, 127.0, 77.0, 42.0, 40.0, 23.0, 19.0, 14.0, 18.0, 12.0, 15.0, 8.0, 5.0, 4.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.7218399047851562, -0.6946563720703125, -0.6674728393554688, -0.640289306640625, -0.6131057739257812, -0.5859222412109375, -0.5587387084960938, -0.53155517578125, -0.5043716430664062, -0.4771881103515625, -0.45000457763671875, -0.422821044921875, -0.39563751220703125, -0.3684539794921875, -0.34127044677734375, -0.3140869140625, -0.28690338134765625, -0.2597198486328125, -0.23253631591796875, -0.205352783203125, -0.17816925048828125, -0.1509857177734375, -0.12380218505859375, -0.09661865234375, -0.06943511962890625, -0.0422515869140625, -0.01506805419921875, 0.012115478515625, 0.03929901123046875, 0.0664825439453125, 0.09366607666015625, 0.120849609375, 0.14803314208984375, 0.1752166748046875, 0.20240020751953125, 0.229583740234375, 0.25676727294921875, 0.2839508056640625, 0.31113433837890625, 0.33831787109375, 0.36550140380859375, 0.3926849365234375, 0.41986846923828125, 0.447052001953125, 0.47423553466796875, 0.5014190673828125, 0.5286026000976562, 0.5557861328125, 0.5829696655273438, 0.6101531982421875, 0.6373367309570312, 0.664520263671875, 0.6917037963867188, 0.7188873291015625, 0.7460708618164062, 0.77325439453125, 0.8004379272460938, 0.8276214599609375, 0.8548049926757812, 0.881988525390625, 0.9091720581054688, 0.9363555908203125, 0.9635391235351562, 0.99072265625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 36.0, 960.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1442357897758484, -0.11770550906658173, -0.09117522090673447, -0.06464493274688721, -0.038114652037620544, -0.011584371328353882, 0.014945924282073975, 0.04147620499134064, 0.0680064857006073, 0.09453676640987396, 0.12106705456972122, 0.14759734272956848, 0.17412762343883514, 0.2006579041481018, 0.22718819975852966, 0.2537184953689575, 0.280248761177063, 0.30677905678749084, 0.3333093225955963, 0.35983961820602417, 0.38636988401412964, 0.4129001796245575, 0.43943047523498535, 0.4659607410430908, 0.4924910366535187, 0.5190213322639465, 0.545551598072052, 0.5720819234848022, 0.5986121892929077, 0.6251424551010132, 0.6516727209091187, 0.6782030463218689, 0.7047333717346191, 0.7312636375427246, 0.7577939629554749, 0.7843242287635803, 0.8108544945716858, 0.837384819984436, 0.8639150857925415, 0.890445351600647, 0.9169756174087524, 0.9435058832168579, 0.9700362086296082, 0.9965664744377136, 1.0230967998504639, 1.0496270656585693, 1.0761573314666748, 1.1026875972747803, 1.1292178630828857, 1.1557481288909912, 1.1822783946990967, 1.2088086605072021, 1.2353390455245972, 1.2618693113327026, 1.288399577140808, 1.3149298429489136, 1.3414602279663086, 1.367990493774414, 1.3945207595825195, 1.421051025390625, 1.44758141040802, 1.4741116762161255, 1.500641942024231, 1.5271722078323364, 1.553702473640442]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 10.0, 11.0, 12.0, 17.0, 22.0, 26.0, 24.0, 24.0, 39.0, 38.0, 26.0, 41.0, 37.0, 41.0, 54.0, 36.0, 41.0, 38.0, 40.0, 49.0, 29.0, 41.0, 35.0, 31.0, 30.0, 38.0, 31.0, 20.0, 23.0, 16.0, 15.0, 13.0, 10.0, 13.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07374215126037598, -0.07173891365528107, -0.06973568350076675, -0.06773245334625244, -0.06572921574115753, -0.06372597813606262, -0.06172274798154831, -0.0597195141017437, -0.05771628022193909, -0.055713046342134476, -0.053709812462329865, -0.05170657858252525, -0.04970334470272064, -0.04770011082291603, -0.04569687694311142, -0.04369364306330681, -0.0416904091835022, -0.039687175303697586, -0.037683941423892975, -0.035680707544088364, -0.03367747366428375, -0.03167423978447914, -0.02967100590467453, -0.02766777202486992, -0.025664538145065308, -0.023661304265260696, -0.021658070385456085, -0.019654836505651474, -0.017651602625846863, -0.01564836874604225, -0.01364513486623764, -0.01164190098643303, -0.009638667106628418, -0.007635433226823807, -0.0056321993470191956, -0.0036289654672145844, -0.0016257315874099731, 0.00037750229239463806, 0.0023807361721992493, 0.0043839700520038605, 0.006387203931808472, 0.008390437811613083, 0.010393671691417694, 0.012396905571222305, 0.014400139451026917, 0.016403373330831528, 0.01840660721063614, 0.02040984109044075, 0.02241307497024536, 0.024416308850049973, 0.026419542729854584, 0.028422776609659195, 0.030426010489463806, 0.03242924436926842, 0.03443247824907303, 0.03643571212887764, 0.03843894600868225, 0.04044217988848686, 0.04244541376829147, 0.044448647648096085, 0.046451881527900696, 0.04845511540770531, 0.05045834928750992, 0.05246158316731453, 0.05446481704711914]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 7.0, 11.0, 12.0, 17.0, 12.0, 11.0, 22.0, 20.0, 26.0, 34.0, 35.0, 32.0, 54.0, 44.0, 54.0, 50.0, 54.0, 54.0, 52.0, 32.0, 33.0, 50.0, 41.0, 35.0, 23.0, 28.0, 24.0, 30.0, 21.0, 11.0, 16.0, 11.0, 5.0, 5.0, 8.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.203125, -13.696044921875, -13.18896484375, -12.681884765625, -12.1748046875, -11.667724609375, -11.16064453125, -10.653564453125, -10.146484375, -9.639404296875, -9.13232421875, -8.625244140625, -8.1181640625, -7.611083984375, -7.10400390625, -6.596923828125, -6.08984375, -5.582763671875, -5.07568359375, -4.568603515625, -4.0615234375, -3.554443359375, -3.04736328125, -2.540283203125, -2.033203125, -1.526123046875, -1.01904296875, -0.511962890625, -0.0048828125, 0.502197265625, 1.00927734375, 1.516357421875, 2.0234375, 2.530517578125, 3.03759765625, 3.544677734375, 4.0517578125, 4.558837890625, 5.06591796875, 5.572998046875, 6.080078125, 6.587158203125, 7.09423828125, 7.601318359375, 8.1083984375, 8.615478515625, 9.12255859375, 9.629638671875, 10.13671875, 10.643798828125, 11.15087890625, 11.657958984375, 12.1650390625, 12.672119140625, 13.17919921875, 13.686279296875, 14.193359375, 14.700439453125, 15.20751953125, 15.714599609375, 16.2216796875, 16.728759765625, 17.23583984375, 17.742919921875, 18.25]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 12.0, 25.0, 21.0, 36.0, 65.0, 93.0, 136.0, 150.0, 263.0, 387.0, 631.0, 857.0, 1378.0, 2014.0, 3358.0, 5242.0, 9191.0, 17222.0, 38868.0, 122026.0, 549409.0, 195396.0, 52274.0, 21456.0, 10897.0, 6284.0, 3846.0, 2411.0, 1492.0, 1047.0, 704.0, 468.0, 275.0, 186.0, 121.0, 99.0, 59.0, 45.0, 35.0, 14.0, 21.0, 7.0, 7.0, 2.0, 7.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.46875, -17.88525390625, -17.3017578125, -16.71826171875, -16.134765625, -15.55126953125, -14.9677734375, -14.38427734375, -13.80078125, -13.21728515625, -12.6337890625, -12.05029296875, -11.466796875, -10.88330078125, -10.2998046875, -9.71630859375, -9.1328125, -8.54931640625, -7.9658203125, -7.38232421875, -6.798828125, -6.21533203125, -5.6318359375, -5.04833984375, -4.46484375, -3.88134765625, -3.2978515625, -2.71435546875, -2.130859375, -1.54736328125, -0.9638671875, -0.38037109375, 0.203125, 0.78662109375, 1.3701171875, 1.95361328125, 2.537109375, 3.12060546875, 3.7041015625, 4.28759765625, 4.87109375, 5.45458984375, 6.0380859375, 6.62158203125, 7.205078125, 7.78857421875, 8.3720703125, 8.95556640625, 9.5390625, 10.12255859375, 10.7060546875, 11.28955078125, 11.873046875, 12.45654296875, 13.0400390625, 13.62353515625, 14.20703125, 14.79052734375, 15.3740234375, 15.95751953125, 16.541015625, 17.12451171875, 17.7080078125, 18.29150390625, 18.875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 0.0, 5.0, 6.0, 13.0, 6.0, 7.0, 13.0, 11.0, 23.0, 28.0, 17.0, 31.0, 37.0, 29.0, 40.0, 34.0, 42.0, 58.0, 69.0, 212.0, 1696.0, 185.0, 71.0, 49.0, 40.0, 35.0, 35.0, 32.0, 22.0, 30.0, 23.0, 28.0, 20.0, 13.0, 9.0, 19.0, 13.0, 13.0, 5.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-47.25, -45.87841796875, -44.5068359375, -43.13525390625, -41.763671875, -40.39208984375, -39.0205078125, -37.64892578125, -36.27734375, -34.90576171875, -33.5341796875, -32.16259765625, -30.791015625, -29.41943359375, -28.0478515625, -26.67626953125, -25.3046875, -23.93310546875, -22.5615234375, -21.18994140625, -19.818359375, -18.44677734375, -17.0751953125, -15.70361328125, -14.33203125, -12.96044921875, -11.5888671875, -10.21728515625, -8.845703125, -7.47412109375, -6.1025390625, -4.73095703125, -3.359375, -1.98779296875, -0.6162109375, 0.75537109375, 2.126953125, 3.49853515625, 4.8701171875, 6.24169921875, 7.61328125, 8.98486328125, 10.3564453125, 11.72802734375, 13.099609375, 14.47119140625, 15.8427734375, 17.21435546875, 18.5859375, 19.95751953125, 21.3291015625, 22.70068359375, 24.072265625, 25.44384765625, 26.8154296875, 28.18701171875, 29.55859375, 30.93017578125, 32.3017578125, 33.67333984375, 35.044921875, 36.41650390625, 37.7880859375, 39.15966796875, 40.53125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 6.0, 13.0, 16.0, 27.0, 19.0, 29.0, 37.0, 61.0, 62.0, 97.0, 127.0, 197.0, 465.0, 1394.0, 7735.0, 103960.0, 2984984.0, 39871.0, 4650.0, 1029.0, 302.0, 166.0, 116.0, 86.0, 52.0, 46.0, 28.0, 20.0, 22.0, 19.0, 11.0, 10.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-91.0625, -88.412109375, -85.76171875, -83.111328125, -80.4609375, -77.810546875, -75.16015625, -72.509765625, -69.859375, -67.208984375, -64.55859375, -61.908203125, -59.2578125, -56.607421875, -53.95703125, -51.306640625, -48.65625, -46.005859375, -43.35546875, -40.705078125, -38.0546875, -35.404296875, -32.75390625, -30.103515625, -27.453125, -24.802734375, -22.15234375, -19.501953125, -16.8515625, -14.201171875, -11.55078125, -8.900390625, -6.25, -3.599609375, -0.94921875, 1.701171875, 4.3515625, 7.001953125, 9.65234375, 12.302734375, 14.953125, 17.603515625, 20.25390625, 22.904296875, 25.5546875, 28.205078125, 30.85546875, 33.505859375, 36.15625, 38.806640625, 41.45703125, 44.107421875, 46.7578125, 49.408203125, 52.05859375, 54.708984375, 57.359375, 60.009765625, 62.66015625, 65.310546875, 67.9609375, 70.611328125, 73.26171875, 75.912109375, 78.5625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 15.0, 21.0, 64.0, 147.0, 206.0, 223.0, 177.0, 89.0, 36.0, 13.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.734901428222656, -44.575138092041016, -41.41537857055664, -38.255615234375, -35.095855712890625, -31.936092376708984, -28.776329040527344, -25.616567611694336, -22.456806182861328, -19.29704475402832, -16.137283325195312, -12.977519989013672, -9.817758560180664, -6.657997131347656, -3.4982337951660156, -0.3384723663330078, 2.8212890625, 5.981050968170166, 9.140812873840332, 12.300575256347656, 15.460336685180664, 18.620098114013672, 21.779861450195312, 24.93962287902832, 28.099384307861328, 31.259145736694336, 34.418907165527344, 37.578670501708984, 40.738433837890625, 43.898193359375, 47.05795669555664, 50.21772003173828, 53.377471923828125, 56.537235260009766, 59.69699478149414, 62.85675811767578, 66.01651763916016, 69.17628479003906, 72.33604431152344, 75.49580383300781, 78.65556335449219, 81.81532287597656, 84.97509002685547, 88.13484954833984, 91.29460906982422, 94.45437622070312, 97.6141357421875, 100.77389526367188, 103.93366241455078, 107.09342193603516, 110.25318908691406, 113.41294860839844, 116.57270812988281, 119.73246765136719, 122.8922348022461, 126.05199432373047, 129.21176147460938, 132.37152099609375, 135.53128051757812, 138.6910400390625, 141.85081481933594, 145.0105743408203, 148.1703338623047, 151.33009338378906, 154.48985290527344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 19.0, 9.0, 16.0, 14.0, 26.0, 32.0, 26.0, 28.0, 32.0, 42.0, 40.0, 29.0, 57.0, 36.0, 46.0, 33.0, 39.0, 51.0, 36.0, 42.0, 40.0, 32.0, 21.0, 26.0, 24.0, 18.0, 24.0, 16.0, 15.0, 9.0, 15.0, 14.0, 14.0, 9.0, 5.0, 7.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.84426879882812, -109.51905822753906, -106.19384765625, -102.86863708496094, -99.5434341430664, -96.21822357177734, -92.89301300048828, -89.56780242919922, -86.24259185791016, -82.9173812866211, -79.59217071533203, -76.2669677734375, -72.94175720214844, -69.61654663085938, -66.29133605957031, -62.96612548828125, -59.64091873168945, -56.31570816040039, -52.990501403808594, -49.66529083251953, -46.34008026123047, -43.014869689941406, -39.68966293334961, -36.36445236206055, -33.03924560546875, -29.71403694152832, -26.388826370239258, -23.063617706298828, -19.738407135009766, -16.413198471069336, -13.087989807128906, -9.762779235839844, -6.437568664550781, -3.1123592853546143, 0.21285009384155273, 3.5380592346191406, 6.863268852233887, 10.188478469848633, 13.513687133789062, 16.838897705078125, 20.164106369018555, 23.489315032958984, 26.814525604248047, 30.139734268188477, 33.464942932128906, 36.79015350341797, 40.11536407470703, 43.440574645996094, 46.76578140258789, 50.09099197387695, 53.41619873046875, 56.74140930175781, 60.066619873046875, 63.39183044433594, 66.717041015625, 70.04225158691406, 73.3674545288086, 76.69266510009766, 80.01787567138672, 83.34307861328125, 86.66828918457031, 89.99349975585938, 93.31871032714844, 96.6439208984375, 99.96913146972656]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 8.0, 14.0, 15.0, 14.0, 9.0, 9.0, 18.0, 28.0, 24.0, 34.0, 25.0, 35.0, 52.0, 52.0, 41.0, 43.0, 56.0, 53.0, 48.0, 36.0, 42.0, 37.0, 29.0, 43.0, 28.0, 34.0, 18.0, 17.0, 16.0, 25.0, 14.0, 12.0, 5.0, 14.0, 2.0, 5.0, 9.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.9180908203125, -12.422119140625, -11.9261474609375, -11.43017578125, -10.9342041015625, -10.438232421875, -9.9422607421875, -9.4462890625, -8.9503173828125, -8.454345703125, -7.9583740234375, -7.46240234375, -6.9664306640625, -6.470458984375, -5.9744873046875, -5.478515625, -4.9825439453125, -4.486572265625, -3.9906005859375, -3.49462890625, -2.9986572265625, -2.502685546875, -2.0067138671875, -1.5107421875, -1.0147705078125, -0.518798828125, -0.0228271484375, 0.47314453125, 0.9691162109375, 1.465087890625, 1.9610595703125, 2.45703125, 2.9530029296875, 3.448974609375, 3.9449462890625, 4.44091796875, 4.9368896484375, 5.432861328125, 5.9288330078125, 6.4248046875, 6.9207763671875, 7.416748046875, 7.9127197265625, 8.40869140625, 8.9046630859375, 9.400634765625, 9.8966064453125, 10.392578125, 10.8885498046875, 11.384521484375, 11.8804931640625, 12.37646484375, 12.8724365234375, 13.368408203125, 13.8643798828125, 14.3603515625, 14.8563232421875, 15.352294921875, 15.8482666015625, 16.34423828125, 16.8402099609375, 17.336181640625, 17.8321533203125, 18.328125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 28.0, 22.0, 27.0, 53.0, 36.0, 69.0, 109.0, 125.0, 191.0, 267.0, 426.0, 621.0, 1023.0, 1844.0, 3525.0, 6804.0, 15238.0, 42193.0, 205703.0, 1542045.0, 2007388.0, 281362.0, 50585.0, 17529.0, 7731.0, 3885.0, 2101.0, 1175.0, 672.0, 440.0, 293.0, 184.0, 131.0, 98.0, 71.0, 58.0, 51.0, 34.0, 24.0, 23.0, 22.0, 13.0, 6.0, 7.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-26.875, -26.01025390625, -25.1455078125, -24.28076171875, -23.416015625, -22.55126953125, -21.6865234375, -20.82177734375, -19.95703125, -19.09228515625, -18.2275390625, -17.36279296875, -16.498046875, -15.63330078125, -14.7685546875, -13.90380859375, -13.0390625, -12.17431640625, -11.3095703125, -10.44482421875, -9.580078125, -8.71533203125, -7.8505859375, -6.98583984375, -6.12109375, -5.25634765625, -4.3916015625, -3.52685546875, -2.662109375, -1.79736328125, -0.9326171875, -0.06787109375, 0.796875, 1.66162109375, 2.5263671875, 3.39111328125, 4.255859375, 5.12060546875, 5.9853515625, 6.85009765625, 7.71484375, 8.57958984375, 9.4443359375, 10.30908203125, 11.173828125, 12.03857421875, 12.9033203125, 13.76806640625, 14.6328125, 15.49755859375, 16.3623046875, 17.22705078125, 18.091796875, 18.95654296875, 19.8212890625, 20.68603515625, 21.55078125, 22.41552734375, 23.2802734375, 24.14501953125, 25.009765625, 25.87451171875, 26.7392578125, 27.60400390625, 28.46875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 19.0, 24.0, 21.0, 24.0, 46.0, 78.0, 91.0, 164.0, 255.0, 516.0, 803.0, 784.0, 495.0, 282.0, 149.0, 81.0, 64.0, 53.0, 31.0, 21.0, 16.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.58837890625, -40.3642578125, -39.14013671875, -37.916015625, -36.69189453125, -35.4677734375, -34.24365234375, -33.01953125, -31.79541015625, -30.5712890625, -29.34716796875, -28.123046875, -26.89892578125, -25.6748046875, -24.45068359375, -23.2265625, -22.00244140625, -20.7783203125, -19.55419921875, -18.330078125, -17.10595703125, -15.8818359375, -14.65771484375, -13.43359375, -12.20947265625, -10.9853515625, -9.76123046875, -8.537109375, -7.31298828125, -6.0888671875, -4.86474609375, -3.640625, -2.41650390625, -1.1923828125, 0.03173828125, 1.255859375, 2.47998046875, 3.7041015625, 4.92822265625, 6.15234375, 7.37646484375, 8.6005859375, 9.82470703125, 11.048828125, 12.27294921875, 13.4970703125, 14.72119140625, 15.9453125, 17.16943359375, 18.3935546875, 19.61767578125, 20.841796875, 22.06591796875, 23.2900390625, 24.51416015625, 25.73828125, 26.96240234375, 28.1865234375, 29.41064453125, 30.634765625, 31.85888671875, 33.0830078125, 34.30712890625, 35.53125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 13.0, 24.0, 54.0, 72.0, 108.0, 207.0, 498.0, 1584.0, 8216.0, 174524.0, 3943099.0, 58996.0, 4922.0, 1049.0, 410.0, 172.0, 106.0, 54.0, 33.0, 35.0, 26.0, 13.0, 13.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.375, -121.24609375, -117.1171875, -112.98828125, -108.859375, -104.73046875, -100.6015625, -96.47265625, -92.34375, -88.21484375, -84.0859375, -79.95703125, -75.828125, -71.69921875, -67.5703125, -63.44140625, -59.3125, -55.18359375, -51.0546875, -46.92578125, -42.796875, -38.66796875, -34.5390625, -30.41015625, -26.28125, -22.15234375, -18.0234375, -13.89453125, -9.765625, -5.63671875, -1.5078125, 2.62109375, 6.75, 10.87890625, 15.0078125, 19.13671875, 23.265625, 27.39453125, 31.5234375, 35.65234375, 39.78125, 43.91015625, 48.0390625, 52.16796875, 56.296875, 60.42578125, 64.5546875, 68.68359375, 72.8125, 76.94140625, 81.0703125, 85.19921875, 89.328125, 93.45703125, 97.5859375, 101.71484375, 105.84375, 109.97265625, 114.1015625, 118.23046875, 122.359375, 126.48828125, 130.6171875, 134.74609375, 138.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 12.0, 27.0, 71.0, 159.0, 267.0, 257.0, 126.0, 50.0, 18.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.55860900878906, -246.32427978515625, -238.08995056152344, -229.85562133789062, -221.6212921142578, -213.386962890625, -205.15261840820312, -196.91830444335938, -188.6839599609375, -180.4496307373047, -172.21530151367188, -163.98097229003906, -155.74664306640625, -147.51231384277344, -139.27798461914062, -131.04364013671875, -122.809326171875, -114.57499694824219, -106.34066772460938, -98.10633850097656, -89.87200927734375, -81.63768005371094, -73.4033432006836, -65.16901397705078, -56.93468475341797, -48.700355529785156, -40.466026306152344, -32.231693267822266, -23.997364044189453, -15.76303482055664, -7.5287017822265625, 0.70562744140625, 8.93994140625, 17.174270629882812, 25.408601760864258, 33.6429328918457, 41.877262115478516, 50.11159133911133, 58.345924377441406, 66.58025360107422, 74.81458282470703, 83.04891204833984, 91.28324127197266, 99.517578125, 107.75190734863281, 115.98623657226562, 124.22056579589844, 132.45489501953125, 140.68922424316406, 148.92355346679688, 157.1578826904297, 165.3922119140625, 173.6265411376953, 181.86087036132812, 190.09521484375, 198.32952880859375, 206.56387329101562, 214.79820251464844, 223.03253173828125, 231.26686096191406, 239.50119018554688, 247.7355194091797, 255.9698486328125, 264.2041931152344, 272.4385070800781]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 16.0, 17.0, 21.0, 23.0, 13.0, 23.0, 16.0, 24.0, 24.0, 27.0, 29.0, 35.0, 32.0, 27.0, 48.0, 28.0, 27.0, 45.0, 41.0, 29.0, 37.0, 45.0, 30.0, 35.0, 24.0, 24.0, 22.0, 32.0, 22.0, 16.0, 19.0, 12.0, 12.0, 15.0, 8.0, 16.0, 10.0, 7.0, 7.0, 6.0, 11.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-86.99964141845703, -84.47054290771484, -81.94145202636719, -79.412353515625, -76.88325500488281, -74.35415649414062, -71.82505798339844, -69.29596710205078, -66.7668685913086, -64.2377700805664, -61.708675384521484, -59.17958068847656, -56.650482177734375, -54.12138366699219, -51.592288970947266, -49.063194274902344, -46.534095764160156, -44.00499725341797, -41.47590255737305, -38.946807861328125, -36.41770935058594, -33.88861083984375, -31.359516143798828, -28.830419540405273, -26.30132293701172, -23.772226333618164, -21.24312973022461, -18.714033126831055, -16.1849365234375, -13.655839920043945, -11.12674331665039, -8.597646713256836, -6.06854248046875, -3.5394458770751953, -1.0103492736816406, 1.518747329711914, 4.047843933105469, 6.576940536499023, 9.106037139892578, 11.635133743286133, 14.164230346679688, 16.693326950073242, 19.222423553466797, 21.75152015686035, 24.280616760253906, 26.80971336364746, 29.338809967041016, 31.86790657043457, 34.397003173828125, 36.92610168457031, 39.455196380615234, 41.984291076660156, 44.513389587402344, 47.04248809814453, 49.57158279418945, 52.100677490234375, 54.62977600097656, 57.15887451171875, 59.68796920776367, 62.217063903808594, 64.74616241455078, 67.27526092529297, 69.80435180664062, 72.33345031738281, 74.862548828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 12.0, 14.0, 9.0, 14.0, 16.0, 17.0, 17.0, 17.0, 27.0, 20.0, 37.0, 31.0, 40.0, 35.0, 41.0, 47.0, 38.0, 49.0, 52.0, 42.0, 39.0, 40.0, 40.0, 31.0, 24.0, 37.0, 19.0, 34.0, 18.0, 19.0, 11.0, 17.0, 16.0, 8.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0147705078125, -13.521728515625, -13.0286865234375, -12.53564453125, -12.0426025390625, -11.549560546875, -11.0565185546875, -10.5634765625, -10.0704345703125, -9.577392578125, -9.0843505859375, -8.59130859375, -8.0982666015625, -7.605224609375, -7.1121826171875, -6.619140625, -6.1260986328125, -5.633056640625, -5.1400146484375, -4.64697265625, -4.1539306640625, -3.660888671875, -3.1678466796875, -2.6748046875, -2.1817626953125, -1.688720703125, -1.1956787109375, -0.70263671875, -0.2095947265625, 0.283447265625, 0.7764892578125, 1.26953125, 1.7625732421875, 2.255615234375, 2.7486572265625, 3.24169921875, 3.7347412109375, 4.227783203125, 4.7208251953125, 5.2138671875, 5.7069091796875, 6.199951171875, 6.6929931640625, 7.18603515625, 7.6790771484375, 8.172119140625, 8.6651611328125, 9.158203125, 9.6512451171875, 10.144287109375, 10.6373291015625, 11.13037109375, 11.6234130859375, 12.116455078125, 12.6094970703125, 13.1025390625, 13.5955810546875, 14.088623046875, 14.5816650390625, 15.07470703125, 15.5677490234375, 16.060791015625, 16.5538330078125, 17.046875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 14.0, 20.0, 23.0, 50.0, 51.0, 86.0, 125.0, 203.0, 262.0, 422.0, 604.0, 828.0, 1233.0, 1849.0, 2826.0, 4154.0, 6204.0, 9636.0, 14995.0, 23201.0, 36201.0, 58353.0, 94616.0, 148274.0, 192784.0, 163235.0, 106790.0, 65888.0, 41187.0, 26008.0, 16504.0, 10861.0, 6946.0, 4666.0, 3014.0, 2103.0, 1384.0, 1022.0, 606.0, 432.0, 309.0, 172.0, 142.0, 80.0, 56.0, 61.0, 30.0, 14.0, 17.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.0693359375, -2.00390625, -1.9384765625, -1.873046875, -1.8076171875, -1.7421875, -1.6767578125, -1.611328125, -1.5458984375, -1.48046875, -1.4150390625, -1.349609375, -1.2841796875, -1.21875, -1.1533203125, -1.087890625, -1.0224609375, -0.95703125, -0.8916015625, -0.826171875, -0.7607421875, -0.6953125, -0.6298828125, -0.564453125, -0.4990234375, -0.43359375, -0.3681640625, -0.302734375, -0.2373046875, -0.171875, -0.1064453125, -0.041015625, 0.0244140625, 0.08984375, 0.1552734375, 0.220703125, 0.2861328125, 0.3515625, 0.4169921875, 0.482421875, 0.5478515625, 0.61328125, 0.6787109375, 0.744140625, 0.8095703125, 0.875, 0.9404296875, 1.005859375, 1.0712890625, 1.13671875, 1.2021484375, 1.267578125, 1.3330078125, 1.3984375, 1.4638671875, 1.529296875, 1.5947265625, 1.66015625, 1.7255859375, 1.791015625, 1.8564453125, 1.921875, 1.9873046875, 2.052734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 8.0, 5.0, 10.0, 4.0, 14.0, 6.0, 11.0, 14.0, 16.0, 15.0, 23.0, 21.0, 23.0, 25.0, 24.0, 24.0, 32.0, 28.0, 51.0, 39.0, 23.0, 43.0, 1060.0, 31.0, 36.0, 31.0, 44.0, 37.0, 31.0, 37.0, 25.0, 31.0, 28.0, 15.0, 17.0, 25.0, 15.0, 16.0, 16.0, 15.0, 12.0, 11.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0234375, -8.7313232421875, -8.439208984375, -8.1470947265625, -7.85498046875, -7.5628662109375, -7.270751953125, -6.9786376953125, -6.6865234375, -6.3944091796875, -6.102294921875, -5.8101806640625, -5.51806640625, -5.2259521484375, -4.933837890625, -4.6417236328125, -4.349609375, -4.0574951171875, -3.765380859375, -3.4732666015625, -3.18115234375, -2.8890380859375, -2.596923828125, -2.3048095703125, -2.0126953125, -1.7205810546875, -1.428466796875, -1.1363525390625, -0.84423828125, -0.5521240234375, -0.260009765625, 0.0321044921875, 0.32421875, 0.6163330078125, 0.908447265625, 1.2005615234375, 1.49267578125, 1.7847900390625, 2.076904296875, 2.3690185546875, 2.6611328125, 2.9532470703125, 3.245361328125, 3.5374755859375, 3.82958984375, 4.1217041015625, 4.413818359375, 4.7059326171875, 4.998046875, 5.2901611328125, 5.582275390625, 5.8743896484375, 6.16650390625, 6.4586181640625, 6.750732421875, 7.0428466796875, 7.3349609375, 7.6270751953125, 7.919189453125, 8.2113037109375, 8.50341796875, 8.7955322265625, 9.087646484375, 9.3797607421875, 9.671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 11.0, 7.0, 35.0, 26.0, 47.0, 65.0, 79.0, 125.0, 194.0, 257.0, 341.0, 512.0, 766.0, 1109.0, 1701.0, 2423.0, 3504.0, 4994.0, 7766.0, 11535.0, 17569.0, 27266.0, 42950.0, 69358.0, 110358.0, 167745.0, 1229901.0, 142878.0, 92214.0, 56904.0, 36257.0, 22877.0, 14894.0, 9735.0, 6592.0, 4550.0, 3045.0, 1979.0, 1421.0, 974.0, 662.0, 436.0, 342.0, 207.0, 158.0, 124.0, 71.0, 53.0, 34.0, 28.0, 19.0, 10.0, 9.0, 6.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.33984375, -1.298370361328125, -1.25689697265625, -1.215423583984375, -1.1739501953125, -1.132476806640625, -1.09100341796875, -1.049530029296875, -1.008056640625, -0.966583251953125, -0.92510986328125, -0.883636474609375, -0.8421630859375, -0.800689697265625, -0.75921630859375, -0.717742919921875, -0.67626953125, -0.634796142578125, -0.59332275390625, -0.551849365234375, -0.5103759765625, -0.468902587890625, -0.42742919921875, -0.385955810546875, -0.344482421875, -0.303009033203125, -0.26153564453125, -0.220062255859375, -0.1785888671875, -0.137115478515625, -0.09564208984375, -0.054168701171875, -0.0126953125, 0.028778076171875, 0.07025146484375, 0.111724853515625, 0.1531982421875, 0.194671630859375, 0.23614501953125, 0.277618408203125, 0.319091796875, 0.360565185546875, 0.40203857421875, 0.443511962890625, 0.4849853515625, 0.526458740234375, 0.56793212890625, 0.609405517578125, 0.65087890625, 0.692352294921875, 0.73382568359375, 0.775299072265625, 0.8167724609375, 0.858245849609375, 0.89971923828125, 0.941192626953125, 0.982666015625, 1.024139404296875, 1.06561279296875, 1.107086181640625, 1.1485595703125, 1.190032958984375, 1.23150634765625, 1.272979736328125, 1.314453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 2.0, 1.0, 6.0, 8.0, 7.0, 4.0, 6.0, 9.0, 2.0, 12.0, 11.0, 16.0, 20.0, 17.0, 31.0, 32.0, 33.0, 39.0, 53.0, 78.0, 125.0, 97.0, 79.0, 62.0, 44.0, 38.0, 34.0, 19.0, 21.0, 17.0, 18.0, 12.0, 9.0, 9.0, 11.0, 3.0, 2.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033294677734375, -0.03213977813720703, -0.030984878540039062, -0.029829978942871094, -0.028675079345703125, -0.027520179748535156, -0.026365280151367188, -0.02521038055419922, -0.02405548095703125, -0.02290058135986328, -0.021745681762695312, -0.020590782165527344, -0.019435882568359375, -0.018280982971191406, -0.017126083374023438, -0.01597118377685547, -0.0148162841796875, -0.013661384582519531, -0.012506484985351562, -0.011351585388183594, -0.010196685791015625, -0.009041786193847656, -0.007886886596679688, -0.006731986999511719, -0.00557708740234375, -0.004422187805175781, -0.0032672882080078125, -0.0021123886108398438, -0.000957489013671875, 0.00019741058349609375, 0.0013523101806640625, 0.0025072097778320312, 0.003662109375, 0.004817008972167969, 0.0059719085693359375, 0.007126808166503906, 0.008281707763671875, 0.009436607360839844, 0.010591506958007812, 0.011746406555175781, 0.01290130615234375, 0.014056205749511719, 0.015211105346679688, 0.016366004943847656, 0.017520904541015625, 0.018675804138183594, 0.019830703735351562, 0.02098560333251953, 0.0221405029296875, 0.02329540252685547, 0.024450302124023438, 0.025605201721191406, 0.026760101318359375, 0.027915000915527344, 0.029069900512695312, 0.03022480010986328, 0.03137969970703125, 0.03253459930419922, 0.03368949890136719, 0.034844398498535156, 0.035999298095703125, 0.037154197692871094, 0.03830909729003906, 0.03946399688720703, 0.040618896484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 2.0, 6.0, 13.0, 11.0, 11.0, 24.0, 24.0, 33.0, 34.0, 53.0, 82.0, 111.0, 168.0, 328.0, 819.0, 80248.0, 964046.0, 1478.0, 348.0, 228.0, 132.0, 81.0, 63.0, 32.0, 27.0, 29.0, 21.0, 18.0, 9.0, 15.0, 10.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87255859375, -0.8477325439453125, -0.822906494140625, -0.7980804443359375, -0.77325439453125, -0.7484283447265625, -0.723602294921875, -0.6987762451171875, -0.6739501953125, -0.6491241455078125, -0.624298095703125, -0.5994720458984375, -0.57464599609375, -0.5498199462890625, -0.524993896484375, -0.5001678466796875, -0.475341796875, -0.4505157470703125, -0.425689697265625, -0.4008636474609375, -0.37603759765625, -0.3512115478515625, -0.326385498046875, -0.3015594482421875, -0.2767333984375, -0.2519073486328125, -0.227081298828125, -0.2022552490234375, -0.17742919921875, -0.1526031494140625, -0.127777099609375, -0.1029510498046875, -0.078125, -0.0532989501953125, -0.028472900390625, -0.0036468505859375, 0.02117919921875, 0.0460052490234375, 0.070831298828125, 0.0956573486328125, 0.1204833984375, 0.1453094482421875, 0.170135498046875, 0.1949615478515625, 0.21978759765625, 0.2446136474609375, 0.269439697265625, 0.2942657470703125, 0.319091796875, 0.3439178466796875, 0.368743896484375, 0.3935699462890625, 0.41839599609375, 0.4432220458984375, 0.468048095703125, 0.4928741455078125, 0.5177001953125, 0.5425262451171875, 0.567352294921875, 0.5921783447265625, 0.61700439453125, 0.6418304443359375, 0.666656494140625, 0.6914825439453125, 0.71630859375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 79.0, 928.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2220216691493988, -0.19803713262081146, -0.17405261099338531, -0.15006807446479797, -0.12608355283737183, -0.10209901630878448, -0.07811447978019714, -0.054129958152770996, -0.030145421624183655, -0.006160890683531761, 0.017823640257120132, 0.041808173060417175, 0.06579270213842392, 0.08977723121643066, 0.113761767745018, 0.13774628937244415, 0.1617308259010315, 0.18571536242961884, 0.20969988405704498, 0.23368442058563232, 0.25766894221305847, 0.2816534638404846, 0.30563801527023315, 0.3296225368976593, 0.35360705852508545, 0.3775915801525116, 0.40157613158226013, 0.4255606532096863, 0.4495451748371124, 0.4735296964645386, 0.4975142478942871, 0.5214987993240356, 0.5454832911491394, 0.5694678425788879, 0.5934523344039917, 0.6174368858337402, 0.6414214372634888, 0.6654059290885925, 0.6893904805183411, 0.7133749723434448, 0.7373595237731934, 0.7613440752029419, 0.7853285670280457, 0.8093131184577942, 0.8332976698875427, 0.8572821617126465, 0.881266713142395, 0.9052512645721436, 0.9292358160018921, 0.9532203674316406, 0.9772048592567444, 1.0011894702911377, 1.0251739025115967, 1.0491584539413452, 1.0731430053710938, 1.0971275568008423, 1.1211119890213013, 1.1450965404510498, 1.1690810918807983, 1.1930656433105469, 1.2170500755310059, 1.2410346269607544, 1.265019178390503, 1.2890037298202515, 1.31298828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 4.0, 8.0, 11.0, 17.0, 19.0, 21.0, 19.0, 35.0, 34.0, 26.0, 41.0, 30.0, 42.0, 46.0, 45.0, 52.0, 40.0, 49.0, 44.0, 46.0, 45.0, 28.0, 51.0, 24.0, 28.0, 22.0, 28.0, 30.0, 13.0, 14.0, 14.0, 10.0, 14.0, 6.0, 7.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06216925382614136, -0.06041756272315979, -0.05866587162017822, -0.05691417679190636, -0.05516248568892479, -0.05341079458594322, -0.051659099757671356, -0.04990740865468979, -0.04815571755170822, -0.046404026448726654, -0.04465233534574509, -0.04290064051747322, -0.04114894941449165, -0.039397258311510086, -0.03764556348323822, -0.03589387238025665, -0.034142181277275085, -0.03239049017429352, -0.0306387972086668, -0.028887104243040085, -0.027135413140058517, -0.02538372203707695, -0.023632029071450233, -0.021880336105823517, -0.02012864500284195, -0.018376953899860382, -0.016625260934233665, -0.014873568899929523, -0.013121876865625381, -0.01137018483132124, -0.009618492797017097, -0.007866800762712955, -0.0061151087284088135, -0.0043634166941046715, -0.0026117246598005295, -0.0008600326254963875, 0.0008916594088077545, 0.0026433514431118965, 0.0043950434774160385, 0.0061467355117201805, 0.007898427546024323, 0.009650119580328465, 0.011401811614632607, 0.013153503648936749, 0.01490519568324089, 0.016656886786222458, 0.018408579751849174, 0.02016027271747589, 0.02191196382045746, 0.023663654923439026, 0.025415347889065742, 0.02716704085469246, 0.028918731957674026, 0.030670423060655594, 0.03242211788892746, 0.03417380899190903, 0.035925500094890594, 0.03767719119787216, 0.03942888230085373, 0.041180577129125595, 0.04293226823210716, 0.04468395933508873, 0.046435654163360596, 0.04818734526634216, 0.04993903636932373]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 12.0, 14.0, 9.0, 14.0, 16.0, 17.0, 17.0, 16.0, 28.0, 20.0, 35.0, 33.0, 40.0, 34.0, 42.0, 47.0, 38.0, 49.0, 52.0, 42.0, 39.0, 40.0, 40.0, 31.0, 24.0, 37.0, 19.0, 34.0, 17.0, 20.0, 11.0, 17.0, 16.0, 8.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0147705078125, -13.521728515625, -13.0286865234375, -12.53564453125, -12.0426025390625, -11.549560546875, -11.0565185546875, -10.5634765625, -10.0704345703125, -9.577392578125, -9.0843505859375, -8.59130859375, -8.0982666015625, -7.605224609375, -7.1121826171875, -6.619140625, -6.1260986328125, -5.633056640625, -5.1400146484375, -4.64697265625, -4.1539306640625, -3.660888671875, -3.1678466796875, -2.6748046875, -2.1817626953125, -1.688720703125, -1.1956787109375, -0.70263671875, -0.2095947265625, 0.283447265625, 0.7764892578125, 1.26953125, 1.7625732421875, 2.255615234375, 2.7486572265625, 3.24169921875, 3.7347412109375, 4.227783203125, 4.7208251953125, 5.2138671875, 5.7069091796875, 6.199951171875, 6.6929931640625, 7.18603515625, 7.6790771484375, 8.172119140625, 8.6651611328125, 9.158203125, 9.6512451171875, 10.144287109375, 10.6373291015625, 11.13037109375, 11.6234130859375, 12.116455078125, 12.6094970703125, 13.1025390625, 13.5955810546875, 14.088623046875, 14.5816650390625, 15.07470703125, 15.5677490234375, 16.060791015625, 16.5538330078125, 17.046875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 10.0, 14.0, 26.0, 32.0, 37.0, 40.0, 43.0, 80.0, 103.0, 135.0, 189.0, 300.0, 495.0, 753.0, 1101.0, 1767.0, 3100.0, 6164.0, 15083.0, 79838.0, 829055.0, 80390.0, 15412.0, 6122.0, 3116.0, 1783.0, 1132.0, 722.0, 453.0, 306.0, 221.0, 151.0, 81.0, 67.0, 38.0, 38.0, 33.0, 31.0, 16.0, 15.0, 17.0, 5.0, 6.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.328125, -27.367919921875, -26.40771484375, -25.447509765625, -24.4873046875, -23.527099609375, -22.56689453125, -21.606689453125, -20.646484375, -19.686279296875, -18.72607421875, -17.765869140625, -16.8056640625, -15.845458984375, -14.88525390625, -13.925048828125, -12.96484375, -12.004638671875, -11.04443359375, -10.084228515625, -9.1240234375, -8.163818359375, -7.20361328125, -6.243408203125, -5.283203125, -4.322998046875, -3.36279296875, -2.402587890625, -1.4423828125, -0.482177734375, 0.47802734375, 1.438232421875, 2.3984375, 3.358642578125, 4.31884765625, 5.279052734375, 6.2392578125, 7.199462890625, 8.15966796875, 9.119873046875, 10.080078125, 11.040283203125, 12.00048828125, 12.960693359375, 13.9208984375, 14.881103515625, 15.84130859375, 16.801513671875, 17.76171875, 18.721923828125, 19.68212890625, 20.642333984375, 21.6025390625, 22.562744140625, 23.52294921875, 24.483154296875, 25.443359375, 26.403564453125, 27.36376953125, 28.323974609375, 29.2841796875, 30.244384765625, 31.20458984375, 32.164794921875, 33.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 14.0, 20.0, 24.0, 22.0, 35.0, 37.0, 51.0, 39.0, 52.0, 50.0, 97.0, 510.0, 1571.0, 84.0, 36.0, 55.0, 45.0, 43.0, 31.0, 35.0, 19.0, 16.0, 16.0, 11.0, 12.0, 9.0, 7.0, 15.0, 7.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-60.0, -58.33349609375, -56.6669921875, -55.00048828125, -53.333984375, -51.66748046875, -50.0009765625, -48.33447265625, -46.66796875, -45.00146484375, -43.3349609375, -41.66845703125, -40.001953125, -38.33544921875, -36.6689453125, -35.00244140625, -33.3359375, -31.66943359375, -30.0029296875, -28.33642578125, -26.669921875, -25.00341796875, -23.3369140625, -21.67041015625, -20.00390625, -18.33740234375, -16.6708984375, -15.00439453125, -13.337890625, -11.67138671875, -10.0048828125, -8.33837890625, -6.671875, -5.00537109375, -3.3388671875, -1.67236328125, -0.005859375, 1.66064453125, 3.3271484375, 4.99365234375, 6.66015625, 8.32666015625, 9.9931640625, 11.65966796875, 13.326171875, 14.99267578125, 16.6591796875, 18.32568359375, 19.9921875, 21.65869140625, 23.3251953125, 24.99169921875, 26.658203125, 28.32470703125, 29.9912109375, 31.65771484375, 33.32421875, 34.99072265625, 36.6572265625, 38.32373046875, 39.990234375, 41.65673828125, 43.3232421875, 44.98974609375, 46.65625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 5.0, 15.0, 7.0, 12.0, 17.0, 15.0, 15.0, 19.0, 32.0, 52.0, 58.0, 83.0, 119.0, 272.0, 905.0, 6549.0, 2945620.0, 186451.0, 4103.0, 622.0, 231.0, 124.0, 87.0, 50.0, 49.0, 40.0, 26.0, 22.0, 14.0, 19.0, 13.0, 9.0, 10.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.25, -101.4765625, -97.703125, -93.9296875, -90.15625, -86.3828125, -82.609375, -78.8359375, -75.0625, -71.2890625, -67.515625, -63.7421875, -59.96875, -56.1953125, -52.421875, -48.6484375, -44.875, -41.1015625, -37.328125, -33.5546875, -29.78125, -26.0078125, -22.234375, -18.4609375, -14.6875, -10.9140625, -7.140625, -3.3671875, 0.40625, 4.1796875, 7.953125, 11.7265625, 15.5, 19.2734375, 23.046875, 26.8203125, 30.59375, 34.3671875, 38.140625, 41.9140625, 45.6875, 49.4609375, 53.234375, 57.0078125, 60.78125, 64.5546875, 68.328125, 72.1015625, 75.875, 79.6484375, 83.421875, 87.1953125, 90.96875, 94.7421875, 98.515625, 102.2890625, 106.0625, 109.8359375, 113.609375, 117.3828125, 121.15625, 124.9296875, 128.703125, 132.4765625, 136.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 40.0, 214.0, 478.0, 220.0, 48.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.16341781616211, -35.44236373901367, -30.721309661865234, -26.000255584716797, -21.27920150756836, -16.558147430419922, -11.837093353271484, -7.116039276123047, -2.3949851989746094, 2.326068878173828, 7.047122955322266, 11.768177032470703, 16.48923110961914, 21.210285186767578, 25.931339263916016, 30.652393341064453, 35.37344741821289, 40.09450149536133, 44.815555572509766, 49.5366096496582, 54.25766372680664, 58.97871780395508, 63.699771881103516, 68.42082214355469, 73.14187622070312, 77.86293029785156, 82.583984375, 87.30503845214844, 92.02609252929688, 96.74714660644531, 101.46820068359375, 106.18925476074219, 110.91030883789062, 115.63136291503906, 120.3524169921875, 125.07347106933594, 129.79452514648438, 134.5155792236328, 139.23663330078125, 143.9576873779297, 148.67874145507812, 153.39979553222656, 158.120849609375, 162.84190368652344, 167.56295776367188, 172.2840118408203, 177.00506591796875, 181.7261199951172, 186.44717407226562, 191.16822814941406, 195.8892822265625, 200.61033630371094, 205.33139038085938, 210.0524444580078, 214.77349853515625, 219.4945526123047, 224.21560668945312, 228.93666076660156, 233.65771484375, 238.37876892089844, 243.09982299804688, 247.8208770751953, 252.54193115234375, 257.26300048828125, 261.9840393066406]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 13.0, 16.0, 18.0, 25.0, 13.0, 23.0, 21.0, 31.0, 33.0, 29.0, 26.0, 43.0, 42.0, 33.0, 28.0, 29.0, 39.0, 36.0, 42.0, 48.0, 33.0, 32.0, 31.0, 33.0, 30.0, 25.0, 31.0, 31.0, 20.0, 24.0, 16.0, 18.0, 9.0, 5.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-109.09172821044922, -105.55287170410156, -102.01400756835938, -98.47515106201172, -94.93629455566406, -91.3974380493164, -87.85858154296875, -84.31971740722656, -80.7808609008789, -77.24200439453125, -73.70314025878906, -70.1642837524414, -66.62542724609375, -63.086570739746094, -59.54771041870117, -56.00885009765625, -52.469993591308594, -48.93113708496094, -45.392276763916016, -41.853416442871094, -38.31455993652344, -34.77570343017578, -31.23684310913086, -27.69798469543457, -24.15912628173828, -20.620267868041992, -17.081409454345703, -13.542551040649414, -10.003692626953125, -6.464834213256836, -2.925975799560547, 0.6128826141357422, 4.1517486572265625, 7.690607070922852, 11.22946548461914, 14.76832389831543, 18.30718231201172, 21.846040725708008, 25.384899139404297, 28.923757553100586, 32.462615966796875, 36.00147247314453, 39.54033279418945, 43.079193115234375, 46.61804962158203, 50.15690612792969, 53.69576644897461, 57.23462677001953, 60.77348327636719, 64.31233978271484, 67.8511962890625, 71.39006042480469, 74.92891693115234, 78.4677734375, 82.00663757324219, 85.54549407958984, 89.0843505859375, 92.62320709228516, 96.16206359863281, 99.700927734375, 103.23978424072266, 106.77864074707031, 110.3175048828125, 113.85636138916016, 117.39521789550781]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 16.0, 12.0, 18.0, 15.0, 15.0, 22.0, 15.0, 27.0, 24.0, 34.0, 35.0, 32.0, 42.0, 46.0, 46.0, 49.0, 47.0, 40.0, 46.0, 41.0, 41.0, 39.0, 30.0, 32.0, 22.0, 26.0, 21.0, 26.0, 17.0, 18.0, 11.0, 14.0, 11.0, 15.0, 6.0, 10.0, 3.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9609375, -15.4285888671875, -14.896240234375, -14.3638916015625, -13.83154296875, -13.2991943359375, -12.766845703125, -12.2344970703125, -11.7021484375, -11.1697998046875, -10.637451171875, -10.1051025390625, -9.57275390625, -9.0404052734375, -8.508056640625, -7.9757080078125, -7.443359375, -6.9110107421875, -6.378662109375, -5.8463134765625, -5.31396484375, -4.7816162109375, -4.249267578125, -3.7169189453125, -3.1845703125, -2.6522216796875, -2.119873046875, -1.5875244140625, -1.05517578125, -0.5228271484375, 0.009521484375, 0.5418701171875, 1.07421875, 1.6065673828125, 2.138916015625, 2.6712646484375, 3.20361328125, 3.7359619140625, 4.268310546875, 4.8006591796875, 5.3330078125, 5.8653564453125, 6.397705078125, 6.9300537109375, 7.46240234375, 7.9947509765625, 8.527099609375, 9.0594482421875, 9.591796875, 10.1241455078125, 10.656494140625, 11.1888427734375, 11.72119140625, 12.2535400390625, 12.785888671875, 13.3182373046875, 13.8505859375, 14.3829345703125, 14.915283203125, 15.4476318359375, 15.97998046875, 16.5123291015625, 17.044677734375, 17.5770263671875, 18.109375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 15.0, 3.0, 12.0, 19.0, 17.0, 30.0, 35.0, 55.0, 95.0, 154.0, 253.0, 528.0, 1022.0, 2143.0, 4781.0, 11839.0, 38206.0, 233782.0, 1949356.0, 1712486.0, 187415.0, 32706.0, 10530.0, 4500.0, 2028.0, 958.0, 551.0, 283.0, 149.0, 88.0, 70.0, 42.0, 36.0, 22.0, 13.0, 10.0, 11.0, 4.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-35.0, -33.93798828125, -32.8759765625, -31.81396484375, -30.751953125, -29.68994140625, -28.6279296875, -27.56591796875, -26.50390625, -25.44189453125, -24.3798828125, -23.31787109375, -22.255859375, -21.19384765625, -20.1318359375, -19.06982421875, -18.0078125, -16.94580078125, -15.8837890625, -14.82177734375, -13.759765625, -12.69775390625, -11.6357421875, -10.57373046875, -9.51171875, -8.44970703125, -7.3876953125, -6.32568359375, -5.263671875, -4.20166015625, -3.1396484375, -2.07763671875, -1.015625, 0.04638671875, 1.1083984375, 2.17041015625, 3.232421875, 4.29443359375, 5.3564453125, 6.41845703125, 7.48046875, 8.54248046875, 9.6044921875, 10.66650390625, 11.728515625, 12.79052734375, 13.8525390625, 14.91455078125, 15.9765625, 17.03857421875, 18.1005859375, 19.16259765625, 20.224609375, 21.28662109375, 22.3486328125, 23.41064453125, 24.47265625, 25.53466796875, 26.5966796875, 27.65869140625, 28.720703125, 29.78271484375, 30.8447265625, 31.90673828125, 32.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 12.0, 9.0, 12.0, 17.0, 32.0, 38.0, 48.0, 79.0, 113.0, 157.0, 325.0, 598.0, 763.0, 699.0, 470.0, 257.0, 138.0, 85.0, 57.0, 40.0, 36.0, 18.0, 19.0, 16.0, 3.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-51.625, -50.41845703125, -49.2119140625, -48.00537109375, -46.798828125, -45.59228515625, -44.3857421875, -43.17919921875, -41.97265625, -40.76611328125, -39.5595703125, -38.35302734375, -37.146484375, -35.93994140625, -34.7333984375, -33.52685546875, -32.3203125, -31.11376953125, -29.9072265625, -28.70068359375, -27.494140625, -26.28759765625, -25.0810546875, -23.87451171875, -22.66796875, -21.46142578125, -20.2548828125, -19.04833984375, -17.841796875, -16.63525390625, -15.4287109375, -14.22216796875, -13.015625, -11.80908203125, -10.6025390625, -9.39599609375, -8.189453125, -6.98291015625, -5.7763671875, -4.56982421875, -3.36328125, -2.15673828125, -0.9501953125, 0.25634765625, 1.462890625, 2.66943359375, 3.8759765625, 5.08251953125, 6.2890625, 7.49560546875, 8.7021484375, 9.90869140625, 11.115234375, 12.32177734375, 13.5283203125, 14.73486328125, 15.94140625, 17.14794921875, 18.3544921875, 19.56103515625, 20.767578125, 21.97412109375, 23.1806640625, 24.38720703125, 25.59375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 9.0, 17.0, 37.0, 39.0, 78.0, 98.0, 163.0, 321.0, 825.0, 2465.0, 12273.0, 139031.0, 3772167.0, 244627.0, 17226.0, 3008.0, 936.0, 391.0, 212.0, 115.0, 83.0, 40.0, 35.0, 17.0, 20.0, 14.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -61.6904296875, -58.693359375, -55.6962890625, -52.69921875, -49.7021484375, -46.705078125, -43.7080078125, -40.7109375, -37.7138671875, -34.716796875, -31.7197265625, -28.72265625, -25.7255859375, -22.728515625, -19.7314453125, -16.734375, -13.7373046875, -10.740234375, -7.7431640625, -4.74609375, -1.7490234375, 1.248046875, 4.2451171875, 7.2421875, 10.2392578125, 13.236328125, 16.2333984375, 19.23046875, 22.2275390625, 25.224609375, 28.2216796875, 31.21875, 34.2158203125, 37.212890625, 40.2099609375, 43.20703125, 46.2041015625, 49.201171875, 52.1982421875, 55.1953125, 58.1923828125, 61.189453125, 64.1865234375, 67.18359375, 70.1806640625, 73.177734375, 76.1748046875, 79.171875, 82.1689453125, 85.166015625, 88.1630859375, 91.16015625, 94.1572265625, 97.154296875, 100.1513671875, 103.1484375, 106.1455078125, 109.142578125, 112.1396484375, 115.13671875, 118.1337890625, 121.130859375, 124.1279296875, 127.125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 23.0, 55.0, 182.0, 317.0, 260.0, 118.0, 43.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6817626953125, -96.8416519165039, -87.00153350830078, -77.16142272949219, -67.32130432128906, -57.48119354248047, -47.641082763671875, -37.80096435546875, -27.960853576660156, -18.120738983154297, -8.28062629699707, 1.5594863891601562, 11.399600982666016, 21.239715576171875, 31.07982635498047, 40.919944763183594, 50.76005554199219, 60.60017013549805, 70.4402847290039, 80.2803955078125, 90.12051391601562, 99.96062469482422, 109.80073547363281, 119.64085388183594, 129.48095703125, 139.32107543945312, 149.1611785888672, 159.0012969970703, 168.84141540527344, 178.6815185546875, 188.52163696289062, 198.36175537109375, 208.20187377929688, 218.0419921875, 227.88209533691406, 237.7222137451172, 247.5623321533203, 257.4024353027344, 267.2425537109375, 277.0826721191406, 286.92279052734375, 296.7629089355469, 306.60302734375, 316.443115234375, 326.2832336425781, 336.12335205078125, 345.9634704589844, 355.8035888671875, 365.6436767578125, 375.4837951660156, 385.32391357421875, 395.16400146484375, 405.0041198730469, 414.84423828125, 424.6843566894531, 434.52447509765625, 444.3645935058594, 454.2047119140625, 464.0448303222656, 473.88494873046875, 483.72503662109375, 493.5651550292969, 503.4052734375, 513.245361328125, 523.0855102539062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 5.0, 15.0, 7.0, 19.0, 14.0, 28.0, 22.0, 28.0, 25.0, 28.0, 24.0, 26.0, 31.0, 44.0, 34.0, 30.0, 38.0, 55.0, 40.0, 43.0, 34.0, 38.0, 44.0, 26.0, 42.0, 20.0, 23.0, 25.0, 24.0, 17.0, 16.0, 14.0, 22.0, 12.0, 12.0, 5.0, 9.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-90.29818725585938, -87.43455505371094, -84.5709228515625, -81.70728302001953, -78.8436508178711, -75.98001861572266, -73.11637878417969, -70.25274658203125, -67.38911437988281, -64.52548217773438, -61.66184616088867, -58.79821014404297, -55.93457794189453, -53.070945739746094, -50.20730972290039, -47.34367370605469, -44.48004150390625, -41.61640930175781, -38.75277328491211, -35.889137268066406, -33.02550506591797, -30.1618709564209, -27.298236846923828, -24.434602737426758, -21.570968627929688, -18.707334518432617, -15.843700408935547, -12.980066299438477, -10.116432189941406, -7.252798080444336, -4.389163970947266, -1.5255298614501953, 1.338104248046875, 4.201738357543945, 7.065372467041016, 9.929006576538086, 12.792640686035156, 15.656274795532227, 18.519908905029297, 21.383543014526367, 24.247177124023438, 27.110811233520508, 29.974445343017578, 32.83808135986328, 35.70171356201172, 38.565345764160156, 41.42898178100586, 44.29261779785156, 47.15625, 50.01988220214844, 52.88351821899414, 55.747154235839844, 58.61078643798828, 61.47441864013672, 64.33805847167969, 67.20169067382812, 70.06532287597656, 72.928955078125, 75.79258728027344, 78.6562271118164, 81.51985931396484, 84.38349151611328, 87.24713134765625, 90.11076354980469, 92.97439575195312]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 14.0, 7.0, 14.0, 17.0, 19.0, 20.0, 28.0, 31.0, 33.0, 37.0, 46.0, 31.0, 33.0, 37.0, 44.0, 57.0, 48.0, 40.0, 41.0, 41.0, 44.0, 48.0, 27.0, 32.0, 26.0, 26.0, 24.0, 19.0, 21.0, 12.0, 15.0, 12.0, 11.0, 6.0, 7.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.1484375, -15.578125, -15.0078125, -14.4375, -13.8671875, -13.296875, -12.7265625, -12.15625, -11.5859375, -11.015625, -10.4453125, -9.875, -9.3046875, -8.734375, -8.1640625, -7.59375, -7.0234375, -6.453125, -5.8828125, -5.3125, -4.7421875, -4.171875, -3.6015625, -3.03125, -2.4609375, -1.890625, -1.3203125, -0.75, -0.1796875, 0.390625, 0.9609375, 1.53125, 2.1015625, 2.671875, 3.2421875, 3.8125, 4.3828125, 4.953125, 5.5234375, 6.09375, 6.6640625, 7.234375, 7.8046875, 8.375, 8.9453125, 9.515625, 10.0859375, 10.65625, 11.2265625, 11.796875, 12.3671875, 12.9375, 13.5078125, 14.078125, 14.6484375, 15.21875, 15.7890625, 16.359375, 16.9296875, 17.5, 18.0703125, 18.640625, 19.2109375, 19.78125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 10.0, 17.0, 30.0, 28.0, 42.0, 61.0, 91.0, 141.0, 231.0, 335.0, 544.0, 802.0, 1172.0, 2024.0, 3120.0, 4852.0, 7819.0, 12196.0, 19614.0, 31750.0, 52371.0, 86873.0, 138996.0, 197384.0, 180678.0, 118911.0, 72402.0, 44045.0, 26704.0, 16876.0, 10341.0, 6469.0, 4198.0, 2723.0, 1637.0, 1081.0, 704.0, 419.0, 265.0, 178.0, 147.0, 89.0, 69.0, 29.0, 28.0, 17.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-2.291015625, -2.221221923828125, -2.15142822265625, -2.081634521484375, -2.0118408203125, -1.942047119140625, -1.87225341796875, -1.802459716796875, -1.732666015625, -1.662872314453125, -1.59307861328125, -1.523284912109375, -1.4534912109375, -1.383697509765625, -1.31390380859375, -1.244110107421875, -1.17431640625, -1.104522705078125, -1.03472900390625, -0.964935302734375, -0.8951416015625, -0.825347900390625, -0.75555419921875, -0.685760498046875, -0.615966796875, -0.546173095703125, -0.47637939453125, -0.406585693359375, -0.3367919921875, -0.266998291015625, -0.19720458984375, -0.127410888671875, -0.0576171875, 0.012176513671875, 0.08197021484375, 0.151763916015625, 0.2215576171875, 0.291351318359375, 0.36114501953125, 0.430938720703125, 0.500732421875, 0.570526123046875, 0.64031982421875, 0.710113525390625, 0.7799072265625, 0.849700927734375, 0.91949462890625, 0.989288330078125, 1.05908203125, 1.128875732421875, 1.19866943359375, 1.268463134765625, 1.3382568359375, 1.408050537109375, 1.47784423828125, 1.547637939453125, 1.617431640625, 1.687225341796875, 1.75701904296875, 1.826812744140625, 1.8966064453125, 1.966400146484375, 2.03619384765625, 2.105987548828125, 2.17578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 0.0, 4.0, 4.0, 5.0, 11.0, 7.0, 9.0, 9.0, 16.0, 16.0, 19.0, 20.0, 40.0, 15.0, 32.0, 42.0, 32.0, 32.0, 39.0, 36.0, 29.0, 36.0, 48.0, 1057.0, 45.0, 38.0, 36.0, 34.0, 37.0, 25.0, 32.0, 20.0, 28.0, 18.0, 26.0, 13.0, 20.0, 23.0, 12.0, 10.0, 10.0, 12.0, 6.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.4921875, -10.1650390625, -9.837890625, -9.5107421875, -9.18359375, -8.8564453125, -8.529296875, -8.2021484375, -7.875, -7.5478515625, -7.220703125, -6.8935546875, -6.56640625, -6.2392578125, -5.912109375, -5.5849609375, -5.2578125, -4.9306640625, -4.603515625, -4.2763671875, -3.94921875, -3.6220703125, -3.294921875, -2.9677734375, -2.640625, -2.3134765625, -1.986328125, -1.6591796875, -1.33203125, -1.0048828125, -0.677734375, -0.3505859375, -0.0234375, 0.3037109375, 0.630859375, 0.9580078125, 1.28515625, 1.6123046875, 1.939453125, 2.2666015625, 2.59375, 2.9208984375, 3.248046875, 3.5751953125, 3.90234375, 4.2294921875, 4.556640625, 4.8837890625, 5.2109375, 5.5380859375, 5.865234375, 6.1923828125, 6.51953125, 6.8466796875, 7.173828125, 7.5009765625, 7.828125, 8.1552734375, 8.482421875, 8.8095703125, 9.13671875, 9.4638671875, 9.791015625, 10.1181640625, 10.4453125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 19.0, 25.0, 35.0, 65.0, 104.0, 133.0, 197.0, 283.0, 388.0, 595.0, 900.0, 1344.0, 2110.0, 3088.0, 4718.0, 7200.0, 11483.0, 18208.0, 29490.0, 49203.0, 82090.0, 136959.0, 1219943.0, 216907.0, 122380.0, 73075.0, 43764.0, 26457.0, 16543.0, 10285.0, 6614.0, 4220.0, 2754.0, 1826.0, 1224.0, 812.0, 569.0, 327.0, 256.0, 156.0, 111.0, 74.0, 52.0, 30.0, 33.0, 25.0, 19.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5272979736328125, -1.479400634765625, -1.4315032958984375, -1.38360595703125, -1.3357086181640625, -1.287811279296875, -1.2399139404296875, -1.1920166015625, -1.1441192626953125, -1.096221923828125, -1.0483245849609375, -1.00042724609375, -0.9525299072265625, -0.904632568359375, -0.8567352294921875, -0.808837890625, -0.7609405517578125, -0.713043212890625, -0.6651458740234375, -0.61724853515625, -0.5693511962890625, -0.521453857421875, -0.4735565185546875, -0.4256591796875, -0.3777618408203125, -0.329864501953125, -0.2819671630859375, -0.23406982421875, -0.1861724853515625, -0.138275146484375, -0.0903778076171875, -0.04248046875, 0.0054168701171875, 0.053314208984375, 0.1012115478515625, 0.14910888671875, 0.1970062255859375, 0.244903564453125, 0.2928009033203125, 0.3406982421875, 0.3885955810546875, 0.436492919921875, 0.4843902587890625, 0.53228759765625, 0.5801849365234375, 0.628082275390625, 0.6759796142578125, 0.723876953125, 0.7717742919921875, 0.819671630859375, 0.8675689697265625, 0.91546630859375, 0.9633636474609375, 1.011260986328125, 1.0591583251953125, 1.1070556640625, 1.1549530029296875, 1.202850341796875, 1.2507476806640625, 1.29864501953125, 1.3465423583984375, 1.394439697265625, 1.4423370361328125, 1.490234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 3.0, 7.0, 11.0, 14.0, 11.0, 18.0, 22.0, 36.0, 50.0, 47.0, 82.0, 95.0, 105.0, 105.0, 84.0, 58.0, 53.0, 41.0, 32.0, 31.0, 21.0, 12.0, 8.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0380859375, -0.03703045845031738, -0.035974979400634766, -0.03491950035095215, -0.03386402130126953, -0.032808542251586914, -0.0317530632019043, -0.03069758415222168, -0.029642105102539062, -0.028586626052856445, -0.027531147003173828, -0.02647566795349121, -0.025420188903808594, -0.024364709854125977, -0.02330923080444336, -0.022253751754760742, -0.021198272705078125, -0.020142793655395508, -0.01908731460571289, -0.018031835556030273, -0.016976356506347656, -0.01592087745666504, -0.014865398406982422, -0.013809919357299805, -0.012754440307617188, -0.01169896125793457, -0.010643482208251953, -0.009588003158569336, -0.008532524108886719, -0.0074770450592041016, -0.006421566009521484, -0.005366086959838867, -0.00431060791015625, -0.003255128860473633, -0.0021996498107910156, -0.0011441707611083984, -8.869171142578125e-05, 0.0009667873382568359, 0.002022266387939453, 0.0030777454376220703, 0.0041332244873046875, 0.005188703536987305, 0.006244182586669922, 0.007299661636352539, 0.008355140686035156, 0.009410619735717773, 0.01046609878540039, 0.011521577835083008, 0.012577056884765625, 0.013632535934448242, 0.01468801498413086, 0.015743494033813477, 0.016798973083496094, 0.01785445213317871, 0.018909931182861328, 0.019965410232543945, 0.021020889282226562, 0.02207636833190918, 0.023131847381591797, 0.024187326431274414, 0.02524280548095703, 0.02629828453063965, 0.027353763580322266, 0.028409242630004883, 0.0294647216796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 3.0, 3.0, 15.0, 9.0, 13.0, 22.0, 23.0, 34.0, 52.0, 64.0, 111.0, 143.0, 299.0, 988.0, 683170.0, 361801.0, 913.0, 318.0, 174.0, 108.0, 73.0, 48.0, 40.0, 24.0, 21.0, 18.0, 14.0, 3.0, 8.0, 3.0, 10.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5965423583984375, -0.574432373046875, -0.5523223876953125, -0.53021240234375, -0.5081024169921875, -0.485992431640625, -0.4638824462890625, -0.4417724609375, -0.4196624755859375, -0.397552490234375, -0.3754425048828125, -0.35333251953125, -0.3312225341796875, -0.309112548828125, -0.2870025634765625, -0.264892578125, -0.2427825927734375, -0.220672607421875, -0.1985626220703125, -0.17645263671875, -0.1543426513671875, -0.132232666015625, -0.1101226806640625, -0.0880126953125, -0.0659027099609375, -0.043792724609375, -0.0216827392578125, 0.00042724609375, 0.0225372314453125, 0.044647216796875, 0.0667572021484375, 0.0888671875, 0.1109771728515625, 0.133087158203125, 0.1551971435546875, 0.17730712890625, 0.1994171142578125, 0.221527099609375, 0.2436370849609375, 0.2657470703125, 0.2878570556640625, 0.309967041015625, 0.3320770263671875, 0.35418701171875, 0.3762969970703125, 0.398406982421875, 0.4205169677734375, 0.442626953125, 0.4647369384765625, 0.486846923828125, 0.5089569091796875, 0.53106689453125, 0.5531768798828125, 0.575286865234375, 0.5973968505859375, 0.6195068359375, 0.6416168212890625, 0.663726806640625, 0.6858367919921875, 0.70794677734375, 0.7300567626953125, 0.752166748046875, 0.7742767333984375, 0.79638671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 13.0, 998.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344381958246231, -0.21398285031318665, -0.19352751970291138, -0.17307217419147491, -0.15261682868003845, -0.13216149806976318, -0.11170615255832672, -0.09125082194805145, -0.07079547643661499, -0.050340138375759125, -0.02988479658961296, -0.009429454803466797, 0.011025883257389069, 0.031481221318244934, 0.051936566829681396, 0.07239189743995667, 0.09284724295139313, 0.11330258101224899, 0.13375791907310486, 0.15421326458454132, 0.17466861009597778, 0.19512394070625305, 0.21557928621768951, 0.23603461682796478, 0.25648996233940125, 0.2769452929496765, 0.29740065336227417, 0.31785598397254944, 0.3383113145828247, 0.35876667499542236, 0.37922200560569763, 0.3996773362159729, 0.42013269662857056, 0.4405880272388458, 0.4610433876514435, 0.48149871826171875, 0.5019540786743164, 0.5224093794822693, 0.5428647398948669, 0.5633200407028198, 0.5837754011154175, 0.6042307615280151, 0.624686062335968, 0.6451414227485657, 0.6655967831611633, 0.6860520839691162, 0.7065074443817139, 0.7269628047943115, 0.7474181652069092, 0.7678735256195068, 0.7883288264274597, 0.8087841868400574, 0.829239547252655, 0.8496948480606079, 0.8701502084732056, 0.8906055688858032, 0.9110608696937561, 0.9315162301063538, 0.9519715309143066, 0.9724268913269043, 0.992882251739502, 1.0133376121520996, 1.0337929725646973, 1.0542482137680054, 1.074703574180603]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 5.0, 10.0, 9.0, 13.0, 18.0, 17.0, 41.0, 26.0, 33.0, 38.0, 43.0, 43.0, 46.0, 49.0, 48.0, 53.0, 63.0, 54.0, 49.0, 48.0, 41.0, 32.0, 41.0, 25.0, 28.0, 21.0, 17.0, 15.0, 19.0, 14.0, 8.0, 9.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05061835050582886, -0.049346547573804855, -0.04807474464178085, -0.04680294543504715, -0.04553114250302315, -0.044259339570999146, -0.04298754036426544, -0.04171573743224144, -0.04044393450021744, -0.039172131568193436, -0.037900328636169434, -0.03662852942943573, -0.03535672649741173, -0.034084923565387726, -0.03281312435865402, -0.03154132142663002, -0.030269518494606018, -0.028997715562582016, -0.027725914493203163, -0.02645411342382431, -0.025182310491800308, -0.023910507559776306, -0.022638706490397453, -0.0213669054210186, -0.0200951024889946, -0.018823299556970596, -0.017551498487591743, -0.01627969741821289, -0.015007894486188889, -0.013736092485487461, -0.012464290484786034, -0.011192488484084606, -0.009920686483383179, -0.008648884482681751, -0.007377082481980324, -0.006105280481278896, -0.004833478480577469, -0.0035616764798760414, -0.002289874479174614, -0.0010180724784731865, 0.00025372952222824097, 0.0015255315229296684, 0.002797333523631096, 0.004069135524332523, 0.005340937525033951, 0.006612739525735378, 0.007884541526436806, 0.009156343527138233, 0.01042814552783966, 0.011699947528541088, 0.012971749529242516, 0.014243551529943943, 0.01551535353064537, 0.016787156462669373, 0.018058957532048225, 0.019330758601427078, 0.02060256153345108, 0.021874364465475082, 0.023146165534853935, 0.024417966604232788, 0.02568976953625679, 0.026961572468280792, 0.028233373537659645, 0.029505174607038498, 0.0307769775390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 14.0, 7.0, 14.0, 17.0, 19.0, 20.0, 28.0, 31.0, 33.0, 37.0, 46.0, 31.0, 33.0, 38.0, 43.0, 57.0, 49.0, 39.0, 41.0, 41.0, 44.0, 48.0, 27.0, 32.0, 26.0, 26.0, 24.0, 19.0, 21.0, 12.0, 15.0, 12.0, 11.0, 6.0, 7.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.1484375, -15.578125, -15.0078125, -14.4375, -13.8671875, -13.296875, -12.7265625, -12.15625, -11.5859375, -11.015625, -10.4453125, -9.875, -9.3046875, -8.734375, -8.1640625, -7.59375, -7.0234375, -6.453125, -5.8828125, -5.3125, -4.7421875, -4.171875, -3.6015625, -3.03125, -2.4609375, -1.890625, -1.3203125, -0.75, -0.1796875, 0.390625, 0.9609375, 1.53125, 2.1015625, 2.671875, 3.2421875, 3.8125, 4.3828125, 4.953125, 5.5234375, 6.09375, 6.6640625, 7.234375, 7.8046875, 8.375, 8.9453125, 9.515625, 10.0859375, 10.65625, 11.2265625, 11.796875, 12.3671875, 12.9375, 13.5078125, 14.078125, 14.6484375, 15.21875, 15.7890625, 16.359375, 16.9296875, 17.5, 18.0703125, 18.640625, 19.2109375, 19.78125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 9.0, 17.0, 12.0, 24.0, 32.0, 28.0, 35.0, 62.0, 83.0, 107.0, 176.0, 233.0, 351.0, 534.0, 903.0, 1591.0, 3207.0, 7541.0, 20627.0, 116183.0, 825612.0, 46312.0, 13477.0, 5560.0, 2500.0, 1220.0, 697.0, 420.0, 267.0, 189.0, 138.0, 105.0, 78.0, 55.0, 44.0, 37.0, 23.0, 16.0, 19.0, 15.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.875, -37.54833984375, -36.2216796875, -34.89501953125, -33.568359375, -32.24169921875, -30.9150390625, -29.58837890625, -28.26171875, -26.93505859375, -25.6083984375, -24.28173828125, -22.955078125, -21.62841796875, -20.3017578125, -18.97509765625, -17.6484375, -16.32177734375, -14.9951171875, -13.66845703125, -12.341796875, -11.01513671875, -9.6884765625, -8.36181640625, -7.03515625, -5.70849609375, -4.3818359375, -3.05517578125, -1.728515625, -0.40185546875, 0.9248046875, 2.25146484375, 3.578125, 4.90478515625, 6.2314453125, 7.55810546875, 8.884765625, 10.21142578125, 11.5380859375, 12.86474609375, 14.19140625, 15.51806640625, 16.8447265625, 18.17138671875, 19.498046875, 20.82470703125, 22.1513671875, 23.47802734375, 24.8046875, 26.13134765625, 27.4580078125, 28.78466796875, 30.111328125, 31.43798828125, 32.7646484375, 34.09130859375, 35.41796875, 36.74462890625, 38.0712890625, 39.39794921875, 40.724609375, 42.05126953125, 43.3779296875, 44.70458984375, 46.03125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 12.0, 11.0, 23.0, 18.0, 16.0, 18.0, 17.0, 22.0, 35.0, 43.0, 49.0, 45.0, 41.0, 60.0, 75.0, 130.0, 1702.0, 192.0, 88.0, 60.0, 37.0, 50.0, 42.0, 36.0, 22.0, 33.0, 26.0, 21.0, 14.0, 17.0, 17.0, 15.0, 7.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.9375, -44.4375, -42.9375, -41.4375, -39.9375, -38.4375, -36.9375, -35.4375, -33.9375, -32.4375, -30.9375, -29.4375, -27.9375, -26.4375, -24.9375, -23.4375, -21.9375, -20.4375, -18.9375, -17.4375, -15.9375, -14.4375, -12.9375, -11.4375, -9.9375, -8.4375, -6.9375, -5.4375, -3.9375, -2.4375, -0.9375, 0.5625, 2.0625, 3.5625, 5.0625, 6.5625, 8.0625, 9.5625, 11.0625, 12.5625, 14.0625, 15.5625, 17.0625, 18.5625, 20.0625, 21.5625, 23.0625, 24.5625, 26.0625, 27.5625, 29.0625, 30.5625, 32.0625, 33.5625, 35.0625, 36.5625, 38.0625, 39.5625, 41.0625, 42.5625, 44.0625, 45.5625, 47.0625, 48.5625, 50.0625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 9.0, 13.0, 19.0, 18.0, 19.0, 32.0, 29.0, 43.0, 31.0, 52.0, 70.0, 136.0, 206.0, 468.0, 2515.0, 38791.0, 3073519.0, 26538.0, 2064.0, 440.0, 170.0, 109.0, 79.0, 67.0, 42.0, 27.0, 22.0, 20.0, 23.0, 23.0, 23.0, 13.0, 15.0, 5.0, 8.0, 5.0, 4.0, 2.0, 9.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-126.375, -122.5966796875, -118.818359375, -115.0400390625, -111.26171875, -107.4833984375, -103.705078125, -99.9267578125, -96.1484375, -92.3701171875, -88.591796875, -84.8134765625, -81.03515625, -77.2568359375, -73.478515625, -69.7001953125, -65.921875, -62.1435546875, -58.365234375, -54.5869140625, -50.80859375, -47.0302734375, -43.251953125, -39.4736328125, -35.6953125, -31.9169921875, -28.138671875, -24.3603515625, -20.58203125, -16.8037109375, -13.025390625, -9.2470703125, -5.46875, -1.6904296875, 2.087890625, 5.8662109375, 9.64453125, 13.4228515625, 17.201171875, 20.9794921875, 24.7578125, 28.5361328125, 32.314453125, 36.0927734375, 39.87109375, 43.6494140625, 47.427734375, 51.2060546875, 54.984375, 58.7626953125, 62.541015625, 66.3193359375, 70.09765625, 73.8759765625, 77.654296875, 81.4326171875, 85.2109375, 88.9892578125, 92.767578125, 96.5458984375, 100.32421875, 104.1025390625, 107.880859375, 111.6591796875, 115.4375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 38.0, 91.0, 259.0, 325.0, 190.0, 63.0, 26.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.94204711914062, -183.37054443359375, -179.79905700683594, -176.22755432128906, -172.65606689453125, -169.08456420898438, -165.5130615234375, -161.9415740966797, -158.3700714111328, -154.79856872558594, -151.22708129882812, -147.65557861328125, -144.08407592773438, -140.51258850097656, -136.9410858154297, -133.36959838867188, -129.798095703125, -126.22660064697266, -122.65510559082031, -119.08360290527344, -115.5121078491211, -111.94061279296875, -108.36911010742188, -104.79761505126953, -101.22611999511719, -97.65462493896484, -94.0831298828125, -90.51162719726562, -86.94013214111328, -83.36863708496094, -79.79713439941406, -76.22563934326172, -72.65414428710938, -69.08264923095703, -65.51115417480469, -61.93965148925781, -58.36815643310547, -54.796661376953125, -51.225162506103516, -47.653663635253906, -44.08216857910156, -40.51067352294922, -36.93917465209961, -33.36767578125, -29.796180725097656, -26.22468376159668, -22.653186798095703, -19.081689834594727, -15.51019287109375, -11.938695907592773, -8.367198944091797, -4.79570198059082, -1.2242050170898438, 2.347291946411133, 5.918788909912109, 9.490285873413086, 13.061782836914062, 16.63327980041504, 20.204776763916016, 23.776273727416992, 27.34777069091797, 30.919267654418945, 34.49076461791992, 38.06226348876953, 41.633758544921875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 7.0, 7.0, 17.0, 19.0, 18.0, 21.0, 24.0, 38.0, 30.0, 26.0, 31.0, 40.0, 35.0, 41.0, 37.0, 51.0, 48.0, 43.0, 43.0, 42.0, 43.0, 47.0, 32.0, 33.0, 43.0, 25.0, 25.0, 18.0, 22.0, 12.0, 21.0, 12.0, 14.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.14675903320312, -117.2154312133789, -113.28410339355469, -109.35276794433594, -105.42144012451172, -101.4901123046875, -97.55877685546875, -93.62744903564453, -89.69612121582031, -85.7647933959961, -81.83346557617188, -77.90213012695312, -73.9708023071289, -70.03947448730469, -66.10813903808594, -62.17681121826172, -58.2454833984375, -54.31415557861328, -50.3828239440918, -46.45149230957031, -42.520164489746094, -38.588836669921875, -34.65750503540039, -30.72617530822754, -26.794845581054688, -22.863515853881836, -18.932186126708984, -15.000856399536133, -11.069526672363281, -7.13819694519043, -3.206867218017578, 0.7244625091552734, 4.655792236328125, 8.587121963500977, 12.518451690673828, 16.44978141784668, 20.38111114501953, 24.312440872192383, 28.243770599365234, 32.17510223388672, 36.10643005371094, 40.037757873535156, 43.96908950805664, 47.900421142578125, 51.831748962402344, 55.76307678222656, 59.69440841674805, 63.62574005126953, 67.55706787109375, 71.48839569091797, 75.41972351074219, 79.35105895996094, 83.28238677978516, 87.21371459960938, 91.14505004882812, 95.07637786865234, 99.00770568847656, 102.93903350830078, 106.870361328125, 110.80169677734375, 114.73302459716797, 118.66435241699219, 122.59568786621094, 126.52701568603516, 130.45834350585938]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 8.0, 8.0, 9.0, 21.0, 14.0, 25.0, 28.0, 26.0, 24.0, 49.0, 36.0, 23.0, 36.0, 51.0, 33.0, 38.0, 51.0, 45.0, 39.0, 34.0, 56.0, 45.0, 28.0, 38.0, 28.0, 24.0, 20.0, 25.0, 26.0, 18.0, 18.0, 13.0, 15.0, 7.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.947021484375, -15.37841796875, -14.809814453125, -14.2412109375, -13.672607421875, -13.10400390625, -12.535400390625, -11.966796875, -11.398193359375, -10.82958984375, -10.260986328125, -9.6923828125, -9.123779296875, -8.55517578125, -7.986572265625, -7.41796875, -6.849365234375, -6.28076171875, -5.712158203125, -5.1435546875, -4.574951171875, -4.00634765625, -3.437744140625, -2.869140625, -2.300537109375, -1.73193359375, -1.163330078125, -0.5947265625, -0.026123046875, 0.54248046875, 1.111083984375, 1.6796875, 2.248291015625, 2.81689453125, 3.385498046875, 3.9541015625, 4.522705078125, 5.09130859375, 5.659912109375, 6.228515625, 6.797119140625, 7.36572265625, 7.934326171875, 8.5029296875, 9.071533203125, 9.64013671875, 10.208740234375, 10.77734375, 11.345947265625, 11.91455078125, 12.483154296875, 13.0517578125, 13.620361328125, 14.18896484375, 14.757568359375, 15.326171875, 15.894775390625, 16.46337890625, 17.031982421875, 17.6005859375, 18.169189453125, 18.73779296875, 19.306396484375, 19.875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 17.0, 10.0, 11.0, 31.0, 35.0, 42.0, 79.0, 106.0, 162.0, 234.0, 284.0, 481.0, 720.0, 1070.0, 1714.0, 2772.0, 4913.0, 9476.0, 19690.0, 51195.0, 219985.0, 1248779.0, 2039224.0, 453061.0, 84242.0, 27476.0, 12640.0, 6294.0, 3630.0, 2088.0, 1219.0, 781.0, 545.0, 347.0, 269.0, 187.0, 119.0, 107.0, 58.0, 41.0, 35.0, 26.0, 18.0, 21.0, 10.0, 6.0, 2.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.28125, -25.43896484375, -24.5966796875, -23.75439453125, -22.912109375, -22.06982421875, -21.2275390625, -20.38525390625, -19.54296875, -18.70068359375, -17.8583984375, -17.01611328125, -16.173828125, -15.33154296875, -14.4892578125, -13.64697265625, -12.8046875, -11.96240234375, -11.1201171875, -10.27783203125, -9.435546875, -8.59326171875, -7.7509765625, -6.90869140625, -6.06640625, -5.22412109375, -4.3818359375, -3.53955078125, -2.697265625, -1.85498046875, -1.0126953125, -0.17041015625, 0.671875, 1.51416015625, 2.3564453125, 3.19873046875, 4.041015625, 4.88330078125, 5.7255859375, 6.56787109375, 7.41015625, 8.25244140625, 9.0947265625, 9.93701171875, 10.779296875, 11.62158203125, 12.4638671875, 13.30615234375, 14.1484375, 14.99072265625, 15.8330078125, 16.67529296875, 17.517578125, 18.35986328125, 19.2021484375, 20.04443359375, 20.88671875, 21.72900390625, 22.5712890625, 23.41357421875, 24.255859375, 25.09814453125, 25.9404296875, 26.78271484375, 27.625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 13.0, 19.0, 27.0, 43.0, 74.0, 109.0, 214.0, 370.0, 688.0, 916.0, 625.0, 353.0, 212.0, 116.0, 72.0, 53.0, 32.0, 27.0, 19.0, 19.0, 7.0, 12.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.59375, -41.28271484375, -39.9716796875, -38.66064453125, -37.349609375, -36.03857421875, -34.7275390625, -33.41650390625, -32.10546875, -30.79443359375, -29.4833984375, -28.17236328125, -26.861328125, -25.55029296875, -24.2392578125, -22.92822265625, -21.6171875, -20.30615234375, -18.9951171875, -17.68408203125, -16.373046875, -15.06201171875, -13.7509765625, -12.43994140625, -11.12890625, -9.81787109375, -8.5068359375, -7.19580078125, -5.884765625, -4.57373046875, -3.2626953125, -1.95166015625, -0.640625, 0.67041015625, 1.9814453125, 3.29248046875, 4.603515625, 5.91455078125, 7.2255859375, 8.53662109375, 9.84765625, 11.15869140625, 12.4697265625, 13.78076171875, 15.091796875, 16.40283203125, 17.7138671875, 19.02490234375, 20.3359375, 21.64697265625, 22.9580078125, 24.26904296875, 25.580078125, 26.89111328125, 28.2021484375, 29.51318359375, 30.82421875, 32.13525390625, 33.4462890625, 34.75732421875, 36.068359375, 37.37939453125, 38.6904296875, 40.00146484375, 41.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 2.0, 8.0, 7.0, 13.0, 10.0, 18.0, 39.0, 41.0, 76.0, 122.0, 258.0, 539.0, 1556.0, 5682.0, 37895.0, 2050940.0, 2050177.0, 38406.0, 5870.0, 1538.0, 538.0, 248.0, 116.0, 66.0, 44.0, 23.0, 18.0, 10.0, 5.0, 3.0, 1.0, 4.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-105.625, -102.32421875, -99.0234375, -95.72265625, -92.421875, -89.12109375, -85.8203125, -82.51953125, -79.21875, -75.91796875, -72.6171875, -69.31640625, -66.015625, -62.71484375, -59.4140625, -56.11328125, -52.8125, -49.51171875, -46.2109375, -42.91015625, -39.609375, -36.30859375, -33.0078125, -29.70703125, -26.40625, -23.10546875, -19.8046875, -16.50390625, -13.203125, -9.90234375, -6.6015625, -3.30078125, 0.0, 3.30078125, 6.6015625, 9.90234375, 13.203125, 16.50390625, 19.8046875, 23.10546875, 26.40625, 29.70703125, 33.0078125, 36.30859375, 39.609375, 42.91015625, 46.2109375, 49.51171875, 52.8125, 56.11328125, 59.4140625, 62.71484375, 66.015625, 69.31640625, 72.6171875, 75.91796875, 79.21875, 82.51953125, 85.8203125, 89.12109375, 92.421875, 95.72265625, 99.0234375, 102.32421875, 105.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 15.0, 40.0, 88.0, 175.0, 251.0, 206.0, 110.0, 58.0, 29.0, 16.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.80262756347656, -212.37191772460938, -204.9412078857422, -197.510498046875, -190.0797882080078, -182.64907836914062, -175.21836853027344, -167.78765869140625, -160.35694885253906, -152.92623901367188, -145.4955291748047, -138.0648193359375, -130.6341094970703, -123.20339965820312, -115.77268981933594, -108.34197998046875, -100.91127014160156, -93.48056030273438, -86.04985046386719, -78.619140625, -71.18843078613281, -63.757720947265625, -56.32701110839844, -48.89630126953125, -41.46559143066406, -34.034881591796875, -26.604171752929688, -19.1734619140625, -11.742752075195312, -4.312042236328125, 3.1186676025390625, 10.54937744140625, 17.980087280273438, 25.410797119140625, 32.84150695800781, 40.272216796875, 47.70292663574219, 55.133636474609375, 62.56434631347656, 69.99505615234375, 77.42576599121094, 84.85647583007812, 92.28718566894531, 99.7178955078125, 107.14860534667969, 114.57931518554688, 122.01002502441406, 129.44073486328125, 136.87144470214844, 144.30215454101562, 151.7328643798828, 159.16357421875, 166.5942840576172, 174.02499389648438, 181.45570373535156, 188.88641357421875, 196.31712341308594, 203.74783325195312, 211.1785430908203, 218.6092529296875, 226.0399627685547, 233.47067260742188, 240.90138244628906, 248.33209228515625, 255.76280212402344]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 8.0, 4.0, 7.0, 13.0, 11.0, 15.0, 16.0, 24.0, 19.0, 31.0, 31.0, 27.0, 40.0, 32.0, 40.0, 36.0, 33.0, 44.0, 36.0, 41.0, 40.0, 45.0, 49.0, 38.0, 39.0, 33.0, 31.0, 20.0, 25.0, 25.0, 24.0, 19.0, 15.0, 14.0, 10.0, 6.0, 13.0, 12.0, 6.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-112.84909057617188, -109.6712875366211, -106.49348449707031, -103.31568908691406, -100.13788604736328, -96.9600830078125, -93.78228759765625, -90.60448455810547, -87.42668151855469, -84.2488784790039, -81.07107543945312, -77.89328002929688, -74.7154769897461, -71.53767395019531, -68.35987854003906, -65.18207550048828, -62.0042724609375, -58.82646942138672, -55.6486701965332, -52.47087097167969, -49.293067932128906, -46.115264892578125, -42.93746566772461, -39.759666442871094, -36.58186340332031, -33.40406036376953, -30.226261138916016, -27.048460006713867, -23.87065887451172, -20.69285774230957, -17.515056610107422, -14.337255477905273, -11.159446716308594, -7.981645584106445, -4.803844451904297, -1.6260433197021484, 1.5517578125, 4.729558944702148, 7.907360076904297, 11.085161209106445, 14.262962341308594, 17.440763473510742, 20.61856460571289, 23.79636573791504, 26.974166870117188, 30.151968002319336, 33.329769134521484, 36.507568359375, 39.68537139892578, 42.86317443847656, 46.04097366333008, 49.218772888183594, 52.396575927734375, 55.574378967285156, 58.75217819213867, 61.92997741699219, 65.10778045654297, 68.28558349609375, 71.46337890625, 74.64118194580078, 77.81898498535156, 80.99678802490234, 84.17459106445312, 87.35238647460938, 90.53018951416016]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 12.0, 10.0, 19.0, 17.0, 21.0, 20.0, 21.0, 24.0, 29.0, 40.0, 34.0, 53.0, 49.0, 54.0, 42.0, 41.0, 52.0, 32.0, 45.0, 44.0, 40.0, 33.0, 35.0, 44.0, 26.0, 28.0, 16.0, 14.0, 16.0, 12.0, 16.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.5146484375, -16.888671875, -16.2626953125, -15.63671875, -15.0107421875, -14.384765625, -13.7587890625, -13.1328125, -12.5068359375, -11.880859375, -11.2548828125, -10.62890625, -10.0029296875, -9.376953125, -8.7509765625, -8.125, -7.4990234375, -6.873046875, -6.2470703125, -5.62109375, -4.9951171875, -4.369140625, -3.7431640625, -3.1171875, -2.4912109375, -1.865234375, -1.2392578125, -0.61328125, 0.0126953125, 0.638671875, 1.2646484375, 1.890625, 2.5166015625, 3.142578125, 3.7685546875, 4.39453125, 5.0205078125, 5.646484375, 6.2724609375, 6.8984375, 7.5244140625, 8.150390625, 8.7763671875, 9.40234375, 10.0283203125, 10.654296875, 11.2802734375, 11.90625, 12.5322265625, 13.158203125, 13.7841796875, 14.41015625, 15.0361328125, 15.662109375, 16.2880859375, 16.9140625, 17.5400390625, 18.166015625, 18.7919921875, 19.41796875, 20.0439453125, 20.669921875, 21.2958984375, 21.921875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 13.0, 23.0, 33.0, 37.0, 61.0, 86.0, 134.0, 209.0, 282.0, 451.0, 667.0, 1016.0, 1445.0, 2141.0, 3124.0, 4751.0, 7268.0, 10926.0, 16641.0, 25959.0, 41367.0, 66914.0, 107649.0, 164079.0, 192996.0, 147133.0, 92905.0, 57577.0, 35951.0, 22978.0, 14579.0, 9526.0, 6507.0, 4233.0, 2873.0, 1950.0, 1353.0, 824.0, 596.0, 432.0, 266.0, 206.0, 122.0, 85.0, 64.0, 38.0, 32.0, 23.0, 11.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.21484375, -2.1484375, -2.08203125, -2.015625, -1.94921875, -1.8828125, -1.81640625, -1.75, -1.68359375, -1.6171875, -1.55078125, -1.484375, -1.41796875, -1.3515625, -1.28515625, -1.21875, -1.15234375, -1.0859375, -1.01953125, -0.953125, -0.88671875, -0.8203125, -0.75390625, -0.6875, -0.62109375, -0.5546875, -0.48828125, -0.421875, -0.35546875, -0.2890625, -0.22265625, -0.15625, -0.08984375, -0.0234375, 0.04296875, 0.109375, 0.17578125, 0.2421875, 0.30859375, 0.375, 0.44140625, 0.5078125, 0.57421875, 0.640625, 0.70703125, 0.7734375, 0.83984375, 0.90625, 0.97265625, 1.0390625, 1.10546875, 1.171875, 1.23828125, 1.3046875, 1.37109375, 1.4375, 1.50390625, 1.5703125, 1.63671875, 1.703125, 1.76953125, 1.8359375, 1.90234375, 1.96875, 2.03515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 3.0, 15.0, 12.0, 13.0, 12.0, 28.0, 20.0, 22.0, 30.0, 27.0, 28.0, 33.0, 42.0, 35.0, 48.0, 37.0, 40.0, 1076.0, 43.0, 43.0, 42.0, 45.0, 38.0, 34.0, 38.0, 32.0, 30.0, 26.0, 18.0, 21.0, 25.0, 11.0, 12.0, 10.0, 9.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.37158203125, -11.9697265625, -11.56787109375, -11.166015625, -10.76416015625, -10.3623046875, -9.96044921875, -9.55859375, -9.15673828125, -8.7548828125, -8.35302734375, -7.951171875, -7.54931640625, -7.1474609375, -6.74560546875, -6.34375, -5.94189453125, -5.5400390625, -5.13818359375, -4.736328125, -4.33447265625, -3.9326171875, -3.53076171875, -3.12890625, -2.72705078125, -2.3251953125, -1.92333984375, -1.521484375, -1.11962890625, -0.7177734375, -0.31591796875, 0.0859375, 0.48779296875, 0.8896484375, 1.29150390625, 1.693359375, 2.09521484375, 2.4970703125, 2.89892578125, 3.30078125, 3.70263671875, 4.1044921875, 4.50634765625, 4.908203125, 5.31005859375, 5.7119140625, 6.11376953125, 6.515625, 6.91748046875, 7.3193359375, 7.72119140625, 8.123046875, 8.52490234375, 8.9267578125, 9.32861328125, 9.73046875, 10.13232421875, 10.5341796875, 10.93603515625, 11.337890625, 11.73974609375, 12.1416015625, 12.54345703125, 12.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 17.0, 11.0, 20.0, 27.0, 49.0, 67.0, 97.0, 150.0, 223.0, 327.0, 529.0, 724.0, 1158.0, 1787.0, 2723.0, 4545.0, 6907.0, 11304.0, 18385.0, 30085.0, 50352.0, 84460.0, 137591.0, 1224226.0, 206976.0, 123975.0, 74994.0, 44669.0, 26678.0, 16498.0, 10034.0, 6381.0, 3922.0, 2506.0, 1662.0, 986.0, 702.0, 433.0, 311.0, 197.0, 114.0, 101.0, 71.0, 53.0, 34.0, 18.0, 16.0, 9.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.58203125, -1.5308074951171875, -1.479583740234375, -1.4283599853515625, -1.37713623046875, -1.3259124755859375, -1.274688720703125, -1.2234649658203125, -1.1722412109375, -1.1210174560546875, -1.069793701171875, -1.0185699462890625, -0.96734619140625, -0.9161224365234375, -0.864898681640625, -0.8136749267578125, -0.762451171875, -0.7112274169921875, -0.660003662109375, -0.6087799072265625, -0.55755615234375, -0.5063323974609375, -0.455108642578125, -0.4038848876953125, -0.3526611328125, -0.3014373779296875, -0.250213623046875, -0.1989898681640625, -0.14776611328125, -0.0965423583984375, -0.045318603515625, 0.0059051513671875, 0.05712890625, 0.1083526611328125, 0.159576416015625, 0.2108001708984375, 0.26202392578125, 0.3132476806640625, 0.364471435546875, 0.4156951904296875, 0.4669189453125, 0.5181427001953125, 0.569366455078125, 0.6205902099609375, 0.67181396484375, 0.7230377197265625, 0.774261474609375, 0.8254852294921875, 0.876708984375, 0.9279327392578125, 0.979156494140625, 1.0303802490234375, 1.08160400390625, 1.1328277587890625, 1.184051513671875, 1.2352752685546875, 1.2864990234375, 1.3377227783203125, 1.388946533203125, 1.4401702880859375, 1.49139404296875, 1.5426177978515625, 1.593841552734375, 1.6450653076171875, 1.6962890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 11.0, 16.0, 18.0, 22.0, 23.0, 11.0, 33.0, 22.0, 36.0, 37.0, 39.0, 71.0, 48.0, 39.0, 48.0, 47.0, 57.0, 37.0, 39.0, 41.0, 37.0, 35.0, 30.0, 29.0, 27.0, 20.0, 9.0, 19.0, 5.0, 10.0, 12.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0205841064453125, -0.01998114585876465, -0.019378185272216797, -0.018775224685668945, -0.018172264099121094, -0.017569303512573242, -0.01696634292602539, -0.01636338233947754, -0.015760421752929688, -0.015157461166381836, -0.014554500579833984, -0.013951539993286133, -0.013348579406738281, -0.01274561882019043, -0.012142658233642578, -0.011539697647094727, -0.010936737060546875, -0.010333776473999023, -0.009730815887451172, -0.00912785530090332, -0.008524894714355469, -0.007921934127807617, -0.007318973541259766, -0.006716012954711914, -0.0061130523681640625, -0.005510091781616211, -0.004907131195068359, -0.004304170608520508, -0.0037012100219726562, -0.0030982494354248047, -0.002495288848876953, -0.0018923282623291016, -0.00128936767578125, -0.0006864070892333984, -8.344650268554688e-05, 0.0005195140838623047, 0.0011224746704101562, 0.0017254352569580078, 0.0023283958435058594, 0.002931356430053711, 0.0035343170166015625, 0.004137277603149414, 0.004740238189697266, 0.005343198776245117, 0.005946159362792969, 0.00654911994934082, 0.007152080535888672, 0.0077550411224365234, 0.008358001708984375, 0.008960962295532227, 0.009563922882080078, 0.01016688346862793, 0.010769844055175781, 0.011372804641723633, 0.011975765228271484, 0.012578725814819336, 0.013181686401367188, 0.013784646987915039, 0.01438760757446289, 0.014990568161010742, 0.015593528747558594, 0.016196489334106445, 0.016799449920654297, 0.01740241050720215, 0.01800537109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 4.0, 11.0, 9.0, 10.0, 13.0, 11.0, 17.0, 20.0, 22.0, 34.0, 30.0, 45.0, 62.0, 73.0, 95.0, 127.0, 144.0, 248.0, 362.0, 724.0, 6963.0, 1015027.0, 22288.0, 897.0, 407.0, 229.0, 160.0, 101.0, 70.0, 68.0, 59.0, 39.0, 33.0, 27.0, 25.0, 13.0, 10.0, 16.0, 11.0, 10.0, 7.0, 4.0, 4.0, 5.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36572265625, -0.3537712097167969, -0.34181976318359375, -0.3298683166503906, -0.3179168701171875, -0.3059654235839844, -0.29401397705078125, -0.2820625305175781, -0.270111083984375, -0.2581596374511719, -0.24620819091796875, -0.23425674438476562, -0.2223052978515625, -0.21035385131835938, -0.19840240478515625, -0.18645095825195312, -0.17449951171875, -0.16254806518554688, -0.15059661865234375, -0.13864517211914062, -0.1266937255859375, -0.11474227905273438, -0.10279083251953125, -0.09083938598632812, -0.078887939453125, -0.06693649291992188, -0.05498504638671875, -0.043033599853515625, -0.0310821533203125, -0.019130706787109375, -0.00717926025390625, 0.004772186279296875, 0.0167236328125, 0.028675079345703125, 0.04062652587890625, 0.052577972412109375, 0.0645294189453125, 0.07648086547851562, 0.08843231201171875, 0.10038375854492188, 0.112335205078125, 0.12428665161132812, 0.13623809814453125, 0.14818954467773438, 0.1601409912109375, 0.17209243774414062, 0.18404388427734375, 0.19599533081054688, 0.20794677734375, 0.21989822387695312, 0.23184967041015625, 0.24380111694335938, 0.2557525634765625, 0.2677040100097656, 0.27965545654296875, 0.2916069030761719, 0.303558349609375, 0.3155097961425781, 0.32746124267578125, 0.3394126892089844, 0.3513641357421875, 0.3633155822753906, 0.37526702880859375, 0.3872184753417969, 0.399169921875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 989.0, 23.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3351563811302185, -0.3203372359275818, -0.30551812052726746, -0.29069897532463074, -0.275879830121994, -0.2610607147216797, -0.24624156951904297, -0.23142242431640625, -0.21660329401493073, -0.2017841637134552, -0.18696501851081848, -0.17214588820934296, -0.15732675790786743, -0.1425076127052307, -0.1276884824037552, -0.11286934465169907, -0.09805020689964294, -0.08323106914758682, -0.0684119313955307, -0.053592801094055176, -0.038773663341999054, -0.023954525589942932, -0.009135395288467407, 0.005683742463588715, 0.020502880215644836, 0.03532201796770096, 0.05014115199446678, 0.0649602860212326, 0.07977942377328873, 0.09459856152534485, 0.10941769182682037, 0.1242368295788765, 0.13905596733093262, 0.15387509763240814, 0.16869424283504486, 0.18351337313652039, 0.1983325183391571, 0.21315164864063263, 0.22797077894210815, 0.24278992414474487, 0.2576090693473816, 0.2724282145500183, 0.28724732995033264, 0.30206647515296936, 0.3168856203556061, 0.3317047357559204, 0.34652388095855713, 0.36134302616119385, 0.3761621415615082, 0.3909812867641449, 0.40580040216445923, 0.42061954736709595, 0.43543869256973267, 0.4502578377723694, 0.4650769531726837, 0.47989609837532043, 0.49471521377563477, 0.5095343589782715, 0.5243535041809082, 0.5391726493835449, 0.5539917349815369, 0.5688108801841736, 0.5836300253868103, 0.598449170589447, 0.6132683157920837]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 8.0, 6.0, 9.0, 10.0, 16.0, 10.0, 14.0, 15.0, 18.0, 20.0, 24.0, 36.0, 40.0, 33.0, 44.0, 38.0, 31.0, 44.0, 46.0, 28.0, 37.0, 48.0, 27.0, 54.0, 37.0, 33.0, 36.0, 37.0, 34.0, 26.0, 24.0, 22.0, 19.0, 13.0, 14.0, 15.0, 9.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.029133617877960205, -0.028279069811105728, -0.0274245236068964, -0.026569977402687073, -0.025715429335832596, -0.02486088126897812, -0.02400633506476879, -0.023151788860559464, -0.022297240793704987, -0.02144269272685051, -0.020588146522641182, -0.019733600318431854, -0.018879052251577377, -0.0180245041847229, -0.017169957980513573, -0.016315411776304245, -0.015460863709449768, -0.014606316573917866, -0.013751769438385963, -0.012897222302854061, -0.012042675167322159, -0.011188128031790257, -0.010333580896258354, -0.009479033760726452, -0.00862448662519455, -0.007769939489662647, -0.006915392354130745, -0.006060845218598843, -0.00520629808306694, -0.004351750947535038, -0.0034972038120031357, -0.0026426566764712334, -0.001788109540939331, -0.0009335624054074287, -7.901526987552643e-05, 0.0007755318656563759, 0.0016300790011882782, 0.0024846261367201805, 0.003339173272252083, 0.004193720407783985, 0.0050482675433158875, 0.00590281467884779, 0.006757361814379692, 0.007611908949911594, 0.008466456085443497, 0.009321003220975399, 0.010175550356507301, 0.011030097492039204, 0.011884644627571106, 0.012739191763103008, 0.01359373889863491, 0.014448286034166813, 0.015302833169698715, 0.016157381236553192, 0.01701192744076252, 0.017866473644971848, 0.018721021711826324, 0.0195755697786808, 0.02043011598289013, 0.021284662187099457, 0.022139210253953934, 0.02299375832080841, 0.02384830452501774, 0.024702850729227066, 0.025557398796081543]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 19.0, 17.0, 21.0, 19.0, 22.0, 24.0, 29.0, 40.0, 34.0, 53.0, 49.0, 54.0, 42.0, 41.0, 52.0, 32.0, 46.0, 44.0, 39.0, 33.0, 35.0, 44.0, 26.0, 28.0, 16.0, 14.0, 16.0, 12.0, 16.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.5146484375, -16.888671875, -16.2626953125, -15.63671875, -15.0107421875, -14.384765625, -13.7587890625, -13.1328125, -12.5068359375, -11.880859375, -11.2548828125, -10.62890625, -10.0029296875, -9.376953125, -8.7509765625, -8.125, -7.4990234375, -6.873046875, -6.2470703125, -5.62109375, -4.9951171875, -4.369140625, -3.7431640625, -3.1171875, -2.4912109375, -1.865234375, -1.2392578125, -0.61328125, 0.0126953125, 0.638671875, 1.2646484375, 1.890625, 2.5166015625, 3.142578125, 3.7685546875, 4.39453125, 5.0205078125, 5.646484375, 6.2724609375, 6.8984375, 7.5244140625, 8.150390625, 8.7763671875, 9.40234375, 10.0283203125, 10.654296875, 11.2802734375, 11.90625, 12.5322265625, 13.158203125, 13.7841796875, 14.41015625, 15.0361328125, 15.662109375, 16.2880859375, 16.9140625, 17.5400390625, 18.166015625, 18.7919921875, 19.41796875, 20.0439453125, 20.669921875, 21.2958984375, 21.921875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 10.0, 8.0, 10.0, 18.0, 29.0, 37.0, 62.0, 74.0, 96.0, 142.0, 212.0, 310.0, 462.0, 704.0, 1092.0, 1891.0, 3137.0, 5899.0, 11618.0, 25956.0, 75306.0, 351236.0, 427334.0, 86200.0, 29051.0, 12481.0, 6336.0, 3372.0, 2041.0, 1186.0, 651.0, 501.0, 338.0, 211.0, 157.0, 130.0, 69.0, 55.0, 42.0, 26.0, 20.0, 10.0, 7.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.0, -26.15771484375, -25.3154296875, -24.47314453125, -23.630859375, -22.78857421875, -21.9462890625, -21.10400390625, -20.26171875, -19.41943359375, -18.5771484375, -17.73486328125, -16.892578125, -16.05029296875, -15.2080078125, -14.36572265625, -13.5234375, -12.68115234375, -11.8388671875, -10.99658203125, -10.154296875, -9.31201171875, -8.4697265625, -7.62744140625, -6.78515625, -5.94287109375, -5.1005859375, -4.25830078125, -3.416015625, -2.57373046875, -1.7314453125, -0.88916015625, -0.046875, 0.79541015625, 1.6376953125, 2.47998046875, 3.322265625, 4.16455078125, 5.0068359375, 5.84912109375, 6.69140625, 7.53369140625, 8.3759765625, 9.21826171875, 10.060546875, 10.90283203125, 11.7451171875, 12.58740234375, 13.4296875, 14.27197265625, 15.1142578125, 15.95654296875, 16.798828125, 17.64111328125, 18.4833984375, 19.32568359375, 20.16796875, 21.01025390625, 21.8525390625, 22.69482421875, 23.537109375, 24.37939453125, 25.2216796875, 26.06396484375, 26.90625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 10.0, 9.0, 10.0, 16.0, 13.0, 16.0, 9.0, 22.0, 29.0, 26.0, 30.0, 47.0, 35.0, 46.0, 65.0, 63.0, 93.0, 278.0, 1560.0, 143.0, 92.0, 68.0, 44.0, 45.0, 39.0, 27.0, 34.0, 27.0, 27.0, 24.0, 12.0, 14.0, 17.0, 9.0, 10.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.03125, -46.4931640625, -44.955078125, -43.4169921875, -41.87890625, -40.3408203125, -38.802734375, -37.2646484375, -35.7265625, -34.1884765625, -32.650390625, -31.1123046875, -29.57421875, -28.0361328125, -26.498046875, -24.9599609375, -23.421875, -21.8837890625, -20.345703125, -18.8076171875, -17.26953125, -15.7314453125, -14.193359375, -12.6552734375, -11.1171875, -9.5791015625, -8.041015625, -6.5029296875, -4.96484375, -3.4267578125, -1.888671875, -0.3505859375, 1.1875, 2.7255859375, 4.263671875, 5.8017578125, 7.33984375, 8.8779296875, 10.416015625, 11.9541015625, 13.4921875, 15.0302734375, 16.568359375, 18.1064453125, 19.64453125, 21.1826171875, 22.720703125, 24.2587890625, 25.796875, 27.3349609375, 28.873046875, 30.4111328125, 31.94921875, 33.4873046875, 35.025390625, 36.5634765625, 38.1015625, 39.6396484375, 41.177734375, 42.7158203125, 44.25390625, 45.7919921875, 47.330078125, 48.8681640625, 50.40625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 20.0, 14.0, 26.0, 42.0, 63.0, 85.0, 141.0, 272.0, 799.0, 4174.0, 49132.0, 2977227.0, 105410.0, 6443.0, 1021.0, 327.0, 162.0, 108.0, 76.0, 40.0, 27.0, 24.0, 19.0, 14.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.3125, -104.119140625, -100.92578125, -97.732421875, -94.5390625, -91.345703125, -88.15234375, -84.958984375, -81.765625, -78.572265625, -75.37890625, -72.185546875, -68.9921875, -65.798828125, -62.60546875, -59.412109375, -56.21875, -53.025390625, -49.83203125, -46.638671875, -43.4453125, -40.251953125, -37.05859375, -33.865234375, -30.671875, -27.478515625, -24.28515625, -21.091796875, -17.8984375, -14.705078125, -11.51171875, -8.318359375, -5.125, -1.931640625, 1.26171875, 4.455078125, 7.6484375, 10.841796875, 14.03515625, 17.228515625, 20.421875, 23.615234375, 26.80859375, 30.001953125, 33.1953125, 36.388671875, 39.58203125, 42.775390625, 45.96875, 49.162109375, 52.35546875, 55.548828125, 58.7421875, 61.935546875, 65.12890625, 68.322265625, 71.515625, 74.708984375, 77.90234375, 81.095703125, 84.2890625, 87.482421875, 90.67578125, 93.869140625, 97.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 115.0, 725.0, 161.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.76318359375, -318.2472229003906, -304.7312927246094, -291.21533203125, -277.69940185546875, -264.1834411621094, -250.66748046875, -237.1515350341797, -223.63558959960938, -210.11964416503906, -196.60369873046875, -183.08773803710938, -169.57179260253906, -156.05584716796875, -142.53988647460938, -129.02394104003906, -115.50799560546875, -101.99205017089844, -88.4760971069336, -74.96014404296875, -61.44419860839844, -47.928253173828125, -34.41230010986328, -20.896347045898438, -7.380401611328125, 6.135547637939453, 19.65149688720703, 33.16744613647461, 46.68339538574219, 60.1993408203125, 73.71529388427734, 87.23124694824219, 100.7471923828125, 114.26313781738281, 127.77909088134766, 141.2950439453125, 154.8109893798828, 168.32693481445312, 181.8428955078125, 195.3588409423828, 208.87478637695312, 222.39073181152344, 235.90667724609375, 249.42263793945312, 262.9385986328125, 276.45452880859375, 289.9704895019531, 303.4864501953125, 317.00238037109375, 330.5183410644531, 344.0342712402344, 357.55023193359375, 371.066162109375, 384.5821228027344, 398.09808349609375, 411.614013671875, 425.1299743652344, 438.64593505859375, 452.161865234375, 465.6778259277344, 479.19378662109375, 492.709716796875, 506.2256774902344, 519.7416381835938, 533.257568359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 9.0, 11.0, 13.0, 18.0, 27.0, 24.0, 27.0, 34.0, 28.0, 42.0, 36.0, 43.0, 49.0, 42.0, 55.0, 41.0, 52.0, 51.0, 39.0, 48.0, 39.0, 31.0, 31.0, 24.0, 27.0, 15.0, 22.0, 19.0, 20.0, 18.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-123.12319946289062, -119.35442352294922, -115.58563995361328, -111.81686401367188, -108.04808807373047, -104.27931213378906, -100.51052856445312, -96.74175262451172, -92.97297668457031, -89.2042007446289, -85.43541717529297, -81.66664123535156, -77.89786529541016, -74.12908935546875, -70.36030578613281, -66.5915298461914, -62.82274627685547, -59.0539665222168, -55.28519058227539, -51.51641082763672, -47.74763488769531, -43.97885513305664, -40.21007537841797, -36.44129943847656, -32.67251968383789, -28.90374183654785, -25.134963989257812, -21.36618423461914, -17.5974063873291, -13.828628540039062, -10.05984878540039, -6.291070938110352, -2.5222930908203125, 1.2464852333068848, 5.015263557434082, 8.784042358398438, 12.552820205688477, 16.321598052978516, 20.090377807617188, 23.859155654907227, 27.627933502197266, 31.396711349487305, 35.165489196777344, 38.934268951416016, 42.70304870605469, 46.471824645996094, 50.240604400634766, 54.00938415527344, 57.778160095214844, 61.546939849853516, 65.31571960449219, 69.0844955444336, 72.853271484375, 76.62205505371094, 80.39083099365234, 84.15960693359375, 87.92839050292969, 91.6971664428711, 95.46595001220703, 99.23472595214844, 103.00350189208984, 106.77227783203125, 110.54106140136719, 114.3098373413086, 118.07861328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 6.0, 8.0, 14.0, 10.0, 17.0, 27.0, 26.0, 25.0, 29.0, 45.0, 36.0, 36.0, 62.0, 53.0, 53.0, 56.0, 43.0, 55.0, 32.0, 39.0, 44.0, 46.0, 34.0, 37.0, 30.0, 17.0, 22.0, 16.0, 21.0, 14.0, 15.0, 7.0, 6.0, 5.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.153564453125, -20.44775390625, -19.741943359375, -19.0361328125, -18.330322265625, -17.62451171875, -16.918701171875, -16.212890625, -15.507080078125, -14.80126953125, -14.095458984375, -13.3896484375, -12.683837890625, -11.97802734375, -11.272216796875, -10.56640625, -9.860595703125, -9.15478515625, -8.448974609375, -7.7431640625, -7.037353515625, -6.33154296875, -5.625732421875, -4.919921875, -4.214111328125, -3.50830078125, -2.802490234375, -2.0966796875, -1.390869140625, -0.68505859375, 0.020751953125, 0.7265625, 1.432373046875, 2.13818359375, 2.843994140625, 3.5498046875, 4.255615234375, 4.96142578125, 5.667236328125, 6.373046875, 7.078857421875, 7.78466796875, 8.490478515625, 9.1962890625, 9.902099609375, 10.60791015625, 11.313720703125, 12.01953125, 12.725341796875, 13.43115234375, 14.136962890625, 14.8427734375, 15.548583984375, 16.25439453125, 16.960205078125, 17.666015625, 18.371826171875, 19.07763671875, 19.783447265625, 20.4892578125, 21.195068359375, 21.90087890625, 22.606689453125, 23.3125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 6.0, 7.0, 17.0, 16.0, 25.0, 26.0, 46.0, 66.0, 105.0, 150.0, 203.0, 272.0, 345.0, 534.0, 787.0, 1279.0, 2093.0, 3497.0, 6446.0, 13314.0, 31647.0, 107435.0, 603633.0, 2287241.0, 905489.0, 153450.0, 40799.0, 16120.0, 7860.0, 4225.0, 2511.0, 1553.0, 896.0, 632.0, 418.0, 310.0, 219.0, 170.0, 115.0, 86.0, 77.0, 47.0, 32.0, 19.0, 17.0, 15.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-27.6875, -26.783203125, -25.87890625, -24.974609375, -24.0703125, -23.166015625, -22.26171875, -21.357421875, -20.453125, -19.548828125, -18.64453125, -17.740234375, -16.8359375, -15.931640625, -15.02734375, -14.123046875, -13.21875, -12.314453125, -11.41015625, -10.505859375, -9.6015625, -8.697265625, -7.79296875, -6.888671875, -5.984375, -5.080078125, -4.17578125, -3.271484375, -2.3671875, -1.462890625, -0.55859375, 0.345703125, 1.25, 2.154296875, 3.05859375, 3.962890625, 4.8671875, 5.771484375, 6.67578125, 7.580078125, 8.484375, 9.388671875, 10.29296875, 11.197265625, 12.1015625, 13.005859375, 13.91015625, 14.814453125, 15.71875, 16.623046875, 17.52734375, 18.431640625, 19.3359375, 20.240234375, 21.14453125, 22.048828125, 22.953125, 23.857421875, 24.76171875, 25.666015625, 26.5703125, 27.474609375, 28.37890625, 29.283203125, 30.1875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 20.0, 17.0, 44.0, 52.0, 82.0, 121.0, 208.0, 468.0, 996.0, 986.0, 518.0, 207.0, 122.0, 63.0, 45.0, 28.0, 22.0, 13.0, 18.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.21875, -43.603515625, -41.98828125, -40.373046875, -38.7578125, -37.142578125, -35.52734375, -33.912109375, -32.296875, -30.681640625, -29.06640625, -27.451171875, -25.8359375, -24.220703125, -22.60546875, -20.990234375, -19.375, -17.759765625, -16.14453125, -14.529296875, -12.9140625, -11.298828125, -9.68359375, -8.068359375, -6.453125, -4.837890625, -3.22265625, -1.607421875, 0.0078125, 1.623046875, 3.23828125, 4.853515625, 6.46875, 8.083984375, 9.69921875, 11.314453125, 12.9296875, 14.544921875, 16.16015625, 17.775390625, 19.390625, 21.005859375, 22.62109375, 24.236328125, 25.8515625, 27.466796875, 29.08203125, 30.697265625, 32.3125, 33.927734375, 35.54296875, 37.158203125, 38.7734375, 40.388671875, 42.00390625, 43.619140625, 45.234375, 46.849609375, 48.46484375, 50.080078125, 51.6953125, 53.310546875, 54.92578125, 56.541015625, 58.15625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 5.0, 3.0, 10.0, 14.0, 22.0, 41.0, 68.0, 93.0, 146.0, 241.0, 466.0, 767.0, 1497.0, 3620.0, 10690.0, 43793.0, 358778.0, 3494957.0, 229714.0, 34190.0, 8818.0, 3142.0, 1410.0, 743.0, 399.0, 255.0, 148.0, 79.0, 59.0, 34.0, 20.0, 12.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.4375, -74.216796875, -71.99609375, -69.775390625, -67.5546875, -65.333984375, -63.11328125, -60.892578125, -58.671875, -56.451171875, -54.23046875, -52.009765625, -49.7890625, -47.568359375, -45.34765625, -43.126953125, -40.90625, -38.685546875, -36.46484375, -34.244140625, -32.0234375, -29.802734375, -27.58203125, -25.361328125, -23.140625, -20.919921875, -18.69921875, -16.478515625, -14.2578125, -12.037109375, -9.81640625, -7.595703125, -5.375, -3.154296875, -0.93359375, 1.287109375, 3.5078125, 5.728515625, 7.94921875, 10.169921875, 12.390625, 14.611328125, 16.83203125, 19.052734375, 21.2734375, 23.494140625, 25.71484375, 27.935546875, 30.15625, 32.376953125, 34.59765625, 36.818359375, 39.0390625, 41.259765625, 43.48046875, 45.701171875, 47.921875, 50.142578125, 52.36328125, 54.583984375, 56.8046875, 59.025390625, 61.24609375, 63.466796875, 65.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 24.0, 21.0, 75.0, 131.0, 199.0, 206.0, 147.0, 89.0, 57.0, 26.0, 14.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.29751586914062, -207.6337127685547, -200.9698944091797, -194.30609130859375, -187.64227294921875, -180.9784698486328, -174.31466674804688, -167.65084838867188, -160.98704528808594, -154.3232421875, -147.659423828125, -140.99562072753906, -134.33181762695312, -127.66799926757812, -121.00419616699219, -114.34038543701172, -107.67657470703125, -101.01276397705078, -94.34895324707031, -87.68515014648438, -81.0213394165039, -74.35752868652344, -67.6937255859375, -61.02991485595703, -54.36610412597656, -47.702293395996094, -41.03848648071289, -34.37467956542969, -27.71086883544922, -21.04705810546875, -14.383251190185547, -7.719444274902344, -1.0556182861328125, 5.608190536499023, 12.27199935913086, 18.935808181762695, 25.59961700439453, 32.263427734375, 38.9272346496582, 45.591041564941406, 52.254852294921875, 58.918663024902344, 65.58247375488281, 72.24627685546875, 78.91008758544922, 85.57389831542969, 92.23770141601562, 98.9015121459961, 105.56532287597656, 112.22913360595703, 118.8929443359375, 125.55674743652344, 132.22055053710938, 138.88436889648438, 145.5481719970703, 152.21197509765625, 158.87579345703125, 165.5395965576172, 172.2034149169922, 178.86721801757812, 185.53103637695312, 192.19483947753906, 198.858642578125, 205.5224609375, 212.18626403808594]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 10.0, 10.0, 18.0, 10.0, 15.0, 24.0, 24.0, 22.0, 27.0, 39.0, 28.0, 39.0, 26.0, 29.0, 36.0, 37.0, 49.0, 51.0, 38.0, 38.0, 43.0, 50.0, 32.0, 35.0, 40.0, 28.0, 34.0, 34.0, 21.0, 21.0, 16.0, 8.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-104.46060180664062, -101.18244171142578, -97.90428161621094, -94.6261215209961, -91.34796142578125, -88.0698013305664, -84.79164123535156, -81.51348114013672, -78.23532104492188, -74.95716094970703, -71.67900085449219, -68.40084075927734, -65.1226806640625, -61.844520568847656, -58.56636047363281, -55.28820037841797, -52.01003646850586, -48.731876373291016, -45.45371627807617, -42.17555618286133, -38.897396087646484, -35.619232177734375, -32.34107208251953, -29.06291389465332, -25.784753799438477, -22.506593704223633, -19.22843360900879, -15.950272560119629, -12.672112464904785, -9.393951416015625, -6.115791320800781, -2.8376312255859375, 0.44052886962890625, 3.718689203262329, 6.996849536895752, 10.275010108947754, 13.553170204162598, 16.831331253051758, 20.1094913482666, 23.387651443481445, 26.66581153869629, 29.943971633911133, 33.22213363647461, 36.50029373168945, 39.7784538269043, 43.05661392211914, 46.334774017333984, 49.61293411254883, 52.89109420776367, 56.169254302978516, 59.44741439819336, 62.7255744934082, 66.00373840332031, 69.28189849853516, 72.56005859375, 75.83821868896484, 79.11637878417969, 82.39453887939453, 85.67269897460938, 88.95085906982422, 92.22901916503906, 95.5071792602539, 98.78533935546875, 102.0634994506836, 105.34165954589844]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 4.0, 13.0, 10.0, 15.0, 16.0, 19.0, 18.0, 22.0, 24.0, 30.0, 32.0, 32.0, 25.0, 53.0, 25.0, 45.0, 54.0, 40.0, 38.0, 50.0, 38.0, 52.0, 40.0, 41.0, 42.0, 21.0, 26.0, 22.0, 31.0, 20.0, 19.0, 14.0, 10.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.9375, -20.236572265625, -19.53564453125, -18.834716796875, -18.1337890625, -17.432861328125, -16.73193359375, -16.031005859375, -15.330078125, -14.629150390625, -13.92822265625, -13.227294921875, -12.5263671875, -11.825439453125, -11.12451171875, -10.423583984375, -9.72265625, -9.021728515625, -8.32080078125, -7.619873046875, -6.9189453125, -6.218017578125, -5.51708984375, -4.816162109375, -4.115234375, -3.414306640625, -2.71337890625, -2.012451171875, -1.3115234375, -0.610595703125, 0.09033203125, 0.791259765625, 1.4921875, 2.193115234375, 2.89404296875, 3.594970703125, 4.2958984375, 4.996826171875, 5.69775390625, 6.398681640625, 7.099609375, 7.800537109375, 8.50146484375, 9.202392578125, 9.9033203125, 10.604248046875, 11.30517578125, 12.006103515625, 12.70703125, 13.407958984375, 14.10888671875, 14.809814453125, 15.5107421875, 16.211669921875, 16.91259765625, 17.613525390625, 18.314453125, 19.015380859375, 19.71630859375, 20.417236328125, 21.1181640625, 21.819091796875, 22.52001953125, 23.220947265625, 23.921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 10.0, 13.0, 25.0, 41.0, 49.0, 61.0, 97.0, 190.0, 274.0, 340.0, 506.0, 836.0, 1252.0, 1825.0, 2913.0, 4340.0, 6270.0, 10008.0, 15681.0, 25039.0, 40556.0, 67727.0, 112451.0, 174691.0, 200655.0, 146583.0, 90524.0, 54958.0, 32948.0, 20469.0, 12800.0, 8411.0, 5434.0, 3520.0, 2280.0, 1631.0, 1025.0, 712.0, 464.0, 322.0, 206.0, 125.0, 89.0, 63.0, 56.0, 29.0, 17.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.48828125, -2.40875244140625, -2.3292236328125, -2.24969482421875, -2.170166015625, -2.09063720703125, -2.0111083984375, -1.93157958984375, -1.85205078125, -1.77252197265625, -1.6929931640625, -1.61346435546875, -1.533935546875, -1.45440673828125, -1.3748779296875, -1.29534912109375, -1.2158203125, -1.13629150390625, -1.0567626953125, -0.97723388671875, -0.897705078125, -0.81817626953125, -0.7386474609375, -0.65911865234375, -0.57958984375, -0.50006103515625, -0.4205322265625, -0.34100341796875, -0.261474609375, -0.18194580078125, -0.1024169921875, -0.02288818359375, 0.056640625, 0.13616943359375, 0.2156982421875, 0.29522705078125, 0.374755859375, 0.45428466796875, 0.5338134765625, 0.61334228515625, 0.69287109375, 0.77239990234375, 0.8519287109375, 0.93145751953125, 1.010986328125, 1.09051513671875, 1.1700439453125, 1.24957275390625, 1.3291015625, 1.40863037109375, 1.4881591796875, 1.56768798828125, 1.647216796875, 1.72674560546875, 1.8062744140625, 1.88580322265625, 1.96533203125, 2.04486083984375, 2.1243896484375, 2.20391845703125, 2.283447265625, 2.36297607421875, 2.4425048828125, 2.52203369140625, 2.6015625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 5.0, 11.0, 16.0, 17.0, 19.0, 26.0, 20.0, 21.0, 28.0, 33.0, 35.0, 35.0, 42.0, 39.0, 37.0, 44.0, 1069.0, 39.0, 40.0, 39.0, 34.0, 54.0, 38.0, 32.0, 33.0, 23.0, 24.0, 25.0, 23.0, 26.0, 15.0, 16.0, 7.0, 10.0, 8.0, 6.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-15.6796875, -15.243408203125, -14.80712890625, -14.370849609375, -13.9345703125, -13.498291015625, -13.06201171875, -12.625732421875, -12.189453125, -11.753173828125, -11.31689453125, -10.880615234375, -10.4443359375, -10.008056640625, -9.57177734375, -9.135498046875, -8.69921875, -8.262939453125, -7.82666015625, -7.390380859375, -6.9541015625, -6.517822265625, -6.08154296875, -5.645263671875, -5.208984375, -4.772705078125, -4.33642578125, -3.900146484375, -3.4638671875, -3.027587890625, -2.59130859375, -2.155029296875, -1.71875, -1.282470703125, -0.84619140625, -0.409912109375, 0.0263671875, 0.462646484375, 0.89892578125, 1.335205078125, 1.771484375, 2.207763671875, 2.64404296875, 3.080322265625, 3.5166015625, 3.952880859375, 4.38916015625, 4.825439453125, 5.26171875, 5.697998046875, 6.13427734375, 6.570556640625, 7.0068359375, 7.443115234375, 7.87939453125, 8.315673828125, 8.751953125, 9.188232421875, 9.62451171875, 10.060791015625, 10.4970703125, 10.933349609375, 11.36962890625, 11.805908203125, 12.2421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 15.0, 10.0, 25.0, 53.0, 66.0, 85.0, 145.0, 222.0, 303.0, 428.0, 681.0, 1170.0, 1748.0, 2721.0, 4139.0, 6607.0, 10521.0, 17066.0, 27920.0, 46225.0, 78657.0, 129320.0, 521333.0, 916471.0, 131318.0, 78736.0, 46602.0, 28170.0, 17147.0, 10744.0, 6566.0, 4303.0, 2633.0, 1643.0, 1144.0, 779.0, 477.0, 327.0, 206.0, 108.0, 104.0, 50.0, 36.0, 42.0, 21.0, 14.0, 6.0, 9.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7625579833984375, -1.703826904296875, -1.6450958251953125, -1.58636474609375, -1.5276336669921875, -1.468902587890625, -1.4101715087890625, -1.3514404296875, -1.2927093505859375, -1.233978271484375, -1.1752471923828125, -1.11651611328125, -1.0577850341796875, -0.999053955078125, -0.9403228759765625, -0.881591796875, -0.8228607177734375, -0.764129638671875, -0.7053985595703125, -0.64666748046875, -0.5879364013671875, -0.529205322265625, -0.4704742431640625, -0.4117431640625, -0.3530120849609375, -0.294281005859375, -0.2355499267578125, -0.17681884765625, -0.1180877685546875, -0.059356689453125, -0.0006256103515625, 0.05810546875, 0.1168365478515625, 0.175567626953125, 0.2342987060546875, 0.29302978515625, 0.3517608642578125, 0.410491943359375, 0.4692230224609375, 0.5279541015625, 0.5866851806640625, 0.645416259765625, 0.7041473388671875, 0.76287841796875, 0.8216094970703125, 0.880340576171875, 0.9390716552734375, 0.997802734375, 1.0565338134765625, 1.115264892578125, 1.1739959716796875, 1.23272705078125, 1.2914581298828125, 1.350189208984375, 1.4089202880859375, 1.4676513671875, 1.5263824462890625, 1.585113525390625, 1.6438446044921875, 1.70257568359375, 1.7613067626953125, 1.820037841796875, 1.8787689208984375, 1.9375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 3.0, 11.0, 15.0, 11.0, 27.0, 27.0, 39.0, 49.0, 63.0, 93.0, 120.0, 128.0, 110.0, 66.0, 49.0, 39.0, 33.0, 17.0, 14.0, 7.0, 15.0, 10.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049713134765625, -0.04811239242553711, -0.04651165008544922, -0.04491090774536133, -0.04331016540527344, -0.04170942306518555, -0.040108680725097656, -0.038507938385009766, -0.036907196044921875, -0.035306453704833984, -0.033705711364746094, -0.0321049690246582, -0.030504226684570312, -0.028903484344482422, -0.02730274200439453, -0.02570199966430664, -0.02410125732421875, -0.02250051498413086, -0.02089977264404297, -0.019299030303955078, -0.017698287963867188, -0.016097545623779297, -0.014496803283691406, -0.012896060943603516, -0.011295318603515625, -0.009694576263427734, -0.008093833923339844, -0.006493091583251953, -0.0048923492431640625, -0.003291606903076172, -0.0016908645629882812, -9.012222290039062e-05, 0.0015106201171875, 0.0031113624572753906, 0.004712104797363281, 0.006312847137451172, 0.007913589477539062, 0.009514331817626953, 0.011115074157714844, 0.012715816497802734, 0.014316558837890625, 0.015917301177978516, 0.017518043518066406, 0.019118785858154297, 0.020719528198242188, 0.022320270538330078, 0.02392101287841797, 0.02552175521850586, 0.02712249755859375, 0.02872323989868164, 0.03032398223876953, 0.03192472457885742, 0.03352546691894531, 0.0351262092590332, 0.036726951599121094, 0.038327693939208984, 0.039928436279296875, 0.041529178619384766, 0.043129920959472656, 0.04473066329956055, 0.04633140563964844, 0.04793214797973633, 0.04953289031982422, 0.05113363265991211, 0.052734375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 10.0, 12.0, 10.0, 20.0, 26.0, 29.0, 31.0, 49.0, 79.0, 115.0, 203.0, 343.0, 1079.0, 972386.0, 72522.0, 795.0, 289.0, 177.0, 100.0, 75.0, 46.0, 33.0, 21.0, 24.0, 12.0, 11.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9970626831054688, -0.9658050537109375, -0.9345474243164062, -0.903289794921875, -0.8720321655273438, -0.8407745361328125, -0.8095169067382812, -0.77825927734375, -0.7470016479492188, -0.7157440185546875, -0.6844863891601562, -0.653228759765625, -0.6219711303710938, -0.5907135009765625, -0.5594558715820312, -0.5281982421875, -0.49694061279296875, -0.4656829833984375, -0.43442535400390625, -0.403167724609375, -0.37191009521484375, -0.3406524658203125, -0.30939483642578125, -0.27813720703125, -0.24687957763671875, -0.2156219482421875, -0.18436431884765625, -0.153106689453125, -0.12184906005859375, -0.0905914306640625, -0.05933380126953125, -0.028076171875, 0.00318145751953125, 0.0344390869140625, 0.06569671630859375, 0.096954345703125, 0.12821197509765625, 0.1594696044921875, 0.19072723388671875, 0.22198486328125, 0.25324249267578125, 0.2845001220703125, 0.31575775146484375, 0.347015380859375, 0.37827301025390625, 0.4095306396484375, 0.44078826904296875, 0.4720458984375, 0.5033035278320312, 0.5345611572265625, 0.5658187866210938, 0.597076416015625, 0.6283340454101562, 0.6595916748046875, 0.6908493041992188, 0.72210693359375, 0.7533645629882812, 0.7846221923828125, 0.8158798217773438, 0.847137451171875, 0.8783950805664062, 0.9096527099609375, 0.9409103393554688, 0.97216796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1004.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24563029408454895, -0.2198905050754547, -0.19415071606636047, -0.16841092705726624, -0.142671138048172, -0.11693136394023895, -0.09119157493114471, -0.06545178592205048, -0.03971199691295624, -0.013972209766507149, 0.01176757737994194, 0.03750736266374588, 0.06324715167284012, 0.08898693323135376, 0.114726722240448, 0.14046651124954224, 0.16620630025863647, 0.1919460892677307, 0.21768587827682495, 0.2434256672859192, 0.2691654562950134, 0.29490524530410767, 0.3206450343132019, 0.34638482332229614, 0.3721246123313904, 0.3978644013404846, 0.42360419034957886, 0.4493439793586731, 0.47508376836776733, 0.5008235573768616, 0.5265633463859558, 0.55230313539505, 0.5780429244041443, 0.6037827134132385, 0.6295225024223328, 0.655262291431427, 0.6810020804405212, 0.7067418694496155, 0.7324816584587097, 0.758221447467804, 0.7839612364768982, 0.8097010254859924, 0.8354408144950867, 0.8611806035041809, 0.8869203925132751, 0.9126601815223694, 0.9383999705314636, 0.9641397595405579, 0.9898794889450073, 1.0156192779541016, 1.0413590669631958, 1.06709885597229, 1.0928386449813843, 1.1185784339904785, 1.1443182229995728, 1.170058012008667, 1.1957978010177612, 1.2215375900268555, 1.2472773790359497, 1.273017168045044, 1.2987569570541382, 1.3244967460632324, 1.3502365350723267, 1.375976324081421, 1.4017161130905151]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 6.0, 20.0, 19.0, 23.0, 18.0, 20.0, 28.0, 46.0, 43.0, 39.0, 56.0, 56.0, 50.0, 44.0, 38.0, 44.0, 51.0, 54.0, 45.0, 53.0, 38.0, 32.0, 37.0, 35.0, 24.0, 18.0, 15.0, 17.0, 6.0, 9.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06911146640777588, -0.06712162494659424, -0.0651317909359932, -0.06314194947481155, -0.06115211173892021, -0.05916227400302887, -0.05717243254184723, -0.05518259480595589, -0.053192757070064545, -0.0512029193341732, -0.04921308159828186, -0.04722324013710022, -0.04523340240120888, -0.043243564665317535, -0.041253723204135895, -0.03926388546824455, -0.03727404773235321, -0.03528420999646187, -0.033294372260570526, -0.031304530799388885, -0.029314693063497543, -0.0273248553276062, -0.02533501572906971, -0.02334517613053322, -0.021355338394641876, -0.019365500658750534, -0.017375661060214043, -0.015385822393000126, -0.013395983725786209, -0.011406145058572292, -0.009416306391358376, -0.007426467724144459, -0.005436629056930542, -0.003446790389716625, -0.0014569517225027084, 0.0005328869447112083, 0.002522725611925125, 0.004512564279139042, 0.006502402946352959, 0.008492241613566875, 0.010482080280780792, 0.012471918947994709, 0.014461757615208626, 0.016451597213745117, 0.01844143494963646, 0.0204312726855278, 0.022421112284064293, 0.024410951882600784, 0.026400789618492126, 0.02839062735438347, 0.03038046695291996, 0.03237030655145645, 0.034360144287347794, 0.036349982023239136, 0.038339823484420776, 0.04032966122031212, 0.04231949895620346, 0.0443093366920948, 0.046299174427986145, 0.048289015889167786, 0.05027885362505913, 0.05226869136095047, 0.05425853282213211, 0.05624837055802345, 0.058238208293914795]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 5.0, 4.0, 4.0, 13.0, 10.0, 15.0, 16.0, 19.0, 18.0, 22.0, 24.0, 30.0, 33.0, 31.0, 25.0, 53.0, 25.0, 45.0, 54.0, 40.0, 38.0, 50.0, 38.0, 52.0, 40.0, 41.0, 42.0, 21.0, 26.0, 22.0, 31.0, 20.0, 19.0, 15.0, 9.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.9375, -20.236572265625, -19.53564453125, -18.834716796875, -18.1337890625, -17.432861328125, -16.73193359375, -16.031005859375, -15.330078125, -14.629150390625, -13.92822265625, -13.227294921875, -12.5263671875, -11.825439453125, -11.12451171875, -10.423583984375, -9.72265625, -9.021728515625, -8.32080078125, -7.619873046875, -6.9189453125, -6.218017578125, -5.51708984375, -4.816162109375, -4.115234375, -3.414306640625, -2.71337890625, -2.012451171875, -1.3115234375, -0.610595703125, 0.09033203125, 0.791259765625, 1.4921875, 2.193115234375, 2.89404296875, 3.594970703125, 4.2958984375, 4.996826171875, 5.69775390625, 6.398681640625, 7.099609375, 7.800537109375, 8.50146484375, 9.202392578125, 9.9033203125, 10.604248046875, 11.30517578125, 12.006103515625, 12.70703125, 13.407958984375, 14.10888671875, 14.809814453125, 15.5107421875, 16.211669921875, 16.91259765625, 17.613525390625, 18.314453125, 19.015380859375, 19.71630859375, 20.417236328125, 21.1181640625, 21.819091796875, 22.52001953125, 23.220947265625, 23.921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 15.0, 26.0, 30.0, 55.0, 98.0, 122.0, 188.0, 314.0, 549.0, 930.0, 1758.0, 3366.0, 7133.0, 15800.0, 41939.0, 146871.0, 570768.0, 177394.0, 47736.0, 17530.0, 7736.0, 3657.0, 1891.0, 1055.0, 590.0, 339.0, 204.0, 136.0, 95.0, 56.0, 35.0, 27.0, 17.0, 8.0, 14.0, 10.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0], "bins": [-39.875, -38.72119140625, -37.5673828125, -36.41357421875, -35.259765625, -34.10595703125, -32.9521484375, -31.79833984375, -30.64453125, -29.49072265625, -28.3369140625, -27.18310546875, -26.029296875, -24.87548828125, -23.7216796875, -22.56787109375, -21.4140625, -20.26025390625, -19.1064453125, -17.95263671875, -16.798828125, -15.64501953125, -14.4912109375, -13.33740234375, -12.18359375, -11.02978515625, -9.8759765625, -8.72216796875, -7.568359375, -6.41455078125, -5.2607421875, -4.10693359375, -2.953125, -1.79931640625, -0.6455078125, 0.50830078125, 1.662109375, 2.81591796875, 3.9697265625, 5.12353515625, 6.27734375, 7.43115234375, 8.5849609375, 9.73876953125, 10.892578125, 12.04638671875, 13.2001953125, 14.35400390625, 15.5078125, 16.66162109375, 17.8154296875, 18.96923828125, 20.123046875, 21.27685546875, 22.4306640625, 23.58447265625, 24.73828125, 25.89208984375, 27.0458984375, 28.19970703125, 29.353515625, 30.50732421875, 31.6611328125, 32.81494140625, 33.96875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 7.0, 12.0, 10.0, 18.0, 24.0, 26.0, 33.0, 39.0, 38.0, 42.0, 61.0, 75.0, 118.0, 249.0, 1599.0, 193.0, 102.0, 89.0, 51.0, 48.0, 34.0, 36.0, 25.0, 25.0, 23.0, 15.0, 15.0, 6.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0, -71.6357421875, -69.271484375, -66.9072265625, -64.54296875, -62.1787109375, -59.814453125, -57.4501953125, -55.0859375, -52.7216796875, -50.357421875, -47.9931640625, -45.62890625, -43.2646484375, -40.900390625, -38.5361328125, -36.171875, -33.8076171875, -31.443359375, -29.0791015625, -26.71484375, -24.3505859375, -21.986328125, -19.6220703125, -17.2578125, -14.8935546875, -12.529296875, -10.1650390625, -7.80078125, -5.4365234375, -3.072265625, -0.7080078125, 1.65625, 4.0205078125, 6.384765625, 8.7490234375, 11.11328125, 13.4775390625, 15.841796875, 18.2060546875, 20.5703125, 22.9345703125, 25.298828125, 27.6630859375, 30.02734375, 32.3916015625, 34.755859375, 37.1201171875, 39.484375, 41.8486328125, 44.212890625, 46.5771484375, 48.94140625, 51.3056640625, 53.669921875, 56.0341796875, 58.3984375, 60.7626953125, 63.126953125, 65.4912109375, 67.85546875, 70.2197265625, 72.583984375, 74.9482421875, 77.3125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 12.0, 16.0, 10.0, 22.0, 19.0, 29.0, 48.0, 65.0, 103.0, 151.0, 259.0, 606.0, 2298.0, 22131.0, 2664812.0, 440912.0, 11646.0, 1455.0, 460.0, 235.0, 115.0, 80.0, 53.0, 40.0, 31.0, 20.0, 10.0, 13.0, 14.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.4375, -95.5947265625, -91.751953125, -87.9091796875, -84.06640625, -80.2236328125, -76.380859375, -72.5380859375, -68.6953125, -64.8525390625, -61.009765625, -57.1669921875, -53.32421875, -49.4814453125, -45.638671875, -41.7958984375, -37.953125, -34.1103515625, -30.267578125, -26.4248046875, -22.58203125, -18.7392578125, -14.896484375, -11.0537109375, -7.2109375, -3.3681640625, 0.474609375, 4.3173828125, 8.16015625, 12.0029296875, 15.845703125, 19.6884765625, 23.53125, 27.3740234375, 31.216796875, 35.0595703125, 38.90234375, 42.7451171875, 46.587890625, 50.4306640625, 54.2734375, 58.1162109375, 61.958984375, 65.8017578125, 69.64453125, 73.4873046875, 77.330078125, 81.1728515625, 85.015625, 88.8583984375, 92.701171875, 96.5439453125, 100.38671875, 104.2294921875, 108.072265625, 111.9150390625, 115.7578125, 119.6005859375, 123.443359375, 127.2861328125, 131.12890625, 134.9716796875, 138.814453125, 142.6572265625, 146.5]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 18.0, 104.0, 368.0, 348.0, 135.0, 32.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.8460693359375, -102.3260726928711, -93.80607604980469, -85.28608703613281, -76.7660903930664, -68.24609375, -59.72610092163086, -51.20610809326172, -42.68611145019531, -34.166114807128906, -25.646121978759766, -17.126127243041992, -8.606132507324219, -0.0861358642578125, 8.433856964111328, 16.95384979248047, 25.473846435546875, 33.99384307861328, 42.51383590698242, 51.03382873535156, 59.55382537841797, 68.07382202148438, 76.59381103515625, 85.11380767822266, 93.63380432128906, 102.15380096435547, 110.67379760742188, 119.19378662109375, 127.71378326416016, 136.23377990722656, 144.75376892089844, 153.27377319335938, 161.79376220703125, 170.31375122070312, 178.83375549316406, 187.35374450683594, 195.87374877929688, 204.39373779296875, 212.91372680664062, 221.4337158203125, 229.95372009277344, 238.4737091064453, 246.99371337890625, 255.51370239257812, 264.03369140625, 272.5537109375, 281.0736999511719, 289.59368896484375, 298.1136779785156, 306.6336669921875, 315.1536560058594, 323.6736755371094, 332.19366455078125, 340.7136535644531, 349.233642578125, 357.7536315917969, 366.27362060546875, 374.7936096191406, 383.3135986328125, 391.8336181640625, 400.3536071777344, 408.87359619140625, 417.3935852050781, 425.91357421875, 434.43359375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 9.0, 4.0, 7.0, 9.0, 7.0, 10.0, 12.0, 13.0, 22.0, 26.0, 15.0, 21.0, 30.0, 26.0, 34.0, 33.0, 35.0, 44.0, 27.0, 43.0, 41.0, 33.0, 38.0, 33.0, 43.0, 37.0, 38.0, 42.0, 29.0, 20.0, 34.0, 24.0, 29.0, 20.0, 17.0, 13.0, 10.0, 19.0, 13.0, 4.0, 11.0, 6.0, 10.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-115.88993835449219, -112.15206909179688, -108.41419219970703, -104.67632293701172, -100.93844604492188, -97.20057678222656, -93.46270751953125, -89.7248306274414, -85.98695373535156, -82.24908447265625, -78.5112075805664, -74.7733383178711, -71.03546142578125, -67.29759216308594, -63.55971908569336, -59.82184600830078, -56.08397674560547, -52.34610366821289, -48.60823059082031, -44.870361328125, -41.132484436035156, -37.394615173339844, -33.656742095947266, -29.918869018554688, -26.18099594116211, -22.44312286376953, -18.705249786376953, -14.967378616333008, -11.22950553894043, -7.491632461547852, -3.7537612915039062, -0.015888214111328125, 3.7219924926757812, 7.459865093231201, 11.197737693786621, 14.935609817504883, 18.67348289489746, 22.41135597229004, 26.149227142333984, 29.887100219726562, 33.62497329711914, 37.36284637451172, 41.1007194519043, 44.838592529296875, 48.57646179199219, 52.31433868408203, 56.052207946777344, 59.79008102416992, 63.5279541015625, 67.26582336425781, 71.00370025634766, 74.74156951904297, 78.47944641113281, 82.21731567382812, 85.95518493652344, 89.69306182861328, 93.43093872070312, 97.16880798339844, 100.90668487548828, 104.6445541381836, 108.38243103027344, 112.12030029296875, 115.85816955566406, 119.5960464477539, 123.33391571044922]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 1.0, 3.0, 12.0, 8.0, 7.0, 11.0, 14.0, 13.0, 10.0, 12.0, 16.0, 15.0, 21.0, 21.0, 28.0, 28.0, 31.0, 34.0, 40.0, 38.0, 37.0, 47.0, 29.0, 36.0, 34.0, 39.0, 53.0, 44.0, 40.0, 42.0, 34.0, 19.0, 40.0, 23.0, 23.0, 19.0, 13.0, 17.0, 8.0, 10.0, 4.0, 6.0, 5.0, 5.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.265625, -20.583251953125, -19.90087890625, -19.218505859375, -18.5361328125, -17.853759765625, -17.17138671875, -16.489013671875, -15.806640625, -15.124267578125, -14.44189453125, -13.759521484375, -13.0771484375, -12.394775390625, -11.71240234375, -11.030029296875, -10.34765625, -9.665283203125, -8.98291015625, -8.300537109375, -7.6181640625, -6.935791015625, -6.25341796875, -5.571044921875, -4.888671875, -4.206298828125, -3.52392578125, -2.841552734375, -2.1591796875, -1.476806640625, -0.79443359375, -0.112060546875, 0.5703125, 1.252685546875, 1.93505859375, 2.617431640625, 3.2998046875, 3.982177734375, 4.66455078125, 5.346923828125, 6.029296875, 6.711669921875, 7.39404296875, 8.076416015625, 8.7587890625, 9.441162109375, 10.12353515625, 10.805908203125, 11.48828125, 12.170654296875, 12.85302734375, 13.535400390625, 14.2177734375, 14.900146484375, 15.58251953125, 16.264892578125, 16.947265625, 17.629638671875, 18.31201171875, 18.994384765625, 19.6767578125, 20.359130859375, 21.04150390625, 21.723876953125, 22.40625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 8.0, 12.0, 11.0, 18.0, 24.0, 29.0, 21.0, 46.0, 60.0, 65.0, 92.0, 104.0, 179.0, 228.0, 476.0, 1445.0, 7704.0, 901076.0, 3267048.0, 12320.0, 1781.0, 537.0, 247.0, 201.0, 115.0, 92.0, 64.0, 71.0, 32.0, 31.0, 23.0, 18.0, 16.0, 21.0, 16.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-175.875, -170.716796875, -165.55859375, -160.400390625, -155.2421875, -150.083984375, -144.92578125, -139.767578125, -134.609375, -129.451171875, -124.29296875, -119.134765625, -113.9765625, -108.818359375, -103.66015625, -98.501953125, -93.34375, -88.185546875, -83.02734375, -77.869140625, -72.7109375, -67.552734375, -62.39453125, -57.236328125, -52.078125, -46.919921875, -41.76171875, -36.603515625, -31.4453125, -26.287109375, -21.12890625, -15.970703125, -10.8125, -5.654296875, -0.49609375, 4.662109375, 9.8203125, 14.978515625, 20.13671875, 25.294921875, 30.453125, 35.611328125, 40.76953125, 45.927734375, 51.0859375, 56.244140625, 61.40234375, 66.560546875, 71.71875, 76.876953125, 82.03515625, 87.193359375, 92.3515625, 97.509765625, 102.66796875, 107.826171875, 112.984375, 118.142578125, 123.30078125, 128.458984375, 133.6171875, 138.775390625, 143.93359375, 149.091796875, 154.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 12.0, 8.0, 12.0, 14.0, 22.0, 31.0, 51.0, 66.0, 66.0, 136.0, 228.0, 445.0, 1056.0, 974.0, 457.0, 209.0, 100.0, 63.0, 31.0, 18.0, 24.0, 12.0, 15.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.78125, -44.07861328125, -42.3759765625, -40.67333984375, -38.970703125, -37.26806640625, -35.5654296875, -33.86279296875, -32.16015625, -30.45751953125, -28.7548828125, -27.05224609375, -25.349609375, -23.64697265625, -21.9443359375, -20.24169921875, -18.5390625, -16.83642578125, -15.1337890625, -13.43115234375, -11.728515625, -10.02587890625, -8.3232421875, -6.62060546875, -4.91796875, -3.21533203125, -1.5126953125, 0.18994140625, 1.892578125, 3.59521484375, 5.2978515625, 7.00048828125, 8.703125, 10.40576171875, 12.1083984375, 13.81103515625, 15.513671875, 17.21630859375, 18.9189453125, 20.62158203125, 22.32421875, 24.02685546875, 25.7294921875, 27.43212890625, 29.134765625, 30.83740234375, 32.5400390625, 34.24267578125, 35.9453125, 37.64794921875, 39.3505859375, 41.05322265625, 42.755859375, 44.45849609375, 46.1611328125, 47.86376953125, 49.56640625, 51.26904296875, 52.9716796875, 54.67431640625, 56.376953125, 58.07958984375, 59.7822265625, 61.48486328125, 63.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 10.0, 24.0, 27.0, 34.0, 42.0, 90.0, 125.0, 250.0, 467.0, 999.0, 2883.0, 10719.0, 67212.0, 3232503.0, 831108.0, 36656.0, 7045.0, 2133.0, 851.0, 437.0, 219.0, 133.0, 86.0, 61.0, 35.0, 29.0, 19.0, 17.0, 11.0, 8.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.9375, -80.8134765625, -77.689453125, -74.5654296875, -71.44140625, -68.3173828125, -65.193359375, -62.0693359375, -58.9453125, -55.8212890625, -52.697265625, -49.5732421875, -46.44921875, -43.3251953125, -40.201171875, -37.0771484375, -33.953125, -30.8291015625, -27.705078125, -24.5810546875, -21.45703125, -18.3330078125, -15.208984375, -12.0849609375, -8.9609375, -5.8369140625, -2.712890625, 0.4111328125, 3.53515625, 6.6591796875, 9.783203125, 12.9072265625, 16.03125, 19.1552734375, 22.279296875, 25.4033203125, 28.52734375, 31.6513671875, 34.775390625, 37.8994140625, 41.0234375, 44.1474609375, 47.271484375, 50.3955078125, 53.51953125, 56.6435546875, 59.767578125, 62.8916015625, 66.015625, 69.1396484375, 72.263671875, 75.3876953125, 78.51171875, 81.6357421875, 84.759765625, 87.8837890625, 91.0078125, 94.1318359375, 97.255859375, 100.3798828125, 103.50390625, 106.6279296875, 109.751953125, 112.8759765625, 116.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 11.0, 41.0, 217.0, 495.0, 192.0, 45.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.56854248046875, -271.14715576171875, -253.72573852539062, -236.30433654785156, -218.8829345703125, -201.46153259277344, -184.04013061523438, -166.6187286376953, -149.19732666015625, -131.7759246826172, -114.35452270507812, -96.93312072753906, -79.51171875, -62.09031677246094, -44.668914794921875, -27.247512817382812, -9.82611083984375, 7.5952911376953125, 25.016693115234375, 42.43809509277344, 59.8594970703125, 77.28089904785156, 94.70230102539062, 112.12370300292969, 129.54510498046875, 146.9665069580078, 164.38790893554688, 181.80931091308594, 199.230712890625, 216.65211486816406, 234.07351684570312, 251.4949188232422, 268.9163818359375, 286.3377685546875, 303.7591857910156, 321.18060302734375, 338.60198974609375, 356.02337646484375, 373.4447937011719, 390.8662109375, 408.28759765625, 425.708984375, 443.1304016113281, 460.55181884765625, 477.97320556640625, 495.39459228515625, 512.8160400390625, 530.2374267578125, 547.6588134765625, 565.0802001953125, 582.5015869140625, 599.9230346679688, 617.3444213867188, 634.7658081054688, 652.187255859375, 669.608642578125, 687.030029296875, 704.451416015625, 721.872802734375, 739.2942504882812, 756.7156372070312, 774.1370239257812, 791.5584716796875, 808.9798583984375, 826.4012451171875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 10.0, 3.0, 10.0, 11.0, 16.0, 12.0, 15.0, 15.0, 13.0, 23.0, 22.0, 34.0, 35.0, 29.0, 35.0, 39.0, 44.0, 33.0, 35.0, 36.0, 40.0, 35.0, 37.0, 64.0, 44.0, 34.0, 32.0, 28.0, 42.0, 28.0, 18.0, 21.0, 21.0, 12.0, 10.0, 9.0, 16.0, 7.0, 13.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-118.70956420898438, -114.91063690185547, -111.11170959472656, -107.31278228759766, -103.51385498046875, -99.71492767333984, -95.91600036621094, -92.11707305908203, -88.31814575195312, -84.51921844482422, -80.72029113769531, -76.9213638305664, -73.1224365234375, -69.3235092163086, -65.52458190917969, -61.72565460205078, -57.926727294921875, -54.12779998779297, -50.32887268066406, -46.529945373535156, -42.73101806640625, -38.932090759277344, -35.13316345214844, -31.33423614501953, -27.535308837890625, -23.73638153076172, -19.937454223632812, -16.138526916503906, -12.339599609375, -8.540672302246094, -4.7417449951171875, -0.9428176879882812, 2.856109619140625, 6.655036926269531, 10.453964233398438, 14.252891540527344, 18.05181884765625, 21.850746154785156, 25.649673461914062, 29.44860076904297, 33.247528076171875, 37.04645538330078, 40.84538269042969, 44.644309997558594, 48.4432373046875, 52.242164611816406, 56.04109191894531, 59.84001922607422, 63.638946533203125, 67.43787384033203, 71.23680114746094, 75.03572845458984, 78.83465576171875, 82.63358306884766, 86.43251037597656, 90.23143768310547, 94.03036499023438, 97.82929229736328, 101.62821960449219, 105.4271469116211, 109.22607421875, 113.0250015258789, 116.82392883300781, 120.62285614013672, 124.42178344726562]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 10.0, 15.0, 13.0, 23.0, 18.0, 25.0, 21.0, 26.0, 26.0, 27.0, 34.0, 32.0, 32.0, 40.0, 33.0, 38.0, 37.0, 46.0, 37.0, 36.0, 36.0, 48.0, 30.0, 39.0, 23.0, 22.0, 28.0, 32.0, 21.0, 21.0, 20.0, 14.0, 13.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.265625, -21.560791015625, -20.85595703125, -20.151123046875, -19.4462890625, -18.741455078125, -18.03662109375, -17.331787109375, -16.626953125, -15.922119140625, -15.21728515625, -14.512451171875, -13.8076171875, -13.102783203125, -12.39794921875, -11.693115234375, -10.98828125, -10.283447265625, -9.57861328125, -8.873779296875, -8.1689453125, -7.464111328125, -6.75927734375, -6.054443359375, -5.349609375, -4.644775390625, -3.93994140625, -3.235107421875, -2.5302734375, -1.825439453125, -1.12060546875, -0.415771484375, 0.2890625, 0.993896484375, 1.69873046875, 2.403564453125, 3.1083984375, 3.813232421875, 4.51806640625, 5.222900390625, 5.927734375, 6.632568359375, 7.33740234375, 8.042236328125, 8.7470703125, 9.451904296875, 10.15673828125, 10.861572265625, 11.56640625, 12.271240234375, 12.97607421875, 13.680908203125, 14.3857421875, 15.090576171875, 15.79541015625, 16.500244140625, 17.205078125, 17.909912109375, 18.61474609375, 19.319580078125, 20.0244140625, 20.729248046875, 21.43408203125, 22.138916015625, 22.84375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 11.0, 17.0, 16.0, 41.0, 56.0, 95.0, 110.0, 166.0, 278.0, 407.0, 578.0, 824.0, 1185.0, 1679.0, 2396.0, 3631.0, 5273.0, 8049.0, 11903.0, 18730.0, 29201.0, 46435.0, 74572.0, 118374.0, 179513.0, 189826.0, 130229.0, 81713.0, 50739.0, 31750.0, 20693.0, 13172.0, 8622.0, 5779.0, 3951.0, 2743.0, 1820.0, 1226.0, 875.0, 572.0, 443.0, 282.0, 199.0, 155.0, 81.0, 43.0, 41.0, 25.0, 16.0, 10.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.701171875, -2.61956787109375, -2.5379638671875, -2.45635986328125, -2.374755859375, -2.29315185546875, -2.2115478515625, -2.12994384765625, -2.04833984375, -1.96673583984375, -1.8851318359375, -1.80352783203125, -1.721923828125, -1.64031982421875, -1.5587158203125, -1.47711181640625, -1.3955078125, -1.31390380859375, -1.2322998046875, -1.15069580078125, -1.069091796875, -0.98748779296875, -0.9058837890625, -0.82427978515625, -0.74267578125, -0.66107177734375, -0.5794677734375, -0.49786376953125, -0.416259765625, -0.33465576171875, -0.2530517578125, -0.17144775390625, -0.08984375, -0.00823974609375, 0.0733642578125, 0.15496826171875, 0.236572265625, 0.31817626953125, 0.3997802734375, 0.48138427734375, 0.56298828125, 0.64459228515625, 0.7261962890625, 0.80780029296875, 0.889404296875, 0.97100830078125, 1.0526123046875, 1.13421630859375, 1.2158203125, 1.29742431640625, 1.3790283203125, 1.46063232421875, 1.542236328125, 1.62384033203125, 1.7054443359375, 1.78704833984375, 1.86865234375, 1.95025634765625, 2.0318603515625, 2.11346435546875, 2.195068359375, 2.27667236328125, 2.3582763671875, 2.43988037109375, 2.521484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 7.0, 9.0, 10.0, 12.0, 18.0, 15.0, 18.0, 21.0, 22.0, 34.0, 17.0, 26.0, 36.0, 35.0, 36.0, 35.0, 30.0, 43.0, 56.0, 1059.0, 43.0, 45.0, 49.0, 21.0, 33.0, 34.0, 27.0, 33.0, 22.0, 24.0, 22.0, 21.0, 18.0, 15.0, 11.0, 8.0, 19.0, 11.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-15.328125, -14.875244140625, -14.42236328125, -13.969482421875, -13.5166015625, -13.063720703125, -12.61083984375, -12.157958984375, -11.705078125, -11.252197265625, -10.79931640625, -10.346435546875, -9.8935546875, -9.440673828125, -8.98779296875, -8.534912109375, -8.08203125, -7.629150390625, -7.17626953125, -6.723388671875, -6.2705078125, -5.817626953125, -5.36474609375, -4.911865234375, -4.458984375, -4.006103515625, -3.55322265625, -3.100341796875, -2.6474609375, -2.194580078125, -1.74169921875, -1.288818359375, -0.8359375, -0.383056640625, 0.06982421875, 0.522705078125, 0.9755859375, 1.428466796875, 1.88134765625, 2.334228515625, 2.787109375, 3.239990234375, 3.69287109375, 4.145751953125, 4.5986328125, 5.051513671875, 5.50439453125, 5.957275390625, 6.41015625, 6.863037109375, 7.31591796875, 7.768798828125, 8.2216796875, 8.674560546875, 9.12744140625, 9.580322265625, 10.033203125, 10.486083984375, 10.93896484375, 11.391845703125, 11.8447265625, 12.297607421875, 12.75048828125, 13.203369140625, 13.65625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 16.0, 10.0, 22.0, 34.0, 53.0, 77.0, 135.0, 188.0, 277.0, 407.0, 598.0, 988.0, 1469.0, 2124.0, 3474.0, 5430.0, 8150.0, 13151.0, 21253.0, 35339.0, 59454.0, 102178.0, 173012.0, 1268764.0, 161428.0, 95120.0, 56042.0, 33496.0, 19994.0, 12447.0, 7715.0, 4991.0, 3232.0, 2102.0, 1311.0, 898.0, 571.0, 406.0, 252.0, 170.0, 100.0, 89.0, 50.0, 35.0, 25.0, 17.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.189453125, -2.1219482421875, -2.054443359375, -1.9869384765625, -1.91943359375, -1.8519287109375, -1.784423828125, -1.7169189453125, -1.6494140625, -1.5819091796875, -1.514404296875, -1.4468994140625, -1.37939453125, -1.3118896484375, -1.244384765625, -1.1768798828125, -1.109375, -1.0418701171875, -0.974365234375, -0.9068603515625, -0.83935546875, -0.7718505859375, -0.704345703125, -0.6368408203125, -0.5693359375, -0.5018310546875, -0.434326171875, -0.3668212890625, -0.29931640625, -0.2318115234375, -0.164306640625, -0.0968017578125, -0.029296875, 0.0382080078125, 0.105712890625, 0.1732177734375, 0.24072265625, 0.3082275390625, 0.375732421875, 0.4432373046875, 0.5107421875, 0.5782470703125, 0.645751953125, 0.7132568359375, 0.78076171875, 0.8482666015625, 0.915771484375, 0.9832763671875, 1.05078125, 1.1182861328125, 1.185791015625, 1.2532958984375, 1.32080078125, 1.3883056640625, 1.455810546875, 1.5233154296875, 1.5908203125, 1.6583251953125, 1.725830078125, 1.7933349609375, 1.86083984375, 1.9283447265625, 1.995849609375, 2.0633544921875, 2.130859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 4.0, 6.0, 7.0, 16.0, 9.0, 20.0, 29.0, 29.0, 51.0, 52.0, 75.0, 80.0, 98.0, 82.0, 77.0, 70.0, 66.0, 58.0, 32.0, 33.0, 24.0, 15.0, 9.0, 12.0, 5.0, 11.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03436851501464844, -0.033184051513671875, -0.03199958801269531, -0.03081512451171875, -0.029630661010742188, -0.028446197509765625, -0.027261734008789062, -0.0260772705078125, -0.024892807006835938, -0.023708343505859375, -0.022523880004882812, -0.02133941650390625, -0.020154953002929688, -0.018970489501953125, -0.017786026000976562, -0.0166015625, -0.015417098999023438, -0.014232635498046875, -0.013048171997070312, -0.01186370849609375, -0.010679244995117188, -0.009494781494140625, -0.008310317993164062, -0.0071258544921875, -0.0059413909912109375, -0.004756927490234375, -0.0035724639892578125, -0.00238800048828125, -0.0012035369873046875, -1.9073486328125e-05, 0.0011653900146484375, 0.002349853515625, 0.0035343170166015625, 0.004718780517578125, 0.0059032440185546875, 0.00708770751953125, 0.008272171020507812, 0.009456634521484375, 0.010641098022460938, 0.0118255615234375, 0.013010025024414062, 0.014194488525390625, 0.015378952026367188, 0.01656341552734375, 0.017747879028320312, 0.018932342529296875, 0.020116806030273438, 0.02130126953125, 0.022485733032226562, 0.023670196533203125, 0.024854660034179688, 0.02603912353515625, 0.027223587036132812, 0.028408050537109375, 0.029592514038085938, 0.0307769775390625, 0.03196144104003906, 0.033145904541015625, 0.03433036804199219, 0.03551483154296875, 0.03669929504394531, 0.037883758544921875, 0.03906822204589844, 0.040252685546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 15.0, 16.0, 24.0, 28.0, 50.0, 58.0, 94.0, 124.0, 234.0, 371.0, 1316.0, 786954.0, 257188.0, 1096.0, 355.0, 208.0, 124.0, 53.0, 57.0, 32.0, 27.0, 23.0, 14.0, 16.0, 13.0, 9.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.796875, -0.773406982421875, -0.74993896484375, -0.726470947265625, -0.7030029296875, -0.679534912109375, -0.65606689453125, -0.632598876953125, -0.609130859375, -0.585662841796875, -0.56219482421875, -0.538726806640625, -0.5152587890625, -0.491790771484375, -0.46832275390625, -0.444854736328125, -0.42138671875, -0.397918701171875, -0.37445068359375, -0.350982666015625, -0.3275146484375, -0.304046630859375, -0.28057861328125, -0.257110595703125, -0.233642578125, -0.210174560546875, -0.18670654296875, -0.163238525390625, -0.1397705078125, -0.116302490234375, -0.09283447265625, -0.069366455078125, -0.0458984375, -0.022430419921875, 0.00103759765625, 0.024505615234375, 0.0479736328125, 0.071441650390625, 0.09490966796875, 0.118377685546875, 0.141845703125, 0.165313720703125, 0.18878173828125, 0.212249755859375, 0.2357177734375, 0.259185791015625, 0.28265380859375, 0.306121826171875, 0.32958984375, 0.353057861328125, 0.37652587890625, 0.399993896484375, 0.4234619140625, 0.446929931640625, 0.47039794921875, 0.493865966796875, 0.517333984375, 0.540802001953125, 0.56427001953125, 0.587738037109375, 0.6112060546875, 0.634674072265625, 0.65814208984375, 0.681610107421875, 0.705078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 20.0, 988.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1338716298341751, -0.11262015253305435, -0.0913686752319336, -0.07011719793081284, -0.04886572062969208, -0.02761424332857132, -0.0063627660274505615, 0.014888718724250793, 0.036140188574790955, 0.05739166587591171, 0.07864314317703247, 0.09989462047815323, 0.12114609777927399, 0.14239758253097534, 0.1636490523815155, 0.18490053713321686, 0.20615200698375702, 0.22740349173545837, 0.24865496158599854, 0.2699064314365387, 0.29115790128707886, 0.3124094009399414, 0.33366087079048157, 0.35491234064102173, 0.3761638402938843, 0.39741531014442444, 0.4186667799949646, 0.43991827964782715, 0.4611697494983673, 0.48242121934890747, 0.50367271900177, 0.5249241590499878, 0.5461755990982056, 0.5674270987510681, 0.5886785387992859, 0.6099300384521484, 0.6311814785003662, 0.6524329781532288, 0.6736844778060913, 0.6949359178543091, 0.7161874175071716, 0.7374389171600342, 0.758690357208252, 0.7799418568611145, 0.801193356513977, 0.8224447965621948, 0.8436962962150574, 0.8649477958679199, 0.8861992359161377, 0.9074507355690002, 0.928702175617218, 0.9499536752700806, 0.9712051153182983, 0.9924566149711609, 1.0137081146240234, 1.0349595546722412, 1.056210994720459, 1.0774624347686768, 1.098713994026184, 1.1199654340744019, 1.1412168741226196, 1.162468433380127, 1.1837198734283447, 1.2049713134765625, 1.2262228727340698]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 8.0, 9.0, 16.0, 13.0, 17.0, 33.0, 33.0, 33.0, 38.0, 50.0, 44.0, 50.0, 59.0, 52.0, 69.0, 55.0, 67.0, 56.0, 41.0, 48.0, 54.0, 32.0, 25.0, 26.0, 8.0, 14.0, 17.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05988478660583496, -0.058346085250377655, -0.05680738389492035, -0.055268678814172745, -0.05372997745871544, -0.05219127610325813, -0.05065257102251053, -0.04911386966705322, -0.04757516831159592, -0.04603646695613861, -0.044497765600681305, -0.0429590605199337, -0.041420359164476395, -0.03988165780901909, -0.038342952728271484, -0.03680425137281418, -0.03526555001735687, -0.03372684866189957, -0.03218814730644226, -0.030649442225694656, -0.02911074087023735, -0.027572039514780045, -0.02603333629667759, -0.024494633078575134, -0.02295593172311783, -0.021417230367660522, -0.019878527149558067, -0.018339823931455612, -0.016801122575998306, -0.015262420289218426, -0.013723718002438545, -0.012185015715658665, -0.010646313428878784, -0.009107611142098904, -0.007568908855319023, -0.006030206568539143, -0.004491504281759262, -0.0029528019949793816, -0.001414099708199501, 0.00012460257858037949, 0.00166330486536026, 0.0032020071521401405, 0.004740709438920021, 0.006279411725699902, 0.007818114012479782, 0.009356816299259663, 0.010895518586039543, 0.012434220872819424, 0.013972923159599304, 0.015511625446379185, 0.017050327733159065, 0.01858903095126152, 0.020127732306718826, 0.021666433662176132, 0.023205136880278587, 0.024743840098381042, 0.02628254145383835, 0.027821242809295654, 0.02935994602739811, 0.030898649245500565, 0.03243735060095787, 0.033976051956415176, 0.03551475703716278, 0.03705345839262009, 0.03859215974807739]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 8.0, 17.0, 13.0, 22.0, 19.0, 25.0, 21.0, 25.0, 27.0, 26.0, 35.0, 31.0, 32.0, 40.0, 34.0, 38.0, 37.0, 46.0, 37.0, 35.0, 37.0, 48.0, 30.0, 39.0, 22.0, 23.0, 28.0, 31.0, 22.0, 21.0, 20.0, 14.0, 13.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.28125, -21.576171875, -20.87109375, -20.166015625, -19.4609375, -18.755859375, -18.05078125, -17.345703125, -16.640625, -15.935546875, -15.23046875, -14.525390625, -13.8203125, -13.115234375, -12.41015625, -11.705078125, -11.0, -10.294921875, -9.58984375, -8.884765625, -8.1796875, -7.474609375, -6.76953125, -6.064453125, -5.359375, -4.654296875, -3.94921875, -3.244140625, -2.5390625, -1.833984375, -1.12890625, -0.423828125, 0.28125, 0.986328125, 1.69140625, 2.396484375, 3.1015625, 3.806640625, 4.51171875, 5.216796875, 5.921875, 6.626953125, 7.33203125, 8.037109375, 8.7421875, 9.447265625, 10.15234375, 10.857421875, 11.5625, 12.267578125, 12.97265625, 13.677734375, 14.3828125, 15.087890625, 15.79296875, 16.498046875, 17.203125, 17.908203125, 18.61328125, 19.318359375, 20.0234375, 20.728515625, 21.43359375, 22.138671875, 22.84375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 18.0, 32.0, 34.0, 63.0, 71.0, 95.0, 138.0, 178.0, 238.0, 378.0, 473.0, 649.0, 950.0, 1332.0, 2228.0, 3814.0, 7418.0, 16654.0, 45688.0, 166016.0, 524844.0, 189389.0, 50948.0, 17912.0, 7821.0, 3921.0, 2322.0, 1434.0, 951.0, 694.0, 553.0, 343.0, 258.0, 191.0, 130.0, 94.0, 69.0, 47.0, 44.0, 21.0, 24.0, 15.0, 13.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-34.625, -33.56103515625, -32.4970703125, -31.43310546875, -30.369140625, -29.30517578125, -28.2412109375, -27.17724609375, -26.11328125, -25.04931640625, -23.9853515625, -22.92138671875, -21.857421875, -20.79345703125, -19.7294921875, -18.66552734375, -17.6015625, -16.53759765625, -15.4736328125, -14.40966796875, -13.345703125, -12.28173828125, -11.2177734375, -10.15380859375, -9.08984375, -8.02587890625, -6.9619140625, -5.89794921875, -4.833984375, -3.77001953125, -2.7060546875, -1.64208984375, -0.578125, 0.48583984375, 1.5498046875, 2.61376953125, 3.677734375, 4.74169921875, 5.8056640625, 6.86962890625, 7.93359375, 8.99755859375, 10.0615234375, 11.12548828125, 12.189453125, 13.25341796875, 14.3173828125, 15.38134765625, 16.4453125, 17.50927734375, 18.5732421875, 19.63720703125, 20.701171875, 21.76513671875, 22.8291015625, 23.89306640625, 24.95703125, 26.02099609375, 27.0849609375, 28.14892578125, 29.212890625, 30.27685546875, 31.3408203125, 32.40478515625, 33.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 5.0, 11.0, 16.0, 13.0, 24.0, 34.0, 44.0, 34.0, 38.0, 48.0, 60.0, 94.0, 155.0, 1440.0, 439.0, 135.0, 67.0, 43.0, 51.0, 54.0, 44.0, 37.0, 23.0, 21.0, 22.0, 18.0, 12.0, 8.0, 11.0, 4.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-80.1875, -77.95556640625, -75.7236328125, -73.49169921875, -71.259765625, -69.02783203125, -66.7958984375, -64.56396484375, -62.33203125, -60.10009765625, -57.8681640625, -55.63623046875, -53.404296875, -51.17236328125, -48.9404296875, -46.70849609375, -44.4765625, -42.24462890625, -40.0126953125, -37.78076171875, -35.548828125, -33.31689453125, -31.0849609375, -28.85302734375, -26.62109375, -24.38916015625, -22.1572265625, -19.92529296875, -17.693359375, -15.46142578125, -13.2294921875, -10.99755859375, -8.765625, -6.53369140625, -4.3017578125, -2.06982421875, 0.162109375, 2.39404296875, 4.6259765625, 6.85791015625, 9.08984375, 11.32177734375, 13.5537109375, 15.78564453125, 18.017578125, 20.24951171875, 22.4814453125, 24.71337890625, 26.9453125, 29.17724609375, 31.4091796875, 33.64111328125, 35.873046875, 38.10498046875, 40.3369140625, 42.56884765625, 44.80078125, 47.03271484375, 49.2646484375, 51.49658203125, 53.728515625, 55.96044921875, 58.1923828125, 60.42431640625, 62.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 9.0, 3.0, 5.0, 12.0, 15.0, 10.0, 12.0, 25.0, 18.0, 24.0, 39.0, 42.0, 51.0, 101.0, 165.0, 348.0, 753.0, 2456.0, 2819244.0, 319246.0, 1688.0, 652.0, 310.0, 150.0, 99.0, 57.0, 25.0, 23.0, 23.0, 21.0, 17.0, 13.0, 14.0, 8.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-226.75, -219.646484375, -212.54296875, -205.439453125, -198.3359375, -191.232421875, -184.12890625, -177.025390625, -169.921875, -162.818359375, -155.71484375, -148.611328125, -141.5078125, -134.404296875, -127.30078125, -120.197265625, -113.09375, -105.990234375, -98.88671875, -91.783203125, -84.6796875, -77.576171875, -70.47265625, -63.369140625, -56.265625, -49.162109375, -42.05859375, -34.955078125, -27.8515625, -20.748046875, -13.64453125, -6.541015625, 0.5625, 7.666015625, 14.76953125, 21.873046875, 28.9765625, 36.080078125, 43.18359375, 50.287109375, 57.390625, 64.494140625, 71.59765625, 78.701171875, 85.8046875, 92.908203125, 100.01171875, 107.115234375, 114.21875, 121.322265625, 128.42578125, 135.529296875, 142.6328125, 149.736328125, 156.83984375, 163.943359375, 171.046875, 178.150390625, 185.25390625, 192.357421875, 199.4609375, 206.564453125, 213.66796875, 220.771484375, 227.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 301.0, 658.0, 46.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-402.95916748046875, -380.8097839355469, -358.660400390625, -336.5110168457031, -314.36163330078125, -292.2122497558594, -270.0628662109375, -247.91348266601562, -225.76409912109375, -203.61471557617188, -181.46533203125, -159.31594848632812, -137.16656494140625, -115.01718139648438, -92.8677978515625, -70.71841430664062, -48.56903076171875, -26.419647216796875, -4.270263671875, 17.879119873046875, 40.02850341796875, 62.177886962890625, 84.3272705078125, 106.47665405273438, 128.62603759765625, 150.77542114257812, 172.9248046875, 195.07418823242188, 217.22357177734375, 239.37295532226562, 261.5223388671875, 283.6717224121094, 305.821044921875, 327.9704284667969, 350.11981201171875, 372.2691955566406, 394.4185791015625, 416.5679626464844, 438.71734619140625, 460.8667297363281, 483.01611328125, 505.1654968261719, 527.3148803710938, 549.4642333984375, 571.6136474609375, 593.7630615234375, 615.9124145507812, 638.061767578125, 660.211181640625, 682.360595703125, 704.5099487304688, 726.6593017578125, 748.8087158203125, 770.9581298828125, 793.1074829101562, 815.2568359375, 837.40625, 859.5556640625, 881.7050170898438, 903.8543701171875, 926.0037841796875, 948.1531982421875, 970.3025512695312, 992.451904296875, 1014.601318359375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 7.0, 3.0, 7.0, 8.0, 12.0, 8.0, 19.0, 14.0, 23.0, 15.0, 30.0, 19.0, 19.0, 33.0, 30.0, 33.0, 31.0, 26.0, 52.0, 52.0, 44.0, 50.0, 35.0, 41.0, 41.0, 33.0, 25.0, 30.0, 31.0, 42.0, 24.0, 23.0, 22.0, 13.0, 11.0, 15.0, 17.0, 9.0, 8.0, 8.0, 6.0, 10.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-162.3834991455078, -157.62156677246094, -152.85963439941406, -148.09771728515625, -143.33578491210938, -138.5738525390625, -133.81192016601562, -129.04998779296875, -124.2880630493164, -119.52613067626953, -114.76420593261719, -110.00227355957031, -105.24034118652344, -100.4784164428711, -95.71648406982422, -90.95455932617188, -86.192626953125, -81.43069458007812, -76.66876983642578, -71.9068374633789, -67.14491271972656, -62.38298034667969, -57.62104797363281, -52.8591194152832, -48.097190856933594, -43.335262298583984, -38.573333740234375, -33.8114013671875, -29.04947280883789, -24.28754425048828, -19.52561378479004, -14.763683319091797, -10.001739501953125, -5.239809989929199, -0.47788047790527344, 4.284049034118652, 9.045978546142578, 13.807907104492188, 18.56983757019043, 23.331768035888672, 28.09369659423828, 32.85562515258789, 37.6175537109375, 42.379486083984375, 47.141414642333984, 51.903343200683594, 56.66527557373047, 61.42720413208008, 66.18913269042969, 70.95106506347656, 75.7129898071289, 80.47492218017578, 85.23684692382812, 89.998779296875, 94.76071166992188, 99.52264404296875, 104.2845687866211, 109.04650115966797, 113.80842590332031, 118.57035827636719, 123.33229064941406, 128.09420776367188, 132.85614013671875, 137.61807250976562, 142.3800048828125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 9.0, 2.0, 10.0, 4.0, 10.0, 26.0, 15.0, 11.0, 23.0, 24.0, 26.0, 28.0, 23.0, 22.0, 30.0, 31.0, 44.0, 43.0, 41.0, 32.0, 39.0, 49.0, 56.0, 32.0, 34.0, 45.0, 39.0, 34.0, 28.0, 21.0, 21.0, 29.0, 26.0, 16.0, 13.0, 14.0, 18.0, 8.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.642578125, -21.87890625, -21.115234375, -20.3515625, -19.587890625, -18.82421875, -18.060546875, -17.296875, -16.533203125, -15.76953125, -15.005859375, -14.2421875, -13.478515625, -12.71484375, -11.951171875, -11.1875, -10.423828125, -9.66015625, -8.896484375, -8.1328125, -7.369140625, -6.60546875, -5.841796875, -5.078125, -4.314453125, -3.55078125, -2.787109375, -2.0234375, -1.259765625, -0.49609375, 0.267578125, 1.03125, 1.794921875, 2.55859375, 3.322265625, 4.0859375, 4.849609375, 5.61328125, 6.376953125, 7.140625, 7.904296875, 8.66796875, 9.431640625, 10.1953125, 10.958984375, 11.72265625, 12.486328125, 13.25, 14.013671875, 14.77734375, 15.541015625, 16.3046875, 17.068359375, 17.83203125, 18.595703125, 19.359375, 20.123046875, 20.88671875, 21.650390625, 22.4140625, 23.177734375, 23.94140625, 24.705078125, 25.46875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 13.0, 15.0, 18.0, 15.0, 22.0, 29.0, 39.0, 56.0, 79.0, 115.0, 168.0, 326.0, 643.0, 1287.0, 3469.0, 12100.0, 128479.0, 2906846.0, 1091452.0, 38132.0, 6688.0, 2154.0, 915.0, 456.0, 260.0, 141.0, 87.0, 74.0, 48.0, 23.0, 30.0, 14.0, 19.0, 7.0, 5.0, 9.0, 11.0, 5.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -68.1015625, -65.890625, -63.6796875, -61.46875, -59.2578125, -57.046875, -54.8359375, -52.625, -50.4140625, -48.203125, -45.9921875, -43.78125, -41.5703125, -39.359375, -37.1484375, -34.9375, -32.7265625, -30.515625, -28.3046875, -26.09375, -23.8828125, -21.671875, -19.4609375, -17.25, -15.0390625, -12.828125, -10.6171875, -8.40625, -6.1953125, -3.984375, -1.7734375, 0.4375, 2.6484375, 4.859375, 7.0703125, 9.28125, 11.4921875, 13.703125, 15.9140625, 18.125, 20.3359375, 22.546875, 24.7578125, 26.96875, 29.1796875, 31.390625, 33.6015625, 35.8125, 38.0234375, 40.234375, 42.4453125, 44.65625, 46.8671875, 49.078125, 51.2890625, 53.5, 55.7109375, 57.921875, 60.1328125, 62.34375, 64.5546875, 66.765625, 68.9765625, 71.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 8.0, 15.0, 4.0, 16.0, 13.0, 32.0, 31.0, 52.0, 89.0, 109.0, 136.0, 234.0, 371.0, 596.0, 843.0, 577.0, 302.0, 203.0, 132.0, 76.0, 65.0, 51.0, 36.0, 14.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.84130859375, -45.2451171875, -43.64892578125, -42.052734375, -40.45654296875, -38.8603515625, -37.26416015625, -35.66796875, -34.07177734375, -32.4755859375, -30.87939453125, -29.283203125, -27.68701171875, -26.0908203125, -24.49462890625, -22.8984375, -21.30224609375, -19.7060546875, -18.10986328125, -16.513671875, -14.91748046875, -13.3212890625, -11.72509765625, -10.12890625, -8.53271484375, -6.9365234375, -5.34033203125, -3.744140625, -2.14794921875, -0.5517578125, 1.04443359375, 2.640625, 4.23681640625, 5.8330078125, 7.42919921875, 9.025390625, 10.62158203125, 12.2177734375, 13.81396484375, 15.41015625, 17.00634765625, 18.6025390625, 20.19873046875, 21.794921875, 23.39111328125, 24.9873046875, 26.58349609375, 28.1796875, 29.77587890625, 31.3720703125, 32.96826171875, 34.564453125, 36.16064453125, 37.7568359375, 39.35302734375, 40.94921875, 42.54541015625, 44.1416015625, 45.73779296875, 47.333984375, 48.93017578125, 50.5263671875, 52.12255859375, 53.71875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 7.0, 8.0, 8.0, 28.0, 41.0, 50.0, 96.0, 165.0, 283.0, 577.0, 1238.0, 3744.0, 14077.0, 78855.0, 1727784.0, 2257335.0, 88468.0, 14866.0, 3870.0, 1405.0, 613.0, 305.0, 181.0, 97.0, 50.0, 40.0, 24.0, 16.0, 14.0, 13.0, 14.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-82.875, -80.439453125, -78.00390625, -75.568359375, -73.1328125, -70.697265625, -68.26171875, -65.826171875, -63.390625, -60.955078125, -58.51953125, -56.083984375, -53.6484375, -51.212890625, -48.77734375, -46.341796875, -43.90625, -41.470703125, -39.03515625, -36.599609375, -34.1640625, -31.728515625, -29.29296875, -26.857421875, -24.421875, -21.986328125, -19.55078125, -17.115234375, -14.6796875, -12.244140625, -9.80859375, -7.373046875, -4.9375, -2.501953125, -0.06640625, 2.369140625, 4.8046875, 7.240234375, 9.67578125, 12.111328125, 14.546875, 16.982421875, 19.41796875, 21.853515625, 24.2890625, 26.724609375, 29.16015625, 31.595703125, 34.03125, 36.466796875, 38.90234375, 41.337890625, 43.7734375, 46.208984375, 48.64453125, 51.080078125, 53.515625, 55.951171875, 58.38671875, 60.822265625, 63.2578125, 65.693359375, 68.12890625, 70.564453125, 73.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 115.0, 720.0, 172.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-832.3998413085938, -793.9087524414062, -755.4176025390625, -716.926513671875, -678.4354248046875, -639.9442749023438, -601.4531860351562, -562.9620361328125, -524.470947265625, -485.9798278808594, -447.48870849609375, -408.99761962890625, -370.5065002441406, -332.015380859375, -293.5242919921875, -255.03317260742188, -216.54205322265625, -178.05093383789062, -139.55982971191406, -101.06871795654297, -62.577606201171875, -24.08648681640625, 14.404617309570312, 52.895721435546875, 91.3868408203125, 129.87796020507812, 168.3690643310547, 206.86016845703125, 245.35128784179688, 283.8424072265625, 322.33349609375, 360.8246154785156, 399.3157958984375, 437.8069152832031, 476.29803466796875, 514.7891235351562, 553.2802734375, 591.7713623046875, 630.262451171875, 668.7535400390625, 707.2446899414062, 745.7357788085938, 784.2269287109375, 822.718017578125, 861.2091064453125, 899.7002563476562, 938.1913452148438, 976.6824951171875, 1015.173583984375, 1053.6646728515625, 1092.15576171875, 1130.64697265625, 1169.1380615234375, 1207.629150390625, 1246.1202392578125, 1284.611328125, 1323.1025390625, 1361.5936279296875, 1400.084716796875, 1438.575927734375, 1477.0670166015625, 1515.55810546875, 1554.0491943359375, 1592.540283203125, 1631.0313720703125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 7.0, 12.0, 10.0, 14.0, 16.0, 11.0, 25.0, 20.0, 17.0, 27.0, 22.0, 35.0, 31.0, 35.0, 33.0, 41.0, 34.0, 31.0, 44.0, 28.0, 36.0, 32.0, 33.0, 40.0, 34.0, 34.0, 36.0, 21.0, 22.0, 25.0, 26.0, 15.0, 20.0, 18.0, 12.0, 9.0, 10.0, 17.0, 6.0, 11.0, 12.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.62420654296875, -122.42036437988281, -118.2165298461914, -114.0126953125, -109.80885314941406, -105.60501098632812, -101.40117645263672, -97.19734191894531, -92.99349975585938, -88.78965759277344, -84.58582305908203, -80.38198852539062, -76.17814636230469, -71.97430419921875, -67.77046966552734, -63.56663131713867, -59.36279296875, -55.15895462036133, -50.955116271972656, -46.751277923583984, -42.54743957519531, -38.34360122680664, -34.13976287841797, -29.935924530029297, -25.732086181640625, -21.528247833251953, -17.32440948486328, -13.12057113647461, -8.916732788085938, -4.712894439697266, -0.5090560913085938, 3.694782257080078, 7.8986358642578125, 12.102474212646484, 16.306312561035156, 20.510150909423828, 24.7139892578125, 28.917827606201172, 33.121665954589844, 37.325504302978516, 41.52934265136719, 45.73318099975586, 49.93701934814453, 54.1408576965332, 58.344696044921875, 62.54853439331055, 66.75237274169922, 70.95620727539062, 75.16004943847656, 79.3638916015625, 83.5677261352539, 87.77156066894531, 91.97540283203125, 96.17924499511719, 100.3830795288086, 104.5869140625, 108.79075622558594, 112.99459838867188, 117.19843292236328, 121.40226745605469, 125.60610961914062, 129.80995178222656, 134.0137939453125, 138.21762084960938, 142.4214630126953]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 15.0, 15.0, 22.0, 19.0, 25.0, 19.0, 21.0, 34.0, 32.0, 33.0, 30.0, 39.0, 41.0, 54.0, 35.0, 39.0, 44.0, 44.0, 37.0, 35.0, 33.0, 29.0, 32.0, 35.0, 32.0, 33.0, 25.0, 20.0, 16.0, 11.0, 11.0, 7.0, 9.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.0, -19.35693359375, -18.7138671875, -18.07080078125, -17.427734375, -16.78466796875, -16.1416015625, -15.49853515625, -14.85546875, -14.21240234375, -13.5693359375, -12.92626953125, -12.283203125, -11.64013671875, -10.9970703125, -10.35400390625, -9.7109375, -9.06787109375, -8.4248046875, -7.78173828125, -7.138671875, -6.49560546875, -5.8525390625, -5.20947265625, -4.56640625, -3.92333984375, -3.2802734375, -2.63720703125, -1.994140625, -1.35107421875, -0.7080078125, -0.06494140625, 0.578125, 1.22119140625, 1.8642578125, 2.50732421875, 3.150390625, 3.79345703125, 4.4365234375, 5.07958984375, 5.72265625, 6.36572265625, 7.0087890625, 7.65185546875, 8.294921875, 8.93798828125, 9.5810546875, 10.22412109375, 10.8671875, 11.51025390625, 12.1533203125, 12.79638671875, 13.439453125, 14.08251953125, 14.7255859375, 15.36865234375, 16.01171875, 16.65478515625, 17.2978515625, 17.94091796875, 18.583984375, 19.22705078125, 19.8701171875, 20.51318359375, 21.15625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 22.0, 22.0, 32.0, 50.0, 70.0, 109.0, 144.0, 242.0, 335.0, 438.0, 685.0, 1037.0, 1438.0, 2212.0, 3209.0, 4899.0, 7257.0, 11003.0, 16737.0, 25778.0, 39571.0, 62919.0, 103372.0, 168697.0, 208070.0, 146137.0, 88896.0, 54096.0, 34811.0, 22528.0, 14566.0, 9684.0, 6433.0, 4187.0, 2879.0, 1942.0, 1267.0, 893.0, 594.0, 434.0, 271.0, 177.0, 135.0, 86.0, 57.0, 47.0, 31.0, 23.0, 13.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.099609375, -2.032623291015625, -1.96563720703125, -1.898651123046875, -1.8316650390625, -1.764678955078125, -1.69769287109375, -1.630706787109375, -1.563720703125, -1.496734619140625, -1.42974853515625, -1.362762451171875, -1.2957763671875, -1.228790283203125, -1.16180419921875, -1.094818115234375, -1.02783203125, -0.960845947265625, -0.89385986328125, -0.826873779296875, -0.7598876953125, -0.692901611328125, -0.62591552734375, -0.558929443359375, -0.491943359375, -0.424957275390625, -0.35797119140625, -0.290985107421875, -0.2239990234375, -0.157012939453125, -0.09002685546875, -0.023040771484375, 0.0439453125, 0.110931396484375, 0.17791748046875, 0.244903564453125, 0.3118896484375, 0.378875732421875, 0.44586181640625, 0.512847900390625, 0.579833984375, 0.646820068359375, 0.71380615234375, 0.780792236328125, 0.8477783203125, 0.914764404296875, 0.98175048828125, 1.048736572265625, 1.11572265625, 1.182708740234375, 1.24969482421875, 1.316680908203125, 1.3836669921875, 1.450653076171875, 1.51763916015625, 1.584625244140625, 1.651611328125, 1.718597412109375, 1.78558349609375, 1.852569580078125, 1.9195556640625, 1.986541748046875, 2.05352783203125, 2.120513916015625, 2.1875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 8.0, 4.0, 12.0, 16.0, 18.0, 16.0, 15.0, 17.0, 26.0, 19.0, 22.0, 29.0, 29.0, 32.0, 37.0, 43.0, 32.0, 54.0, 28.0, 40.0, 1057.0, 31.0, 31.0, 30.0, 40.0, 37.0, 22.0, 28.0, 36.0, 31.0, 28.0, 21.0, 23.0, 12.0, 13.0, 12.0, 14.0, 8.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.8203125, -12.4345703125, -12.048828125, -11.6630859375, -11.27734375, -10.8916015625, -10.505859375, -10.1201171875, -9.734375, -9.3486328125, -8.962890625, -8.5771484375, -8.19140625, -7.8056640625, -7.419921875, -7.0341796875, -6.6484375, -6.2626953125, -5.876953125, -5.4912109375, -5.10546875, -4.7197265625, -4.333984375, -3.9482421875, -3.5625, -3.1767578125, -2.791015625, -2.4052734375, -2.01953125, -1.6337890625, -1.248046875, -0.8623046875, -0.4765625, -0.0908203125, 0.294921875, 0.6806640625, 1.06640625, 1.4521484375, 1.837890625, 2.2236328125, 2.609375, 2.9951171875, 3.380859375, 3.7666015625, 4.15234375, 4.5380859375, 4.923828125, 5.3095703125, 5.6953125, 6.0810546875, 6.466796875, 6.8525390625, 7.23828125, 7.6240234375, 8.009765625, 8.3955078125, 8.78125, 9.1669921875, 9.552734375, 9.9384765625, 10.32421875, 10.7099609375, 11.095703125, 11.4814453125, 11.8671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 25.0, 19.0, 29.0, 39.0, 61.0, 87.0, 136.0, 181.0, 261.0, 399.0, 541.0, 806.0, 1190.0, 1760.0, 2568.0, 3943.0, 5682.0, 8706.0, 13217.0, 19997.0, 31518.0, 49226.0, 79602.0, 129428.0, 1179691.0, 238239.0, 121475.0, 74839.0, 46486.0, 29399.0, 19227.0, 12714.0, 8394.0, 5483.0, 3719.0, 2565.0, 1754.0, 1139.0, 796.0, 533.0, 396.0, 223.0, 189.0, 131.0, 98.0, 61.0, 53.0, 30.0, 23.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.55859375, -1.508209228515625, -1.45782470703125, -1.407440185546875, -1.3570556640625, -1.306671142578125, -1.25628662109375, -1.205902099609375, -1.155517578125, -1.105133056640625, -1.05474853515625, -1.004364013671875, -0.9539794921875, -0.903594970703125, -0.85321044921875, -0.802825927734375, -0.75244140625, -0.702056884765625, -0.65167236328125, -0.601287841796875, -0.5509033203125, -0.500518798828125, -0.45013427734375, -0.399749755859375, -0.349365234375, -0.298980712890625, -0.24859619140625, -0.198211669921875, -0.1478271484375, -0.097442626953125, -0.04705810546875, 0.003326416015625, 0.0537109375, 0.104095458984375, 0.15447998046875, 0.204864501953125, 0.2552490234375, 0.305633544921875, 0.35601806640625, 0.406402587890625, 0.456787109375, 0.507171630859375, 0.55755615234375, 0.607940673828125, 0.6583251953125, 0.708709716796875, 0.75909423828125, 0.809478759765625, 0.85986328125, 0.910247802734375, 0.96063232421875, 1.011016845703125, 1.0614013671875, 1.111785888671875, 1.16217041015625, 1.212554931640625, 1.262939453125, 1.313323974609375, 1.36370849609375, 1.414093017578125, 1.4644775390625, 1.514862060546875, 1.56524658203125, 1.615631103515625, 1.666015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 9.0, 12.0, 7.0, 15.0, 20.0, 31.0, 21.0, 34.0, 47.0, 57.0, 52.0, 77.0, 66.0, 88.0, 64.0, 66.0, 51.0, 50.0, 38.0, 30.0, 32.0, 22.0, 14.0, 13.0, 10.0, 10.0, 7.0, 9.0, 8.0, 2.0, 0.0, 6.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.022857666015625, -0.022141218185424805, -0.02142477035522461, -0.020708322525024414, -0.01999187469482422, -0.019275426864624023, -0.018558979034423828, -0.017842531204223633, -0.017126083374023438, -0.016409635543823242, -0.015693187713623047, -0.014976739883422852, -0.014260292053222656, -0.013543844223022461, -0.012827396392822266, -0.01211094856262207, -0.011394500732421875, -0.01067805290222168, -0.009961605072021484, -0.009245157241821289, -0.008528709411621094, -0.0078122615814208984, -0.007095813751220703, -0.006379365921020508, -0.0056629180908203125, -0.004946470260620117, -0.004230022430419922, -0.0035135746002197266, -0.0027971267700195312, -0.002080678939819336, -0.0013642311096191406, -0.0006477832794189453, 6.866455078125e-05, 0.0007851123809814453, 0.0015015602111816406, 0.002218008041381836, 0.0029344558715820312, 0.0036509037017822266, 0.004367351531982422, 0.005083799362182617, 0.0058002471923828125, 0.006516695022583008, 0.007233142852783203, 0.007949590682983398, 0.008666038513183594, 0.009382486343383789, 0.010098934173583984, 0.01081538200378418, 0.011531829833984375, 0.01224827766418457, 0.012964725494384766, 0.013681173324584961, 0.014397621154785156, 0.015114068984985352, 0.015830516815185547, 0.016546964645385742, 0.017263412475585938, 0.017979860305786133, 0.018696308135986328, 0.019412755966186523, 0.02012920379638672, 0.020845651626586914, 0.02156209945678711, 0.022278547286987305, 0.0229949951171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 3.0, 7.0, 8.0, 15.0, 18.0, 18.0, 17.0, 23.0, 28.0, 52.0, 62.0, 70.0, 98.0, 161.0, 231.0, 392.0, 809.0, 33253.0, 1009454.0, 2412.0, 477.0, 280.0, 183.0, 124.0, 67.0, 65.0, 45.0, 29.0, 27.0, 16.0, 23.0, 15.0, 15.0, 10.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.4362449645996094, -0.42229461669921875, -0.4083442687988281, -0.3943939208984375, -0.3804435729980469, -0.36649322509765625, -0.3525428771972656, -0.338592529296875, -0.3246421813964844, -0.31069183349609375, -0.2967414855957031, -0.2827911376953125, -0.2688407897949219, -0.25489044189453125, -0.24094009399414062, -0.22698974609375, -0.21303939819335938, -0.19908905029296875, -0.18513870239257812, -0.1711883544921875, -0.15723800659179688, -0.14328765869140625, -0.12933731079101562, -0.115386962890625, -0.10143661499023438, -0.08748626708984375, -0.07353591918945312, -0.0595855712890625, -0.045635223388671875, -0.03168487548828125, -0.017734527587890625, -0.0037841796875, 0.010166168212890625, 0.02411651611328125, 0.038066864013671875, 0.0520172119140625, 0.06596755981445312, 0.07991790771484375, 0.09386825561523438, 0.107818603515625, 0.12176895141601562, 0.13571929931640625, 0.14966964721679688, 0.1636199951171875, 0.17757034301757812, 0.19152069091796875, 0.20547103881835938, 0.21942138671875, 0.23337173461914062, 0.24732208251953125, 0.2612724304199219, 0.2752227783203125, 0.2891731262207031, 0.30312347412109375, 0.3170738220214844, 0.331024169921875, 0.3449745178222656, 0.35892486572265625, 0.3728752136230469, 0.3868255615234375, 0.4007759094238281, 0.41472625732421875, 0.4286766052246094, 0.442626953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 10.0, 999.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12311657518148422, -0.10840263962745667, -0.0936887115240097, -0.07897477596998215, -0.06426084041595459, -0.04954690486192703, -0.03483297675848007, -0.020119041204452515, -0.005405105650424957, 0.00930882804095745, 0.02402276173233986, 0.03873669356107712, 0.053450629115104675, 0.06816456466913223, 0.0828784927725792, 0.09759242832660675, 0.11230636388063431, 0.12702029943466187, 0.14173422753810883, 0.1564481556415558, 0.17116209864616394, 0.1858760416507721, 0.20058995485305786, 0.21530389785766602, 0.23001784086227417, 0.24473176896572113, 0.2594456970691681, 0.27415964007377625, 0.2888735830783844, 0.30358749628067017, 0.3183014392852783, 0.3330153822898865, 0.34772932529449463, 0.3624432682991028, 0.37715718150138855, 0.3918711245059967, 0.40658506751060486, 0.4212989807128906, 0.4360129237174988, 0.45072686672210693, 0.4654408097267151, 0.48015475273132324, 0.494868665933609, 0.5095826387405396, 0.5242965221405029, 0.5390104651451111, 0.5537244081497192, 0.5684383511543274, 0.5831522941589355, 0.5978662371635437, 0.6125801801681519, 0.6272940635681152, 0.6420080065727234, 0.6567219495773315, 0.6714358925819397, 0.6861498355865479, 0.7008637189865112, 0.7155776619911194, 0.7302916049957275, 0.7450054883956909, 0.7597194314002991, 0.7744333744049072, 0.7891473174095154, 0.8038612604141235, 0.8185752034187317]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 9.0, 5.0, 7.0, 12.0, 20.0, 22.0, 29.0, 37.0, 37.0, 60.0, 36.0, 62.0, 65.0, 55.0, 60.0, 60.0, 55.0, 65.0, 48.0, 51.0, 56.0, 32.0, 32.0, 18.0, 29.0, 18.0, 10.0, 8.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03972238302230835, -0.0385768823325634, -0.03743138164281845, -0.0362858846783638, -0.03514038398861885, -0.0339948832988739, -0.03284938633441925, -0.0317038856446743, -0.030558384954929352, -0.029412884265184402, -0.028267385438084602, -0.027121886610984802, -0.025976385921239853, -0.024830885231494904, -0.023685386404395103, -0.022539887577295303, -0.021394386887550354, -0.020248886197805405, -0.019103387370705605, -0.017957888543605804, -0.016812387853860855, -0.015666887164115906, -0.014521388337016106, -0.013375888578593731, -0.012230388820171356, -0.011084889061748981, -0.009939389303326607, -0.008793889544904232, -0.007648389786481857, -0.006502890028059483, -0.005357390269637108, -0.004211890511214733, -0.0030663907527923584, -0.0019208909943699837, -0.000775391235947609, 0.0003701085224747658, 0.0015156082808971405, 0.0026611080393195152, 0.00380660779774189, 0.004952107556164265, 0.006097607314586639, 0.007243107073009014, 0.008388606831431389, 0.009534106589853764, 0.010679606348276138, 0.011825106106698513, 0.012970605865120888, 0.014116105623543262, 0.015261605381965637, 0.016407106071710587, 0.017552604898810387, 0.018698103725910187, 0.019843604415655136, 0.020989105105400085, 0.022134603932499886, 0.023280102759599686, 0.024425603449344635, 0.025571104139089584, 0.026716602966189384, 0.027862101793289185, 0.029007602483034134, 0.030153103172779083, 0.031298600137233734, 0.032444100826978683, 0.03358960151672363]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 15.0, 15.0, 22.0, 19.0, 25.0, 20.0, 20.0, 34.0, 32.0, 33.0, 30.0, 40.0, 40.0, 54.0, 36.0, 38.0, 44.0, 44.0, 37.0, 35.0, 32.0, 30.0, 33.0, 33.0, 33.0, 33.0, 24.0, 21.0, 16.0, 11.0, 11.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.0, -19.35693359375, -18.7138671875, -18.07080078125, -17.427734375, -16.78466796875, -16.1416015625, -15.49853515625, -14.85546875, -14.21240234375, -13.5693359375, -12.92626953125, -12.283203125, -11.64013671875, -10.9970703125, -10.35400390625, -9.7109375, -9.06787109375, -8.4248046875, -7.78173828125, -7.138671875, -6.49560546875, -5.8525390625, -5.20947265625, -4.56640625, -3.92333984375, -3.2802734375, -2.63720703125, -1.994140625, -1.35107421875, -0.7080078125, -0.06494140625, 0.578125, 1.22119140625, 1.8642578125, 2.50732421875, 3.150390625, 3.79345703125, 4.4365234375, 5.07958984375, 5.72265625, 6.36572265625, 7.0087890625, 7.65185546875, 8.294921875, 8.93798828125, 9.5810546875, 10.22412109375, 10.8671875, 11.51025390625, 12.1533203125, 12.79638671875, 13.439453125, 14.08251953125, 14.7255859375, 15.36865234375, 16.01171875, 16.65478515625, 17.2978515625, 17.94091796875, 18.583984375, 19.22705078125, 19.8701171875, 20.51318359375, 21.15625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 4.0, 10.0, 8.0, 19.0, 20.0, 27.0, 32.0, 48.0, 74.0, 78.0, 126.0, 189.0, 251.0, 397.0, 563.0, 796.0, 1210.0, 1885.0, 2995.0, 6043.0, 16595.0, 73695.0, 609952.0, 272764.0, 38205.0, 10791.0, 4525.0, 2448.0, 1494.0, 963.0, 687.0, 480.0, 351.0, 238.0, 177.0, 109.0, 92.0, 61.0, 46.0, 26.0, 25.0, 18.0, 17.0, 3.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-49.625, -48.19921875, -46.7734375, -45.34765625, -43.921875, -42.49609375, -41.0703125, -39.64453125, -38.21875, -36.79296875, -35.3671875, -33.94140625, -32.515625, -31.08984375, -29.6640625, -28.23828125, -26.8125, -25.38671875, -23.9609375, -22.53515625, -21.109375, -19.68359375, -18.2578125, -16.83203125, -15.40625, -13.98046875, -12.5546875, -11.12890625, -9.703125, -8.27734375, -6.8515625, -5.42578125, -4.0, -2.57421875, -1.1484375, 0.27734375, 1.703125, 3.12890625, 4.5546875, 5.98046875, 7.40625, 8.83203125, 10.2578125, 11.68359375, 13.109375, 14.53515625, 15.9609375, 17.38671875, 18.8125, 20.23828125, 21.6640625, 23.08984375, 24.515625, 25.94140625, 27.3671875, 28.79296875, 30.21875, 31.64453125, 33.0703125, 34.49609375, 35.921875, 37.34765625, 38.7734375, 40.19921875, 41.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 4.0, 15.0, 25.0, 28.0, 20.0, 36.0, 29.0, 43.0, 50.0, 66.0, 58.0, 101.0, 209.0, 1598.0, 229.0, 96.0, 89.0, 49.0, 50.0, 23.0, 34.0, 32.0, 24.0, 20.0, 13.0, 10.0, 13.0, 11.0, 12.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.75, -64.7607421875, -62.771484375, -60.7822265625, -58.79296875, -56.8037109375, -54.814453125, -52.8251953125, -50.8359375, -48.8466796875, -46.857421875, -44.8681640625, -42.87890625, -40.8896484375, -38.900390625, -36.9111328125, -34.921875, -32.9326171875, -30.943359375, -28.9541015625, -26.96484375, -24.9755859375, -22.986328125, -20.9970703125, -19.0078125, -17.0185546875, -15.029296875, -13.0400390625, -11.05078125, -9.0615234375, -7.072265625, -5.0830078125, -3.09375, -1.1044921875, 0.884765625, 2.8740234375, 4.86328125, 6.8525390625, 8.841796875, 10.8310546875, 12.8203125, 14.8095703125, 16.798828125, 18.7880859375, 20.77734375, 22.7666015625, 24.755859375, 26.7451171875, 28.734375, 30.7236328125, 32.712890625, 34.7021484375, 36.69140625, 38.6806640625, 40.669921875, 42.6591796875, 44.6484375, 46.6376953125, 48.626953125, 50.6162109375, 52.60546875, 54.5947265625, 56.583984375, 58.5732421875, 60.5625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 7.0, 8.0, 6.0, 9.0, 10.0, 16.0, 11.0, 25.0, 31.0, 45.0, 47.0, 77.0, 73.0, 127.0, 187.0, 329.0, 659.0, 1552.0, 48351.0, 3085663.0, 5958.0, 1074.0, 493.0, 285.0, 168.0, 115.0, 93.0, 68.0, 59.0, 41.0, 24.0, 17.0, 19.0, 16.0, 7.0, 10.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-168.25, -163.041015625, -157.83203125, -152.623046875, -147.4140625, -142.205078125, -136.99609375, -131.787109375, -126.578125, -121.369140625, -116.16015625, -110.951171875, -105.7421875, -100.533203125, -95.32421875, -90.115234375, -84.90625, -79.697265625, -74.48828125, -69.279296875, -64.0703125, -58.861328125, -53.65234375, -48.443359375, -43.234375, -38.025390625, -32.81640625, -27.607421875, -22.3984375, -17.189453125, -11.98046875, -6.771484375, -1.5625, 3.646484375, 8.85546875, 14.064453125, 19.2734375, 24.482421875, 29.69140625, 34.900390625, 40.109375, 45.318359375, 50.52734375, 55.736328125, 60.9453125, 66.154296875, 71.36328125, 76.572265625, 81.78125, 86.990234375, 92.19921875, 97.408203125, 102.6171875, 107.826171875, 113.03515625, 118.244140625, 123.453125, 128.662109375, 133.87109375, 139.080078125, 144.2890625, 149.498046875, 154.70703125, 159.916015625, 165.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 12.0, 42.0, 80.0, 199.0, 303.0, 218.0, 101.0, 34.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.7008972167969, -263.5650329589844, -255.42913818359375, -247.2932586669922, -239.15737915039062, -231.02151489257812, -222.88563537597656, -214.749755859375, -206.61387634277344, -198.47799682617188, -190.3421173095703, -182.20623779296875, -174.07037353515625, -165.93447875976562, -157.79861450195312, -149.66273498535156, -141.52685546875, -133.39097595214844, -125.25509643554688, -117.11922454833984, -108.98334503173828, -100.84746551513672, -92.71159362792969, -84.57571411132812, -76.43983459472656, -68.303955078125, -60.1680793762207, -52.032203674316406, -43.896324157714844, -35.76044464111328, -27.624568939208984, -19.488693237304688, -11.352828979492188, -3.216951370239258, 4.918926239013672, 13.054803848266602, 21.19068145751953, 29.326560974121094, 37.46243667602539, 45.59831237792969, 53.73419189453125, 61.87007141113281, 70.00595092773438, 78.1418228149414, 86.27770233154297, 94.41358184814453, 102.54945373535156, 110.68533325195312, 118.82121276855469, 126.95709228515625, 135.0929718017578, 143.22885131835938, 151.36471557617188, 159.5006103515625, 167.636474609375, 175.77235412597656, 183.90823364257812, 192.0441131591797, 200.17999267578125, 208.3158721923828, 216.45175170898438, 224.58761596679688, 232.72349548339844, 240.859375, 248.99525451660156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 2.0, 3.0, 8.0, 11.0, 10.0, 10.0, 14.0, 21.0, 15.0, 26.0, 26.0, 39.0, 30.0, 37.0, 41.0, 29.0, 43.0, 49.0, 53.0, 60.0, 51.0, 48.0, 34.0, 40.0, 44.0, 28.0, 38.0, 33.0, 22.0, 26.0, 17.0, 16.0, 16.0, 17.0, 8.0, 8.0, 3.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-179.334228515625, -173.6168670654297, -167.89950561523438, -162.18214416503906, -156.46478271484375, -150.74742126464844, -145.03005981445312, -139.31268310546875, -133.5953369140625, -127.87797546386719, -122.16061401367188, -116.44325256347656, -110.72589111328125, -105.00852966308594, -99.2911605834961, -93.57379913330078, -87.85643005371094, -82.13906860351562, -76.42170715332031, -70.704345703125, -64.98698425292969, -59.26961898803711, -53.55225372314453, -47.83489227294922, -42.117530822753906, -36.400169372558594, -30.68280601501465, -24.965442657470703, -19.24808120727539, -13.530719757080078, -7.8133544921875, -2.0959930419921875, 3.621368408203125, 9.338730812072754, 15.056093215942383, 20.773456573486328, 26.49081802368164, 32.20817947387695, 37.92554473876953, 43.642906188964844, 49.360267639160156, 55.07762908935547, 60.79499053955078, 66.51235961914062, 72.22972106933594, 77.94708251953125, 83.66444396972656, 89.38180541992188, 95.09916687011719, 100.8165283203125, 106.53388977050781, 112.25125122070312, 117.96861267089844, 123.68597412109375, 129.40335083007812, 135.12069702148438, 140.83807373046875, 146.55543518066406, 152.27279663085938, 157.9901580810547, 163.70751953125, 169.4248809814453, 175.14224243164062, 180.859619140625, 186.57696533203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 10.0, 23.0, 12.0, 15.0, 21.0, 23.0, 25.0, 37.0, 24.0, 29.0, 25.0, 26.0, 39.0, 36.0, 32.0, 37.0, 49.0, 33.0, 43.0, 33.0, 40.0, 36.0, 42.0, 27.0, 34.0, 31.0, 30.0, 18.0, 21.0, 16.0, 22.0, 11.0, 14.0, 10.0, 10.0, 8.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.8125, -20.165283203125, -19.51806640625, -18.870849609375, -18.2236328125, -17.576416015625, -16.92919921875, -16.281982421875, -15.634765625, -14.987548828125, -14.34033203125, -13.693115234375, -13.0458984375, -12.398681640625, -11.75146484375, -11.104248046875, -10.45703125, -9.809814453125, -9.16259765625, -8.515380859375, -7.8681640625, -7.220947265625, -6.57373046875, -5.926513671875, -5.279296875, -4.632080078125, -3.98486328125, -3.337646484375, -2.6904296875, -2.043212890625, -1.39599609375, -0.748779296875, -0.1015625, 0.545654296875, 1.19287109375, 1.840087890625, 2.4873046875, 3.134521484375, 3.78173828125, 4.428955078125, 5.076171875, 5.723388671875, 6.37060546875, 7.017822265625, 7.6650390625, 8.312255859375, 8.95947265625, 9.606689453125, 10.25390625, 10.901123046875, 11.54833984375, 12.195556640625, 12.8427734375, 13.489990234375, 14.13720703125, 14.784423828125, 15.431640625, 16.078857421875, 16.72607421875, 17.373291015625, 18.0205078125, 18.667724609375, 19.31494140625, 19.962158203125, 20.609375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 12.0, 15.0, 14.0, 30.0, 19.0, 32.0, 50.0, 57.0, 71.0, 96.0, 107.0, 160.0, 214.0, 308.0, 429.0, 650.0, 981.0, 1741.0, 3518.0, 9691.0, 53385.0, 656224.0, 2800580.0, 603667.0, 44764.0, 8889.0, 3544.0, 1760.0, 1015.0, 652.0, 421.0, 313.0, 205.0, 169.0, 109.0, 96.0, 56.0, 57.0, 32.0, 29.0, 30.0, 17.0, 13.0, 11.0, 11.0, 11.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-40.9375, -39.548828125, -38.16015625, -36.771484375, -35.3828125, -33.994140625, -32.60546875, -31.216796875, -29.828125, -28.439453125, -27.05078125, -25.662109375, -24.2734375, -22.884765625, -21.49609375, -20.107421875, -18.71875, -17.330078125, -15.94140625, -14.552734375, -13.1640625, -11.775390625, -10.38671875, -8.998046875, -7.609375, -6.220703125, -4.83203125, -3.443359375, -2.0546875, -0.666015625, 0.72265625, 2.111328125, 3.5, 4.888671875, 6.27734375, 7.666015625, 9.0546875, 10.443359375, 11.83203125, 13.220703125, 14.609375, 15.998046875, 17.38671875, 18.775390625, 20.1640625, 21.552734375, 22.94140625, 24.330078125, 25.71875, 27.107421875, 28.49609375, 29.884765625, 31.2734375, 32.662109375, 34.05078125, 35.439453125, 36.828125, 38.216796875, 39.60546875, 40.994140625, 42.3828125, 43.771484375, 45.16015625, 46.548828125, 47.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 11.0, 21.0, 24.0, 56.0, 147.0, 267.0, 720.0, 1365.0, 861.0, 320.0, 147.0, 73.0, 33.0, 17.0, 12.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.8125, -71.0439453125, -68.275390625, -65.5068359375, -62.73828125, -59.9697265625, -57.201171875, -54.4326171875, -51.6640625, -48.8955078125, -46.126953125, -43.3583984375, -40.58984375, -37.8212890625, -35.052734375, -32.2841796875, -29.515625, -26.7470703125, -23.978515625, -21.2099609375, -18.44140625, -15.6728515625, -12.904296875, -10.1357421875, -7.3671875, -4.5986328125, -1.830078125, 0.9384765625, 3.70703125, 6.4755859375, 9.244140625, 12.0126953125, 14.78125, 17.5498046875, 20.318359375, 23.0869140625, 25.85546875, 28.6240234375, 31.392578125, 34.1611328125, 36.9296875, 39.6982421875, 42.466796875, 45.2353515625, 48.00390625, 50.7724609375, 53.541015625, 56.3095703125, 59.078125, 61.8466796875, 64.615234375, 67.3837890625, 70.15234375, 72.9208984375, 75.689453125, 78.4580078125, 81.2265625, 83.9951171875, 86.763671875, 89.5322265625, 92.30078125, 95.0693359375, 97.837890625, 100.6064453125, 103.375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 27.0, 54.0, 161.0, 458.0, 1837.0, 121808.0, 4061301.0, 7277.0, 851.0, 322.0, 103.0, 36.0, 18.0, 12.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.0, -234.529296875, -228.05859375, -221.587890625, -215.1171875, -208.646484375, -202.17578125, -195.705078125, -189.234375, -182.763671875, -176.29296875, -169.822265625, -163.3515625, -156.880859375, -150.41015625, -143.939453125, -137.46875, -130.998046875, -124.52734375, -118.056640625, -111.5859375, -105.115234375, -98.64453125, -92.173828125, -85.703125, -79.232421875, -72.76171875, -66.291015625, -59.8203125, -53.349609375, -46.87890625, -40.408203125, -33.9375, -27.466796875, -20.99609375, -14.525390625, -8.0546875, -1.583984375, 4.88671875, 11.357421875, 17.828125, 24.298828125, 30.76953125, 37.240234375, 43.7109375, 50.181640625, 56.65234375, 63.123046875, 69.59375, 76.064453125, 82.53515625, 89.005859375, 95.4765625, 101.947265625, 108.41796875, 114.888671875, 121.359375, 127.830078125, 134.30078125, 140.771484375, 147.2421875, 153.712890625, 160.18359375, 166.654296875, 173.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 38.0, 152.0, 431.0, 288.0, 79.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-599.0835571289062, -583.9814453125, -568.87939453125, -553.77734375, -538.6752319335938, -523.5731201171875, -508.4710693359375, -493.3689880371094, -478.26690673828125, -463.1648254394531, -448.062744140625, -432.9606628417969, -417.85858154296875, -402.7565002441406, -387.6544189453125, -372.5523376464844, -357.45025634765625, -342.3481750488281, -327.24609375, -312.1440124511719, -297.04193115234375, -281.9398498535156, -266.8377685546875, -251.73568725585938, -236.63360595703125, -221.53152465820312, -206.429443359375, -191.32736206054688, -176.22528076171875, -161.12319946289062, -146.0211181640625, -130.91903686523438, -115.81695556640625, -100.71487426757812, -85.61279296875, -70.51071166992188, -55.40863037109375, -40.306549072265625, -25.2044677734375, -10.102386474609375, 4.99969482421875, 20.101776123046875, 35.203857421875, 50.305938720703125, 65.40802001953125, 80.51010131835938, 95.6121826171875, 110.71426391601562, 125.81634521484375, 140.91842651367188, 156.0205078125, 171.12258911132812, 186.22467041015625, 201.32675170898438, 216.4288330078125, 231.53091430664062, 246.63299560546875, 261.7350769042969, 276.837158203125, 291.9392395019531, 307.04132080078125, 322.1434020996094, 337.2454833984375, 352.3475646972656, 367.44964599609375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 2.0, 12.0, 5.0, 8.0, 12.0, 16.0, 16.0, 18.0, 20.0, 25.0, 35.0, 23.0, 31.0, 33.0, 35.0, 41.0, 37.0, 34.0, 41.0, 46.0, 53.0, 41.0, 40.0, 28.0, 28.0, 45.0, 29.0, 33.0, 33.0, 27.0, 15.0, 20.0, 18.0, 17.0, 13.0, 12.0, 14.0, 8.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.4825439453125, -111.51422119140625, -107.5458984375, -103.57757568359375, -99.6092529296875, -95.64093017578125, -91.67259979248047, -87.70427703857422, -83.73595428466797, -79.76763153076172, -75.79930877685547, -71.83098602294922, -67.86265563964844, -63.89433670043945, -59.92601013183594, -55.95768737792969, -51.98936462402344, -48.02104187011719, -44.05271911621094, -40.08439254760742, -36.11606979370117, -32.14774703979492, -28.17942237854004, -24.211097717285156, -20.242774963378906, -16.274452209472656, -12.306127548217773, -8.337803840637207, -4.369480133056641, -0.4011573791503906, 3.567167282104492, 7.535491943359375, 11.503814697265625, 15.472138404846191, 19.440462112426758, 23.40878677368164, 27.37710952758789, 31.34543228149414, 35.313758850097656, 39.282081604003906, 43.250404357910156, 47.218727111816406, 51.187049865722656, 55.15537643432617, 59.12369918823242, 63.09202194213867, 67.06034851074219, 71.02867126464844, 74.99699401855469, 78.96531677246094, 82.93363952636719, 86.90196228027344, 90.87028503417969, 94.83860778808594, 98.80693817138672, 102.77526092529297, 106.74358367919922, 110.71190643310547, 114.68022918701172, 118.64855194091797, 122.61688232421875, 126.585205078125, 130.55352783203125, 134.5218505859375, 138.49017333984375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 23.0, 20.0, 14.0, 33.0, 18.0, 32.0, 30.0, 22.0, 26.0, 27.0, 30.0, 32.0, 30.0, 32.0, 39.0, 25.0, 30.0, 46.0, 41.0, 36.0, 40.0, 27.0, 31.0, 24.0, 26.0, 21.0, 26.0, 21.0, 16.0, 14.0, 17.0, 10.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.171875, -14.683837890625, -14.19580078125, -13.707763671875, -13.2197265625, -12.731689453125, -12.24365234375, -11.755615234375, -11.267578125, -10.779541015625, -10.29150390625, -9.803466796875, -9.3154296875, -8.827392578125, -8.33935546875, -7.851318359375, -7.36328125, -6.875244140625, -6.38720703125, -5.899169921875, -5.4111328125, -4.923095703125, -4.43505859375, -3.947021484375, -3.458984375, -2.970947265625, -2.48291015625, -1.994873046875, -1.5068359375, -1.018798828125, -0.53076171875, -0.042724609375, 0.4453125, 0.933349609375, 1.42138671875, 1.909423828125, 2.3974609375, 2.885498046875, 3.37353515625, 3.861572265625, 4.349609375, 4.837646484375, 5.32568359375, 5.813720703125, 6.3017578125, 6.789794921875, 7.27783203125, 7.765869140625, 8.25390625, 8.741943359375, 9.22998046875, 9.718017578125, 10.2060546875, 10.694091796875, 11.18212890625, 11.670166015625, 12.158203125, 12.646240234375, 13.13427734375, 13.622314453125, 14.1103515625, 14.598388671875, 15.08642578125, 15.574462890625, 16.0625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 8.0, 8.0, 20.0, 28.0, 33.0, 57.0, 77.0, 127.0, 182.0, 306.0, 529.0, 836.0, 1422.0, 2339.0, 3734.0, 6452.0, 10798.0, 18436.0, 32465.0, 56990.0, 105996.0, 204383.0, 262825.0, 154733.0, 80533.0, 44066.0, 25198.0, 14468.0, 8581.0, 5065.0, 3094.0, 1854.0, 1099.0, 674.0, 431.0, 258.0, 145.0, 116.0, 66.0, 45.0, 21.0, 22.0, 12.0, 11.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.211578369140625, -2.13604736328125, -2.060516357421875, -1.9849853515625, -1.909454345703125, -1.83392333984375, -1.758392333984375, -1.682861328125, -1.607330322265625, -1.53179931640625, -1.456268310546875, -1.3807373046875, -1.305206298828125, -1.22967529296875, -1.154144287109375, -1.07861328125, -1.003082275390625, -0.92755126953125, -0.852020263671875, -0.7764892578125, -0.700958251953125, -0.62542724609375, -0.549896240234375, -0.474365234375, -0.398834228515625, -0.32330322265625, -0.247772216796875, -0.1722412109375, -0.096710205078125, -0.02117919921875, 0.054351806640625, 0.1298828125, 0.205413818359375, 0.28094482421875, 0.356475830078125, 0.4320068359375, 0.507537841796875, 0.58306884765625, 0.658599853515625, 0.734130859375, 0.809661865234375, 0.88519287109375, 0.960723876953125, 1.0362548828125, 1.111785888671875, 1.18731689453125, 1.262847900390625, 1.33837890625, 1.413909912109375, 1.48944091796875, 1.564971923828125, 1.6405029296875, 1.716033935546875, 1.79156494140625, 1.867095947265625, 1.942626953125, 2.018157958984375, 2.09368896484375, 2.169219970703125, 2.2447509765625, 2.320281982421875, 2.39581298828125, 2.471343994140625, 2.546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 11.0, 9.0, 10.0, 15.0, 17.0, 12.0, 21.0, 28.0, 34.0, 32.0, 30.0, 41.0, 26.0, 34.0, 42.0, 26.0, 37.0, 37.0, 1064.0, 43.0, 46.0, 30.0, 26.0, 28.0, 40.0, 33.0, 26.0, 25.0, 16.0, 22.0, 16.0, 18.0, 10.0, 12.0, 13.0, 10.0, 13.0, 10.0, 5.0, 6.0, 9.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.171875, -9.8216552734375, -9.471435546875, -9.1212158203125, -8.77099609375, -8.4207763671875, -8.070556640625, -7.7203369140625, -7.3701171875, -7.0198974609375, -6.669677734375, -6.3194580078125, -5.96923828125, -5.6190185546875, -5.268798828125, -4.9185791015625, -4.568359375, -4.2181396484375, -3.867919921875, -3.5177001953125, -3.16748046875, -2.8172607421875, -2.467041015625, -2.1168212890625, -1.7666015625, -1.4163818359375, -1.066162109375, -0.7159423828125, -0.36572265625, -0.0155029296875, 0.334716796875, 0.6849365234375, 1.03515625, 1.3853759765625, 1.735595703125, 2.0858154296875, 2.43603515625, 2.7862548828125, 3.136474609375, 3.4866943359375, 3.8369140625, 4.1871337890625, 4.537353515625, 4.8875732421875, 5.23779296875, 5.5880126953125, 5.938232421875, 6.2884521484375, 6.638671875, 6.9888916015625, 7.339111328125, 7.6893310546875, 8.03955078125, 8.3897705078125, 8.739990234375, 9.0902099609375, 9.4404296875, 9.7906494140625, 10.140869140625, 10.4910888671875, 10.84130859375, 11.1915283203125, 11.541748046875, 11.8919677734375, 12.2421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 6.0, 20.0, 20.0, 27.0, 51.0, 65.0, 58.0, 98.0, 174.0, 250.0, 370.0, 487.0, 693.0, 1020.0, 1465.0, 2236.0, 3074.0, 4553.0, 6771.0, 9794.0, 14651.0, 21759.0, 34059.0, 54041.0, 86727.0, 139773.0, 1246072.0, 170646.0, 108085.0, 66791.0, 41885.0, 26905.0, 17598.0, 11627.0, 7823.0, 5448.0, 3825.0, 2547.0, 1682.0, 1235.0, 806.0, 574.0, 415.0, 285.0, 193.0, 154.0, 98.0, 61.0, 44.0, 29.0, 15.0, 13.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0], "bins": [-1.45703125, -1.412506103515625, -1.36798095703125, -1.323455810546875, -1.2789306640625, -1.234405517578125, -1.18988037109375, -1.145355224609375, -1.100830078125, -1.056304931640625, -1.01177978515625, -0.967254638671875, -0.9227294921875, -0.878204345703125, -0.83367919921875, -0.789154052734375, -0.74462890625, -0.700103759765625, -0.65557861328125, -0.611053466796875, -0.5665283203125, -0.522003173828125, -0.47747802734375, -0.432952880859375, -0.388427734375, -0.343902587890625, -0.29937744140625, -0.254852294921875, -0.2103271484375, -0.165802001953125, -0.12127685546875, -0.076751708984375, -0.0322265625, 0.012298583984375, 0.05682373046875, 0.101348876953125, 0.1458740234375, 0.190399169921875, 0.23492431640625, 0.279449462890625, 0.323974609375, 0.368499755859375, 0.41302490234375, 0.457550048828125, 0.5020751953125, 0.546600341796875, 0.59112548828125, 0.635650634765625, 0.68017578125, 0.724700927734375, 0.76922607421875, 0.813751220703125, 0.8582763671875, 0.902801513671875, 0.94732666015625, 0.991851806640625, 1.036376953125, 1.080902099609375, 1.12542724609375, 1.169952392578125, 1.2144775390625, 1.259002685546875, 1.30352783203125, 1.348052978515625, 1.392578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 1.0, 4.0, 7.0, 7.0, 21.0, 19.0, 19.0, 34.0, 32.0, 23.0, 28.0, 43.0, 45.0, 61.0, 91.0, 94.0, 92.0, 57.0, 63.0, 41.0, 46.0, 35.0, 28.0, 21.0, 11.0, 13.0, 15.0, 17.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02557373046875, -0.024890661239624023, -0.024207592010498047, -0.02352452278137207, -0.022841453552246094, -0.022158384323120117, -0.02147531509399414, -0.020792245864868164, -0.020109176635742188, -0.01942610740661621, -0.018743038177490234, -0.018059968948364258, -0.01737689971923828, -0.016693830490112305, -0.016010761260986328, -0.015327692031860352, -0.014644622802734375, -0.013961553573608398, -0.013278484344482422, -0.012595415115356445, -0.011912345886230469, -0.011229276657104492, -0.010546207427978516, -0.009863138198852539, -0.009180068969726562, -0.008496999740600586, -0.00781393051147461, -0.007130861282348633, -0.006447792053222656, -0.00576472282409668, -0.005081653594970703, -0.0043985843658447266, -0.00371551513671875, -0.0030324459075927734, -0.002349376678466797, -0.0016663074493408203, -0.0009832382202148438, -0.0003001689910888672, 0.0003829002380371094, 0.001065969467163086, 0.0017490386962890625, 0.002432107925415039, 0.0031151771545410156, 0.003798246383666992, 0.004481315612792969, 0.005164384841918945, 0.005847454071044922, 0.0065305233001708984, 0.007213592529296875, 0.007896661758422852, 0.008579730987548828, 0.009262800216674805, 0.009945869445800781, 0.010628938674926758, 0.011312007904052734, 0.011995077133178711, 0.012678146362304688, 0.013361215591430664, 0.01404428482055664, 0.014727354049682617, 0.015410423278808594, 0.01609349250793457, 0.016776561737060547, 0.017459630966186523, 0.0181427001953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 7.0, 12.0, 19.0, 16.0, 29.0, 37.0, 41.0, 62.0, 79.0, 143.0, 207.0, 333.0, 601.0, 3497.0, 1038680.0, 3221.0, 589.0, 318.0, 195.0, 125.0, 99.0, 67.0, 53.0, 40.0, 27.0, 11.0, 12.0, 8.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3599090576171875, -0.345794677734375, -0.3316802978515625, -0.31756591796875, -0.3034515380859375, -0.289337158203125, -0.2752227783203125, -0.2611083984375, -0.2469940185546875, -0.232879638671875, -0.2187652587890625, -0.20465087890625, -0.1905364990234375, -0.176422119140625, -0.1623077392578125, -0.148193359375, -0.1340789794921875, -0.119964599609375, -0.1058502197265625, -0.09173583984375, -0.0776214599609375, -0.063507080078125, -0.0493927001953125, -0.0352783203125, -0.0211639404296875, -0.007049560546875, 0.0070648193359375, 0.02117919921875, 0.0352935791015625, 0.049407958984375, 0.0635223388671875, 0.07763671875, 0.0917510986328125, 0.105865478515625, 0.1199798583984375, 0.13409423828125, 0.1482086181640625, 0.162322998046875, 0.1764373779296875, 0.1905517578125, 0.2046661376953125, 0.218780517578125, 0.2328948974609375, 0.24700927734375, 0.2611236572265625, 0.275238037109375, 0.2893524169921875, 0.303466796875, 0.3175811767578125, 0.331695556640625, 0.3458099365234375, 0.35992431640625, 0.3740386962890625, 0.388153076171875, 0.4022674560546875, 0.4163818359375, 0.4304962158203125, 0.444610595703125, 0.4587249755859375, 0.47283935546875, 0.4869537353515625, 0.501068115234375, 0.5151824951171875, 0.529296875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 947.0, 62.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07114312052726746, -0.06445673853158951, -0.05777035653591156, -0.05108397454023361, -0.044397592544555664, -0.037711214274168015, -0.031024832278490067, -0.02433845028281212, -0.01765206828713417, -0.010965686291456223, -0.004279305227100849, 0.0024070758372545242, 0.009093457832932472, 0.01577983796596527, 0.02246621996164322, 0.029152601957321167, 0.035838983952999115, 0.04252536594867706, 0.04921174794435501, 0.05589812994003296, 0.06258451193571091, 0.06927089393138885, 0.0759572684764862, 0.08264365792274475, 0.0893300324678421, 0.09601641446352005, 0.102702796459198, 0.10938917845487595, 0.1160755604505539, 0.12276193499565125, 0.1294483244419098, 0.13613469898700714, 0.14282108843326569, 0.14950746297836304, 0.15619385242462158, 0.16288022696971893, 0.16956661641597748, 0.17625299096107483, 0.18293938040733337, 0.18962575495243073, 0.19631214439868927, 0.20299851894378662, 0.20968490839004517, 0.21637128293514252, 0.22305767238140106, 0.2297440469264984, 0.23643043637275696, 0.2431168109178543, 0.24980318546295166, 0.2564895749092102, 0.26317593455314636, 0.2698623239994049, 0.27654871344566345, 0.283235102891922, 0.28992146253585815, 0.2966078519821167, 0.30329424142837524, 0.3099806308746338, 0.31666699051856995, 0.3233533799648285, 0.33003976941108704, 0.3367261588573456, 0.34341251850128174, 0.3500989079475403, 0.35678529739379883]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 8.0, 17.0, 25.0, 26.0, 36.0, 36.0, 46.0, 41.0, 38.0, 46.0, 44.0, 57.0, 53.0, 53.0, 51.0, 48.0, 45.0, 59.0, 37.0, 33.0, 40.0, 35.0, 27.0, 20.0, 19.0, 12.0, 9.0, 1.0, 6.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.026851892471313477, -0.026176083832979202, -0.025500277057290077, -0.024824470281600952, -0.024148661643266678, -0.023472853004932404, -0.02279704622924328, -0.022121239453554153, -0.02144543081521988, -0.020769622176885605, -0.02009381540119648, -0.019418008625507355, -0.01874219998717308, -0.018066391348838806, -0.01739058457314968, -0.016714777797460556, -0.016038969159126282, -0.015363161452114582, -0.014687353745102882, -0.014011546038091183, -0.013335738331079483, -0.012659930624067783, -0.011984122917056084, -0.011308315210044384, -0.010632507503032684, -0.009956699796020985, -0.009280892089009285, -0.008605084381997585, -0.007929276674985886, -0.007253468967974186, -0.006577661260962486, -0.005901853553950787, -0.005226045846939087, -0.004550238139927387, -0.0038744304329156876, -0.003198622725903988, -0.002522815018892288, -0.0018470073118805885, -0.0011711996048688889, -0.0004953918978571892, 0.0001804158091545105, 0.0008562235161662102, 0.0015320312231779099, 0.0022078389301896095, 0.002883646637201309, 0.003559454344213009, 0.0042352620512247086, 0.004911069758236408, 0.005586877465248108, 0.006262685172259808, 0.006938492879271507, 0.007614300586283207, 0.008290108293294907, 0.008965916000306606, 0.009641723707318306, 0.010317531414330006, 0.010993339121341705, 0.011669146828353405, 0.012344954535365105, 0.013020762242376804, 0.013696569949388504, 0.014372377656400204, 0.015048185363411903, 0.01572399213910103, 0.016399800777435303]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 21.0, 22.0, 14.0, 33.0, 16.0, 32.0, 32.0, 22.0, 26.0, 27.0, 30.0, 32.0, 30.0, 31.0, 40.0, 24.0, 31.0, 46.0, 40.0, 37.0, 40.0, 27.0, 31.0, 24.0, 26.0, 21.0, 26.0, 21.0, 15.0, 15.0, 17.0, 10.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.1796875, -14.6915283203125, -14.203369140625, -13.7152099609375, -13.22705078125, -12.7388916015625, -12.250732421875, -11.7625732421875, -11.2744140625, -10.7862548828125, -10.298095703125, -9.8099365234375, -9.32177734375, -8.8336181640625, -8.345458984375, -7.8572998046875, -7.369140625, -6.8809814453125, -6.392822265625, -5.9046630859375, -5.41650390625, -4.9283447265625, -4.440185546875, -3.9520263671875, -3.4638671875, -2.9757080078125, -2.487548828125, -1.9993896484375, -1.51123046875, -1.0230712890625, -0.534912109375, -0.0467529296875, 0.44140625, 0.9295654296875, 1.417724609375, 1.9058837890625, 2.39404296875, 2.8822021484375, 3.370361328125, 3.8585205078125, 4.3466796875, 4.8348388671875, 5.322998046875, 5.8111572265625, 6.29931640625, 6.7874755859375, 7.275634765625, 7.7637939453125, 8.251953125, 8.7401123046875, 9.228271484375, 9.7164306640625, 10.20458984375, 10.6927490234375, 11.180908203125, 11.6690673828125, 12.1572265625, 12.6453857421875, 13.133544921875, 13.6217041015625, 14.10986328125, 14.5980224609375, 15.086181640625, 15.5743408203125, 16.0625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 11.0, 5.0, 12.0, 10.0, 17.0, 22.0, 16.0, 30.0, 32.0, 55.0, 58.0, 80.0, 129.0, 155.0, 205.0, 329.0, 463.0, 711.0, 1090.0, 1818.0, 3378.0, 7372.0, 20405.0, 78747.0, 447851.0, 384090.0, 68254.0, 18288.0, 6700.0, 3213.0, 1722.0, 1061.0, 672.0, 442.0, 313.0, 200.0, 162.0, 98.0, 81.0, 52.0, 56.0, 29.0, 25.0, 21.0, 23.0, 17.0, 8.0, 6.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.796875, -25.958251953125, -25.11962890625, -24.281005859375, -23.4423828125, -22.603759765625, -21.76513671875, -20.926513671875, -20.087890625, -19.249267578125, -18.41064453125, -17.572021484375, -16.7333984375, -15.894775390625, -15.05615234375, -14.217529296875, -13.37890625, -12.540283203125, -11.70166015625, -10.863037109375, -10.0244140625, -9.185791015625, -8.34716796875, -7.508544921875, -6.669921875, -5.831298828125, -4.99267578125, -4.154052734375, -3.3154296875, -2.476806640625, -1.63818359375, -0.799560546875, 0.0390625, 0.877685546875, 1.71630859375, 2.554931640625, 3.3935546875, 4.232177734375, 5.07080078125, 5.909423828125, 6.748046875, 7.586669921875, 8.42529296875, 9.263916015625, 10.1025390625, 10.941162109375, 11.77978515625, 12.618408203125, 13.45703125, 14.295654296875, 15.13427734375, 15.972900390625, 16.8115234375, 17.650146484375, 18.48876953125, 19.327392578125, 20.166015625, 21.004638671875, 21.84326171875, 22.681884765625, 23.5205078125, 24.359130859375, 25.19775390625, 26.036376953125, 26.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 3.0, 7.0, 10.0, 17.0, 23.0, 26.0, 26.0, 15.0, 34.0, 55.0, 60.0, 76.0, 131.0, 354.0, 1574.0, 159.0, 97.0, 84.0, 56.0, 53.0, 41.0, 31.0, 23.0, 17.0, 8.0, 17.0, 7.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.36865234375, -55.3310546875, -53.29345703125, -51.255859375, -49.21826171875, -47.1806640625, -45.14306640625, -43.10546875, -41.06787109375, -39.0302734375, -36.99267578125, -34.955078125, -32.91748046875, -30.8798828125, -28.84228515625, -26.8046875, -24.76708984375, -22.7294921875, -20.69189453125, -18.654296875, -16.61669921875, -14.5791015625, -12.54150390625, -10.50390625, -8.46630859375, -6.4287109375, -4.39111328125, -2.353515625, -0.31591796875, 1.7216796875, 3.75927734375, 5.796875, 7.83447265625, 9.8720703125, 11.90966796875, 13.947265625, 15.98486328125, 18.0224609375, 20.06005859375, 22.09765625, 24.13525390625, 26.1728515625, 28.21044921875, 30.248046875, 32.28564453125, 34.3232421875, 36.36083984375, 38.3984375, 40.43603515625, 42.4736328125, 44.51123046875, 46.548828125, 48.58642578125, 50.6240234375, 52.66162109375, 54.69921875, 56.73681640625, 58.7744140625, 60.81201171875, 62.849609375, 64.88720703125, 66.9248046875, 68.96240234375, 71.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 9.0, 10.0, 9.0, 15.0, 16.0, 38.0, 43.0, 79.0, 113.0, 246.0, 453.0, 1272.0, 98589.0, 3041483.0, 2119.0, 529.0, 268.0, 135.0, 88.0, 53.0, 29.0, 39.0, 17.0, 12.0, 6.0, 4.0, 14.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-193.25, -187.751953125, -182.25390625, -176.755859375, -171.2578125, -165.759765625, -160.26171875, -154.763671875, -149.265625, -143.767578125, -138.26953125, -132.771484375, -127.2734375, -121.775390625, -116.27734375, -110.779296875, -105.28125, -99.783203125, -94.28515625, -88.787109375, -83.2890625, -77.791015625, -72.29296875, -66.794921875, -61.296875, -55.798828125, -50.30078125, -44.802734375, -39.3046875, -33.806640625, -28.30859375, -22.810546875, -17.3125, -11.814453125, -6.31640625, -0.818359375, 4.6796875, 10.177734375, 15.67578125, 21.173828125, 26.671875, 32.169921875, 37.66796875, 43.166015625, 48.6640625, 54.162109375, 59.66015625, 65.158203125, 70.65625, 76.154296875, 81.65234375, 87.150390625, 92.6484375, 98.146484375, 103.64453125, 109.142578125, 114.640625, 120.138671875, 125.63671875, 131.134765625, 136.6328125, 142.130859375, 147.62890625, 153.126953125, 158.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [3.0, 457.0, 546.0, 11.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.125770568847656, -26.121835708618164, -0.11790084838867188, 25.886032104492188, 51.88996887207031, 77.8938980102539, 103.89783477783203, 129.90176391601562, 155.90570068359375, 181.90963745117188, 207.91357421875, 233.91751098632812, 259.92144775390625, 285.92535400390625, 311.9293212890625, 337.9332275390625, 363.93719482421875, 389.9411315917969, 415.945068359375, 441.9490051269531, 467.95294189453125, 493.95684814453125, 519.9608154296875, 545.9647216796875, 571.9686889648438, 597.9725952148438, 623.9765625, 649.98046875, 675.9844360351562, 701.9883422851562, 727.9923095703125, 753.9962158203125, 780.0001831054688, 806.0040893554688, 832.008056640625, 858.011962890625, 884.0159301757812, 910.0198364257812, 936.0238037109375, 962.0277099609375, 988.0316772460938, 1014.0355834960938, 1040.03955078125, 1066.04345703125, 1092.04736328125, 1118.0513916015625, 1144.0552978515625, 1170.0592041015625, 1196.0631103515625, 1222.0670166015625, 1248.0709228515625, 1274.074951171875, 1300.078857421875, 1326.082763671875, 1352.086669921875, 1378.0906982421875, 1404.0946044921875, 1430.0985107421875, 1456.1024169921875, 1482.1064453125, 1508.1103515625, 1534.1142578125, 1560.1181640625, 1586.1221923828125, 1612.1260986328125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 9.0, 7.0, 6.0, 10.0, 19.0, 18.0, 20.0, 24.0, 23.0, 21.0, 36.0, 46.0, 31.0, 37.0, 37.0, 50.0, 50.0, 42.0, 41.0, 40.0, 53.0, 41.0, 38.0, 39.0, 31.0, 39.0, 24.0, 33.0, 19.0, 11.0, 18.0, 16.0, 14.0, 9.0, 7.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-126.49910736083984, -122.5952377319336, -118.69137573242188, -114.78750610351562, -110.88363647460938, -106.97976684570312, -103.07589721679688, -99.17203521728516, -95.2681655883789, -91.36429595947266, -87.46043395996094, -83.55656433105469, -79.65269470214844, -75.74882507324219, -71.84495544433594, -67.94109344482422, -64.03722381591797, -60.13335418701172, -56.229488372802734, -52.32562255859375, -48.4217529296875, -44.51788330078125, -40.614017486572266, -36.71015167236328, -32.80628204345703, -28.902414321899414, -24.998546600341797, -21.09467887878418, -17.190811157226562, -13.286943435668945, -9.383075714111328, -5.479207992553711, -1.5753326416015625, 2.3285350799560547, 6.232402801513672, 10.136270523071289, 14.040138244628906, 17.944005966186523, 21.84787368774414, 25.751741409301758, 29.655609130859375, 33.559478759765625, 37.46334457397461, 41.367210388183594, 45.271080017089844, 49.174949645996094, 53.07881546020508, 56.98268127441406, 60.88655090332031, 64.79042053222656, 68.69429016113281, 72.59815216064453, 76.50202178955078, 80.40589141845703, 84.30975341796875, 88.213623046875, 92.11749267578125, 96.0213623046875, 99.92523193359375, 103.82909393310547, 107.73296356201172, 111.63683319091797, 115.54069519042969, 119.44456481933594, 123.34843444824219]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 4.0, 12.0, 8.0, 9.0, 16.0, 14.0, 10.0, 13.0, 30.0, 18.0, 23.0, 24.0, 24.0, 43.0, 37.0, 34.0, 36.0, 32.0, 35.0, 48.0, 42.0, 41.0, 35.0, 35.0, 44.0, 44.0, 31.0, 27.0, 33.0, 21.0, 28.0, 29.0, 14.0, 13.0, 15.0, 17.0, 17.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.0625, -20.43017578125, -19.7978515625, -19.16552734375, -18.533203125, -17.90087890625, -17.2685546875, -16.63623046875, -16.00390625, -15.37158203125, -14.7392578125, -14.10693359375, -13.474609375, -12.84228515625, -12.2099609375, -11.57763671875, -10.9453125, -10.31298828125, -9.6806640625, -9.04833984375, -8.416015625, -7.78369140625, -7.1513671875, -6.51904296875, -5.88671875, -5.25439453125, -4.6220703125, -3.98974609375, -3.357421875, -2.72509765625, -2.0927734375, -1.46044921875, -0.828125, -0.19580078125, 0.4365234375, 1.06884765625, 1.701171875, 2.33349609375, 2.9658203125, 3.59814453125, 4.23046875, 4.86279296875, 5.4951171875, 6.12744140625, 6.759765625, 7.39208984375, 8.0244140625, 8.65673828125, 9.2890625, 9.92138671875, 10.5537109375, 11.18603515625, 11.818359375, 12.45068359375, 13.0830078125, 13.71533203125, 14.34765625, 14.97998046875, 15.6123046875, 16.24462890625, 16.876953125, 17.50927734375, 18.1416015625, 18.77392578125, 19.40625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 12.0, 10.0, 12.0, 16.0, 24.0, 17.0, 40.0, 35.0, 55.0, 64.0, 97.0, 103.0, 141.0, 161.0, 250.0, 334.0, 495.0, 823.0, 1724.0, 3693.0, 11193.0, 114964.0, 3577199.0, 456246.0, 16448.0, 4950.0, 2054.0, 1079.0, 569.0, 378.0, 269.0, 181.0, 138.0, 106.0, 100.0, 57.0, 48.0, 39.0, 36.0, 22.0, 19.0, 24.0, 16.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-97.1875, -94.2978515625, -91.408203125, -88.5185546875, -85.62890625, -82.7392578125, -79.849609375, -76.9599609375, -74.0703125, -71.1806640625, -68.291015625, -65.4013671875, -62.51171875, -59.6220703125, -56.732421875, -53.8427734375, -50.953125, -48.0634765625, -45.173828125, -42.2841796875, -39.39453125, -36.5048828125, -33.615234375, -30.7255859375, -27.8359375, -24.9462890625, -22.056640625, -19.1669921875, -16.27734375, -13.3876953125, -10.498046875, -7.6083984375, -4.71875, -1.8291015625, 1.060546875, 3.9501953125, 6.83984375, 9.7294921875, 12.619140625, 15.5087890625, 18.3984375, 21.2880859375, 24.177734375, 27.0673828125, 29.95703125, 32.8466796875, 35.736328125, 38.6259765625, 41.515625, 44.4052734375, 47.294921875, 50.1845703125, 53.07421875, 55.9638671875, 58.853515625, 61.7431640625, 64.6328125, 67.5224609375, 70.412109375, 73.3017578125, 76.19140625, 79.0810546875, 81.970703125, 84.8603515625, 87.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 11.0, 15.0, 25.0, 32.0, 78.0, 125.0, 262.0, 575.0, 1123.0, 935.0, 415.0, 205.0, 103.0, 61.0, 26.0, 19.0, 13.0, 6.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90625, -52.86279296875, -50.8193359375, -48.77587890625, -46.732421875, -44.68896484375, -42.6455078125, -40.60205078125, -38.55859375, -36.51513671875, -34.4716796875, -32.42822265625, -30.384765625, -28.34130859375, -26.2978515625, -24.25439453125, -22.2109375, -20.16748046875, -18.1240234375, -16.08056640625, -14.037109375, -11.99365234375, -9.9501953125, -7.90673828125, -5.86328125, -3.81982421875, -1.7763671875, 0.26708984375, 2.310546875, 4.35400390625, 6.3974609375, 8.44091796875, 10.484375, 12.52783203125, 14.5712890625, 16.61474609375, 18.658203125, 20.70166015625, 22.7451171875, 24.78857421875, 26.83203125, 28.87548828125, 30.9189453125, 32.96240234375, 35.005859375, 37.04931640625, 39.0927734375, 41.13623046875, 43.1796875, 45.22314453125, 47.2666015625, 49.31005859375, 51.353515625, 53.39697265625, 55.4404296875, 57.48388671875, 59.52734375, 61.57080078125, 63.6142578125, 65.65771484375, 67.701171875, 69.74462890625, 71.7880859375, 73.83154296875, 75.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 4.0, 5.0, 9.0, 15.0, 25.0, 19.0, 30.0, 33.0, 45.0, 71.0, 104.0, 165.0, 243.0, 440.0, 739.0, 1478.0, 3031.0, 6945.0, 21230.0, 97904.0, 1654900.0, 2252119.0, 116316.0, 23815.0, 7683.0, 3298.0, 1563.0, 797.0, 437.0, 242.0, 162.0, 116.0, 76.0, 55.0, 36.0, 25.0, 19.0, 26.0, 9.0, 17.0, 8.0, 4.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.40625, -43.89501953125, -42.3837890625, -40.87255859375, -39.361328125, -37.85009765625, -36.3388671875, -34.82763671875, -33.31640625, -31.80517578125, -30.2939453125, -28.78271484375, -27.271484375, -25.76025390625, -24.2490234375, -22.73779296875, -21.2265625, -19.71533203125, -18.2041015625, -16.69287109375, -15.181640625, -13.67041015625, -12.1591796875, -10.64794921875, -9.13671875, -7.62548828125, -6.1142578125, -4.60302734375, -3.091796875, -1.58056640625, -0.0693359375, 1.44189453125, 2.953125, 4.46435546875, 5.9755859375, 7.48681640625, 8.998046875, 10.50927734375, 12.0205078125, 13.53173828125, 15.04296875, 16.55419921875, 18.0654296875, 19.57666015625, 21.087890625, 22.59912109375, 24.1103515625, 25.62158203125, 27.1328125, 28.64404296875, 30.1552734375, 31.66650390625, 33.177734375, 34.68896484375, 36.2001953125, 37.71142578125, 39.22265625, 40.73388671875, 42.2451171875, 43.75634765625, 45.267578125, 46.77880859375, 48.2900390625, 49.80126953125, 51.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 11.0, 12.0, 25.0, 18.0, 35.0, 48.0, 43.0, 64.0, 85.0, 107.0, 106.0, 104.0, 73.0, 60.0, 49.0, 31.0, 23.0, 16.0, 17.0, 11.0, 17.0, 14.0, 7.0, 5.0, 4.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-268.54449462890625, -261.75665283203125, -254.9688262939453, -248.1809844970703, -241.3931427001953, -234.60531616210938, -227.81747436523438, -221.02963256835938, -214.24180603027344, -207.45396423339844, -200.6661376953125, -193.8782958984375, -187.0904541015625, -180.30262756347656, -173.51478576660156, -166.72695922851562, -159.93911743164062, -153.15127563476562, -146.3634490966797, -139.5756072998047, -132.7877655029297, -125.99993896484375, -119.21209716796875, -112.42426300048828, -105.63641357421875, -98.84857940673828, -92.06073760986328, -85.27290344238281, -78.48506927490234, -71.69723510742188, -64.90939331054688, -58.121559143066406, -51.33372497558594, -44.5458869934082, -37.758052825927734, -30.97021484375, -24.1823787689209, -17.394542694091797, -10.606704711914062, -3.8188705444335938, 2.9689674377441406, 9.756803512573242, 16.544639587402344, 23.332477569580078, 30.12031364440918, 36.90814971923828, 43.695987701416016, 50.483821868896484, 57.27165985107422, 64.05949401855469, 70.84733581542969, 77.63516998291016, 84.42300415039062, 91.21084594726562, 97.9986801147461, 104.78651428222656, 111.57435607910156, 118.36219024658203, 125.15003204345703, 131.9378662109375, 138.7257080078125, 145.51353454589844, 152.30137634277344, 159.08920288085938, 165.87704467773438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 15.0, 15.0, 13.0, 19.0, 26.0, 27.0, 25.0, 19.0, 38.0, 38.0, 34.0, 30.0, 41.0, 54.0, 43.0, 42.0, 40.0, 45.0, 39.0, 46.0, 28.0, 30.0, 30.0, 36.0, 20.0, 22.0, 22.0, 30.0, 19.0, 19.0, 8.0, 16.0, 11.0, 7.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-141.1405029296875, -136.6005859375, -132.06068420410156, -127.52076721191406, -122.9808578491211, -118.44094848632812, -113.90103149414062, -109.36112213134766, -104.82121276855469, -100.28130340576172, -95.74139404296875, -91.20147705078125, -86.66156768798828, -82.12165832519531, -77.58174133300781, -73.04183197021484, -68.50192260742188, -63.962013244628906, -59.42210006713867, -54.88218688964844, -50.34227752685547, -45.8023681640625, -41.262454986572266, -36.72254180908203, -32.18263244628906, -27.64272117614746, -23.10280990600586, -18.562898635864258, -14.022987365722656, -9.483076095581055, -4.943164825439453, -0.40325355529785156, 4.1366424560546875, 8.676553726196289, 13.21646499633789, 17.756376266479492, 22.296287536621094, 26.836198806762695, 31.376110076904297, 35.91602325439453, 40.4559326171875, 44.99584197998047, 49.5357551574707, 54.07566833496094, 58.615577697753906, 63.155487060546875, 67.69540405273438, 72.23531341552734, 76.77522277832031, 81.31513214111328, 85.85504150390625, 90.39495849609375, 94.93486785888672, 99.47477722167969, 104.01469421386719, 108.55460357666016, 113.09451293945312, 117.6344223022461, 122.17433166503906, 126.71424865722656, 131.254150390625, 135.7940673828125, 140.333984375, 144.87388610839844, 149.41380310058594]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 5.0, 13.0, 10.0, 13.0, 12.0, 20.0, 23.0, 24.0, 32.0, 37.0, 37.0, 33.0, 42.0, 30.0, 54.0, 52.0, 54.0, 42.0, 41.0, 40.0, 38.0, 40.0, 40.0, 36.0, 23.0, 33.0, 18.0, 18.0, 34.0, 17.0, 16.0, 15.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.625, -239.181640625, -230.73828125, -222.294921875, -213.8515625, -205.408203125, -196.96484375, -188.521484375, -180.078125, -171.634765625, -163.19140625, -154.748046875, -146.3046875, -137.861328125, -129.41796875, -120.974609375, -112.53125, -104.087890625, -95.64453125, -87.201171875, -78.7578125, -70.314453125, -61.87109375, -53.427734375, -44.984375, -36.541015625, -28.09765625, -19.654296875, -11.2109375, -2.767578125, 5.67578125, 14.119140625, 22.5625, 31.005859375, 39.44921875, 47.892578125, 56.3359375, 64.779296875, 73.22265625, 81.666015625, 90.109375, 98.552734375, 106.99609375, 115.439453125, 123.8828125, 132.326171875, 140.76953125, 149.212890625, 157.65625, 166.099609375, 174.54296875, 182.986328125, 191.4296875, 199.873046875, 208.31640625, 216.759765625, 225.203125, 233.646484375, 242.08984375, 250.533203125, 258.9765625, 267.419921875, 275.86328125, 284.306640625, 292.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 15.0, 23.0, 51.0, 59.0, 84.0, 124.0, 183.0, 281.0, 445.0, 686.0, 1087.0, 1733.0, 2853.0, 4784.0, 7930.0, 13975.0, 25065.0, 45502.0, 87766.0, 178086.0, 288194.0, 187297.0, 92280.0, 47557.0, 26163.0, 14778.0, 8576.0, 4895.0, 2984.0, 1813.0, 1174.0, 730.0, 469.0, 301.0, 213.0, 134.0, 74.0, 58.0, 43.0, 27.0, 19.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.657470703125, -26.72119140625, -25.784912109375, -24.8486328125, -23.912353515625, -22.97607421875, -22.039794921875, -21.103515625, -20.167236328125, -19.23095703125, -18.294677734375, -17.3583984375, -16.422119140625, -15.48583984375, -14.549560546875, -13.61328125, -12.677001953125, -11.74072265625, -10.804443359375, -9.8681640625, -8.931884765625, -7.99560546875, -7.059326171875, -6.123046875, -5.186767578125, -4.25048828125, -3.314208984375, -2.3779296875, -1.441650390625, -0.50537109375, 0.430908203125, 1.3671875, 2.303466796875, 3.23974609375, 4.176025390625, 5.1123046875, 6.048583984375, 6.98486328125, 7.921142578125, 8.857421875, 9.793701171875, 10.72998046875, 11.666259765625, 12.6025390625, 13.538818359375, 14.47509765625, 15.411376953125, 16.34765625, 17.283935546875, 18.22021484375, 19.156494140625, 20.0927734375, 21.029052734375, 21.96533203125, 22.901611328125, 23.837890625, 24.774169921875, 25.71044921875, 26.646728515625, 27.5830078125, 28.519287109375, 29.45556640625, 30.391845703125, 31.328125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 13.0, 18.0, 10.0, 21.0, 23.0, 9.0, 22.0, 29.0, 30.0, 32.0, 37.0, 32.0, 31.0, 36.0, 47.0, 32.0, 42.0, 1059.0, 49.0, 31.0, 29.0, 32.0, 36.0, 33.0, 25.0, 28.0, 22.0, 20.0, 22.0, 22.0, 16.0, 22.0, 8.0, 12.0, 12.0, 15.0, 5.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-154.0, -149.513671875, -145.02734375, -140.541015625, -136.0546875, -131.568359375, -127.08203125, -122.595703125, -118.109375, -113.623046875, -109.13671875, -104.650390625, -100.1640625, -95.677734375, -91.19140625, -86.705078125, -82.21875, -77.732421875, -73.24609375, -68.759765625, -64.2734375, -59.787109375, -55.30078125, -50.814453125, -46.328125, -41.841796875, -37.35546875, -32.869140625, -28.3828125, -23.896484375, -19.41015625, -14.923828125, -10.4375, -5.951171875, -1.46484375, 3.021484375, 7.5078125, 11.994140625, 16.48046875, 20.966796875, 25.453125, 29.939453125, 34.42578125, 38.912109375, 43.3984375, 47.884765625, 52.37109375, 56.857421875, 61.34375, 65.830078125, 70.31640625, 74.802734375, 79.2890625, 83.775390625, 88.26171875, 92.748046875, 97.234375, 101.720703125, 106.20703125, 110.693359375, 115.1796875, 119.666015625, 124.15234375, 128.638671875, 133.125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 17.0, 11.0, 28.0, 39.0, 47.0, 80.0, 109.0, 161.0, 234.0, 366.0, 535.0, 747.0, 1070.0, 1586.0, 2304.0, 3445.0, 5058.0, 7413.0, 10904.0, 16257.0, 24630.0, 38876.0, 63965.0, 107145.0, 175660.0, 1254578.0, 145243.0, 87211.0, 52538.0, 32505.0, 20920.0, 13973.0, 9324.0, 6291.0, 4463.0, 2944.0, 2027.0, 1401.0, 913.0, 667.0, 443.0, 306.0, 223.0, 150.0, 108.0, 73.0, 35.0, 32.0, 24.0, 18.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.875, -17.303955078125, -16.73291015625, -16.161865234375, -15.5908203125, -15.019775390625, -14.44873046875, -13.877685546875, -13.306640625, -12.735595703125, -12.16455078125, -11.593505859375, -11.0224609375, -10.451416015625, -9.88037109375, -9.309326171875, -8.73828125, -8.167236328125, -7.59619140625, -7.025146484375, -6.4541015625, -5.883056640625, -5.31201171875, -4.740966796875, -4.169921875, -3.598876953125, -3.02783203125, -2.456787109375, -1.8857421875, -1.314697265625, -0.74365234375, -0.172607421875, 0.3984375, 0.969482421875, 1.54052734375, 2.111572265625, 2.6826171875, 3.253662109375, 3.82470703125, 4.395751953125, 4.966796875, 5.537841796875, 6.10888671875, 6.679931640625, 7.2509765625, 7.822021484375, 8.39306640625, 8.964111328125, 9.53515625, 10.106201171875, 10.67724609375, 11.248291015625, 11.8193359375, 12.390380859375, 12.96142578125, 13.532470703125, 14.103515625, 14.674560546875, 15.24560546875, 15.816650390625, 16.3876953125, 16.958740234375, 17.52978515625, 18.100830078125, 18.671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 7.0, 20.0, 28.0, 32.0, 37.0, 57.0, 74.0, 123.0, 111.0, 105.0, 100.0, 75.0, 76.0, 37.0, 29.0, 21.0, 14.0, 9.0, 5.0, 10.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.22842025756835938, -0.21880340576171875, -0.20918655395507812, -0.1995697021484375, -0.18995285034179688, -0.18033599853515625, -0.17071914672851562, -0.161102294921875, -0.15148544311523438, -0.14186859130859375, -0.13225173950195312, -0.1226348876953125, -0.11301803588867188, -0.10340118408203125, -0.09378433227539062, -0.08416748046875, -0.07455062866210938, -0.06493377685546875, -0.055316925048828125, -0.0457000732421875, -0.036083221435546875, -0.02646636962890625, -0.016849517822265625, -0.007232666015625, 0.002384185791015625, 0.01200103759765625, 0.021617889404296875, 0.0312347412109375, 0.040851593017578125, 0.05046844482421875, 0.060085296630859375, 0.0697021484375, 0.07931900024414062, 0.08893585205078125, 0.09855270385742188, 0.1081695556640625, 0.11778640747070312, 0.12740325927734375, 0.13702011108398438, 0.146636962890625, 0.15625381469726562, 0.16587066650390625, 0.17548751831054688, 0.1851043701171875, 0.19472122192382812, 0.20433807373046875, 0.21395492553710938, 0.22357177734375, 0.23318862915039062, 0.24280548095703125, 0.2524223327636719, 0.2620391845703125, 0.2716560363769531, 0.28127288818359375, 0.2908897399902344, 0.300506591796875, 0.3101234436035156, 0.31974029541015625, 0.3293571472167969, 0.3389739990234375, 0.3485908508300781, 0.35820770263671875, 0.3678245544433594, 0.37744140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 9.0, 18.0, 24.0, 32.0, 48.0, 78.0, 123.0, 198.0, 404.0, 821.0, 1916.0, 5397.0, 21064.0, 172065.0, 762978.0, 65463.0, 11732.0, 3427.0, 1352.0, 650.0, 298.0, 163.0, 105.0, 48.0, 38.0, 26.0, 18.0, 12.0, 14.0, 5.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.923065185546875, -1.86859130859375, -1.814117431640625, -1.7596435546875, -1.705169677734375, -1.65069580078125, -1.596221923828125, -1.541748046875, -1.487274169921875, -1.43280029296875, -1.378326416015625, -1.3238525390625, -1.269378662109375, -1.21490478515625, -1.160430908203125, -1.10595703125, -1.051483154296875, -0.99700927734375, -0.942535400390625, -0.8880615234375, -0.833587646484375, -0.77911376953125, -0.724639892578125, -0.670166015625, -0.615692138671875, -0.56121826171875, -0.506744384765625, -0.4522705078125, -0.397796630859375, -0.34332275390625, -0.288848876953125, -0.234375, -0.179901123046875, -0.12542724609375, -0.070953369140625, -0.0164794921875, 0.037994384765625, 0.09246826171875, 0.146942138671875, 0.201416015625, 0.255889892578125, 0.31036376953125, 0.364837646484375, 0.4193115234375, 0.473785400390625, 0.52825927734375, 0.582733154296875, 0.63720703125, 0.691680908203125, 0.74615478515625, 0.800628662109375, 0.8551025390625, 0.909576416015625, 0.96405029296875, 1.018524169921875, 1.072998046875, 1.127471923828125, 1.18194580078125, 1.236419677734375, 1.2908935546875, 1.345367431640625, 1.39984130859375, 1.454315185546875, 1.5087890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 20.0, 14.0, 19.0, 29.0, 47.0, 58.0, 111.0, 193.0, 239.0, 122.0, 64.0, 24.0, 14.0, 9.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.7018107771873474, -0.6883791089057922, -0.6749473810195923, -0.6615157127380371, -0.6480840444564819, -0.634652316570282, -0.6212206482887268, -0.6077889800071716, -0.5943572521209717, -0.5809255838394165, -0.5674938559532166, -0.5540621876716614, -0.5406305193901062, -0.5271987915039062, -0.5137671232223511, -0.5003354549407959, -0.48690375685691833, -0.47347205877304077, -0.4600403904914856, -0.44660869240760803, -0.43317699432373047, -0.4197453260421753, -0.40631362795829773, -0.39288192987442017, -0.379450261592865, -0.3660185635089874, -0.35258689522743225, -0.3391551971435547, -0.3257234990596771, -0.31229180097579956, -0.2988601326942444, -0.2854284346103668, -0.27199673652648926, -0.2585650384426117, -0.24513335525989532, -0.23170167207717896, -0.2182699739933014, -0.20483829081058502, -0.19140660762786865, -0.1779749095439911, -0.16454321146011353, -0.15111152827739716, -0.1376798301935196, -0.12424814701080322, -0.11081645637750626, -0.09738476574420929, -0.08395308256149292, -0.07052139192819595, -0.05708970129489899, -0.04365801066160202, -0.030226323753595352, -0.016794636845588684, -0.0033629462122917175, 0.010068744421005249, 0.02350042760372162, 0.036932118237018585, 0.05036380887031555, 0.06379549950361252, 0.07722719013690948, 0.09065887331962585, 0.10409056395292282, 0.11752225458621979, 0.13095393776893616, 0.14438563585281372, 0.1578173190355301]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 13.0, 5.0, 14.0, 20.0, 18.0, 19.0, 29.0, 23.0, 22.0, 26.0, 26.0, 35.0, 38.0, 37.0, 39.0, 41.0, 32.0, 36.0, 45.0, 41.0, 44.0, 44.0, 29.0, 37.0, 28.0, 22.0, 21.0, 31.0, 25.0, 27.0, 23.0, 13.0, 21.0, 16.0, 13.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.22242134809494019, -0.2160506397485733, -0.20967991650104523, -0.20330920815467834, -0.19693848490715027, -0.1905677765607834, -0.1841970682144165, -0.17782634496688843, -0.17145563662052155, -0.16508492827415466, -0.1587142050266266, -0.1523434966802597, -0.14597278833389282, -0.13960206508636475, -0.13323135673999786, -0.12686064839363098, -0.1204899251461029, -0.11411920934915543, -0.10774849355220795, -0.10137778520584106, -0.09500706940889359, -0.0886363536119461, -0.08226564526557922, -0.07589492946863174, -0.06952421367168427, -0.06315349787473679, -0.056782785803079605, -0.050412073731422424, -0.044041357934474945, -0.037670642137527466, -0.031299930065870285, -0.024929217994213104, -0.018558502197265625, -0.012187788262963295, -0.005817074328660965, 0.000553639605641365, 0.006924353539943695, 0.013295069336891174, 0.019665781408548355, 0.026036493480205536, 0.032407209277153015, 0.038777925074100494, 0.045148637145757675, 0.051519349217414856, 0.057890065014362335, 0.06426078081130981, 0.0706314891576767, 0.07700220495462418, 0.08337292075157166, 0.08974363654851913, 0.09611435234546661, 0.1024850606918335, 0.10885577648878098, 0.11522649228572845, 0.12159720063209534, 0.1279679238796234, 0.1343386322259903, 0.14070934057235718, 0.14708006381988525, 0.15345077216625214, 0.15982148051261902, 0.1661922037601471, 0.17256291210651398, 0.17893362045288086, 0.18530434370040894]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 5.0, 12.0, 11.0, 12.0, 10.0, 23.0, 22.0, 25.0, 35.0, 35.0, 37.0, 31.0, 45.0, 28.0, 53.0, 54.0, 54.0, 45.0, 38.0, 39.0, 38.0, 42.0, 41.0, 32.0, 26.0, 32.0, 17.0, 19.0, 33.0, 17.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 1.0, 5.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.5, -239.046875, -230.59375, -222.140625, -213.6875, -205.234375, -196.78125, -188.328125, -179.875, -171.421875, -162.96875, -154.515625, -146.0625, -137.609375, -129.15625, -120.703125, -112.25, -103.796875, -95.34375, -86.890625, -78.4375, -69.984375, -61.53125, -53.078125, -44.625, -36.171875, -27.71875, -19.265625, -10.8125, -2.359375, 6.09375, 14.546875, 23.0, 31.453125, 39.90625, 48.359375, 56.8125, 65.265625, 73.71875, 82.171875, 90.625, 99.078125, 107.53125, 115.984375, 124.4375, 132.890625, 141.34375, 149.796875, 158.25, 166.703125, 175.15625, 183.609375, 192.0625, 200.515625, 208.96875, 217.421875, 225.875, 234.328125, 242.78125, 251.234375, 259.6875, 268.140625, 276.59375, 285.046875, 293.5]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 3.0, 12.0, 7.0, 8.0, 13.0, 25.0, 30.0, 43.0, 62.0, 90.0, 142.0, 196.0, 279.0, 429.0, 716.0, 1257.0, 2302.0, 4826.0, 11291.0, 32554.0, 121171.0, 501639.0, 274612.0, 62863.0, 19030.0, 7367.0, 3347.0, 1607.0, 941.0, 563.0, 355.0, 221.0, 161.0, 114.0, 64.0, 51.0, 48.0, 34.0, 24.0, 19.0, 12.0, 7.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.46875, -37.17626953125, -35.8837890625, -34.59130859375, -33.298828125, -32.00634765625, -30.7138671875, -29.42138671875, -28.12890625, -26.83642578125, -25.5439453125, -24.25146484375, -22.958984375, -21.66650390625, -20.3740234375, -19.08154296875, -17.7890625, -16.49658203125, -15.2041015625, -13.91162109375, -12.619140625, -11.32666015625, -10.0341796875, -8.74169921875, -7.44921875, -6.15673828125, -4.8642578125, -3.57177734375, -2.279296875, -0.98681640625, 0.3056640625, 1.59814453125, 2.890625, 4.18310546875, 5.4755859375, 6.76806640625, 8.060546875, 9.35302734375, 10.6455078125, 11.93798828125, 13.23046875, 14.52294921875, 15.8154296875, 17.10791015625, 18.400390625, 19.69287109375, 20.9853515625, 22.27783203125, 23.5703125, 24.86279296875, 26.1552734375, 27.44775390625, 28.740234375, 30.03271484375, 31.3251953125, 32.61767578125, 33.91015625, 35.20263671875, 36.4951171875, 37.78759765625, 39.080078125, 40.37255859375, 41.6650390625, 42.95751953125, 44.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 9.0, 15.0, 8.0, 20.0, 18.0, 18.0, 27.0, 34.0, 45.0, 65.0, 61.0, 70.0, 63.0, 2109.0, 78.0, 48.0, 61.0, 58.0, 50.0, 28.0, 33.0, 31.0, 20.0, 18.0, 6.0, 13.0, 1.0, 3.0, 8.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-625.0, -607.48828125, -589.9765625, -572.46484375, -554.953125, -537.44140625, -519.9296875, -502.41796875, -484.90625, -467.39453125, -449.8828125, -432.37109375, -414.859375, -397.34765625, -379.8359375, -362.32421875, -344.8125, -327.30078125, -309.7890625, -292.27734375, -274.765625, -257.25390625, -239.7421875, -222.23046875, -204.71875, -187.20703125, -169.6953125, -152.18359375, -134.671875, -117.16015625, -99.6484375, -82.13671875, -64.625, -47.11328125, -29.6015625, -12.08984375, 5.421875, 22.93359375, 40.4453125, 57.95703125, 75.46875, 92.98046875, 110.4921875, 128.00390625, 145.515625, 163.02734375, 180.5390625, 198.05078125, 215.5625, 233.07421875, 250.5859375, 268.09765625, 285.609375, 303.12109375, 320.6328125, 338.14453125, 355.65625, 373.16796875, 390.6796875, 408.19140625, 425.703125, 443.21484375, 460.7265625, 478.23828125, 495.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 14.0, 15.0, 17.0, 16.0, 34.0, 45.0, 53.0, 87.0, 108.0, 194.0, 314.0, 628.0, 1671.0, 6335.0, 50942.0, 2942457.0, 127857.0, 10656.0, 2346.0, 805.0, 383.0, 220.0, 157.0, 85.0, 62.0, 45.0, 29.0, 37.0, 15.0, 17.0, 7.0, 13.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-110.75, -107.13671875, -103.5234375, -99.91015625, -96.296875, -92.68359375, -89.0703125, -85.45703125, -81.84375, -78.23046875, -74.6171875, -71.00390625, -67.390625, -63.77734375, -60.1640625, -56.55078125, -52.9375, -49.32421875, -45.7109375, -42.09765625, -38.484375, -34.87109375, -31.2578125, -27.64453125, -24.03125, -20.41796875, -16.8046875, -13.19140625, -9.578125, -5.96484375, -2.3515625, 1.26171875, 4.875, 8.48828125, 12.1015625, 15.71484375, 19.328125, 22.94140625, 26.5546875, 30.16796875, 33.78125, 37.39453125, 41.0078125, 44.62109375, 48.234375, 51.84765625, 55.4609375, 59.07421875, 62.6875, 66.30078125, 69.9140625, 73.52734375, 77.140625, 80.75390625, 84.3671875, 87.98046875, 91.59375, 95.20703125, 98.8203125, 102.43359375, 106.046875, 109.66015625, 113.2734375, 116.88671875, 120.5]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 2.0, 7.0, 8.0, 19.0, 32.0, 44.0, 60.0, 135.0, 173.0, 174.0, 136.0, 68.0, 53.0, 25.0, 16.0, 10.0, 14.0, 11.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-949.3392944335938, -928.2639770507812, -907.1886596679688, -886.1133422851562, -865.0380249023438, -843.9627075195312, -822.8873901367188, -801.8120727539062, -780.7367553710938, -759.6614379882812, -738.5861206054688, -717.5108032226562, -696.4354858398438, -675.3601684570312, -654.2848510742188, -633.2095336914062, -612.13427734375, -591.0589599609375, -569.983642578125, -548.9083251953125, -527.8330078125, -506.7576904296875, -485.682373046875, -464.6070556640625, -443.53173828125, -422.4564208984375, -401.381103515625, -380.3057861328125, -359.23046875, -338.1551513671875, -317.079833984375, -296.0045166015625, -274.92919921875, -253.8538818359375, -232.778564453125, -211.7032470703125, -190.6279296875, -169.5526123046875, -148.47731018066406, -127.40199279785156, -106.32667541503906, -85.25135803222656, -64.17604064941406, -43.100730895996094, -22.025413513183594, -0.9500961303710938, 20.125213623046875, 41.200531005859375, 62.275848388671875, 83.35116577148438, 104.42648315429688, 125.50179290771484, 146.57711791992188, 167.65243530273438, 188.7277374267578, 209.8030548095703, 230.8783721923828, 251.9536895751953, 273.02899169921875, 294.10430908203125, 315.17962646484375, 336.25494384765625, 357.33026123046875, 378.40557861328125, 399.48089599609375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 10.0, 10.0, 15.0, 11.0, 18.0, 22.0, 26.0, 21.0, 30.0, 31.0, 29.0, 39.0, 35.0, 40.0, 54.0, 48.0, 54.0, 63.0, 52.0, 50.0, 37.0, 39.0, 34.0, 41.0, 27.0, 22.0, 16.0, 18.0, 15.0, 14.0, 13.0, 9.0, 5.0, 5.0, 7.0, 2.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-594.61328125, -575.13037109375, -555.6474609375, -536.1644897460938, -516.6815795898438, -497.19866943359375, -477.71575927734375, -458.23284912109375, -438.7499084472656, -419.2669982910156, -399.7840576171875, -380.3011474609375, -360.8182373046875, -341.3352966308594, -321.8523864746094, -302.36944580078125, -282.88653564453125, -263.40362548828125, -243.92068481445312, -224.43777465820312, -204.95484924316406, -185.471923828125, -165.989013671875, -146.50608825683594, -127.02316284179688, -107.54023742675781, -88.05731964111328, -68.57440185546875, -49.09147644042969, -29.608551025390625, -10.125633239746094, 9.357284545898438, 28.8402099609375, 48.3231315612793, 67.8060531616211, 87.28897094726562, 106.77189636230469, 126.25482177734375, 145.73773193359375, 165.2206573486328, 184.70358276367188, 204.18650817871094, 223.66943359375, 243.15234375, 262.63525390625, 282.1181945800781, 301.6011047363281, 321.08404541015625, 340.56695556640625, 360.04986572265625, 379.5328063964844, 399.0157165527344, 418.4986572265625, 437.9815673828125, 457.4644775390625, 476.9473876953125, 496.4303283691406, 515.9132690429688, 535.3961791992188, 554.8790893554688, 574.3619995117188, 593.844970703125, 613.327880859375, 632.810791015625, 652.293701171875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 5.0, 5.0, 8.0, 12.0, 10.0, 17.0, 24.0, 27.0, 39.0, 31.0, 54.0, 58.0, 95.0, 90.0, 124.0, 162.0, 221.0, 323.0, 448.0, 823.0, 1597.0, 1041593.0, 886.0, 559.0, 323.0, 238.0, 167.0, 116.0, 99.0, 82.0, 58.0, 53.0, 42.0, 26.0, 27.0, 18.0, 20.0, 18.0, 14.0, 11.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-153.81883239746094, -148.34539794921875, -142.87196350097656, -137.39852905273438, -131.92507934570312, -126.45165252685547, -120.97821044921875, -115.50477600097656, -110.03134155273438, -104.55790710449219, -99.08447265625, -93.61103057861328, -88.1375961303711, -82.6641616821289, -77.19071960449219, -71.71728515625, -66.24385070800781, -60.770416259765625, -55.29697799682617, -49.82353973388672, -44.35010528564453, -38.876670837402344, -33.40323257446289, -27.929794311523438, -22.45635986328125, -16.98292350769043, -11.50948715209961, -6.036050796508789, -0.5626144409179688, 4.910821914672852, 10.384258270263672, 15.857696533203125, 21.331146240234375, 26.804582595825195, 32.278018951416016, 37.75145721435547, 43.224891662597656, 48.698326110839844, 54.1717643737793, 59.64520263671875, 65.11863708496094, 70.59207153320312, 76.06550598144531, 81.53894805908203, 87.01238250732422, 92.4858169555664, 97.95925903320312, 103.43269348144531, 108.9061279296875, 114.37956237792969, 119.85299682617188, 125.3264389038086, 130.79986572265625, 136.2733154296875, 141.7467498779297, 147.22018432617188, 152.69361877441406, 158.16705322265625, 163.64048767089844, 169.11392211914062, 174.58737182617188, 180.06080627441406, 185.53424072265625, 191.00767517089844, 196.48110961914062]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 11.0, 9.0, 12.0, 4.0, 9.0, 18.0, 24.0, 76.0, 594.0, 51461156.0, 1060.0, 73.0, 36.0, 17.0, 11.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3195.414794921875, -3100.2216796875, -3005.0283203125, -2909.835205078125, -2814.64208984375, -2719.44873046875, -2624.255615234375, -2529.0625, -2433.869140625, -2338.676025390625, -2243.482666015625, -2148.28955078125, -2053.09619140625, -1957.903076171875, -1862.7099609375, -1767.5167236328125, -1672.323486328125, -1577.1302490234375, -1481.93701171875, -1386.743896484375, -1291.5506591796875, -1196.357421875, -1101.164306640625, -1005.9710693359375, -910.77783203125, -815.5845947265625, -720.3914184570312, -625.1982421875, -530.0050048828125, -434.8117980957031, -339.61859130859375, -244.4254150390625, -149.232177734375, -54.038970947265625, 41.15423583984375, 136.34744262695312, 231.5406494140625, 326.7338562011719, 421.92706298828125, 517.1202392578125, 612.3134765625, 707.5067138671875, 802.6998901367188, 897.89306640625, 993.0863037109375, 1088.279541015625, 1183.47265625, 1278.6658935546875, 1373.859130859375, 1469.0523681640625, 1564.24560546875, 1659.438720703125, 1754.6319580078125, 1849.8251953125, 1945.018310546875, 2040.2115478515625, 2135.40478515625, 2230.597900390625, 2325.791259765625, 2420.984375, 2516.177734375, 2611.370849609375, 2706.56396484375, 2801.75732421875, 2896.950439453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 14.0, 14.0, 22.0, 40.0, 67.0, 92.0, 125.0, 211.0, 290.0, 449.0, 676.0, 988.0, 1488.0, 2251.0, 3391.0, 5151.0, 7745.0, 11692.0, 17469.0, 27471.0, 42158.0, 67282.0, 110593.0, 187931.0, 326438.0, 676907.0, 3685608.0, 465228.0, 257162.0, 149263.0, 88932.0, 54796.0, 34442.0, 22238.0, 14718.0, 9613.0, 6165.0, 4151.0, 2761.0, 1768.0, 1209.0, 846.0, 580.0, 366.0, 234.0, 167.0, 88.0, 47.0, 40.0, 22.0, 13.0, 6.0, 7.0, 1.0, 2.0], "bins": [-7.796875, -7.57598876953125, -7.3551025390625, -7.13421630859375, -6.913330078125, -6.69244384765625, -6.4715576171875, -6.25067138671875, -6.02978515625, -5.80889892578125, -5.5880126953125, -5.36712646484375, -5.146240234375, -4.92535400390625, -4.7044677734375, -4.48358154296875, -4.2626953125, -4.04180908203125, -3.8209228515625, -3.60003662109375, -3.379150390625, -3.15826416015625, -2.9373779296875, -2.71649169921875, -2.49560546875, -2.27471923828125, -2.0538330078125, -1.83294677734375, -1.612060546875, -1.39117431640625, -1.1702880859375, -0.94940185546875, -0.728515625, -0.50762939453125, -0.2867431640625, -0.06585693359375, 0.155029296875, 0.37591552734375, 0.5968017578125, 0.81768798828125, 1.03857421875, 1.25946044921875, 1.4803466796875, 1.70123291015625, 1.922119140625, 2.14300537109375, 2.3638916015625, 2.58477783203125, 2.8056640625, 3.02655029296875, 3.2474365234375, 3.46832275390625, 3.689208984375, 3.91009521484375, 4.1309814453125, 4.35186767578125, 4.57275390625, 4.79364013671875, 5.0145263671875, 5.23541259765625, 5.456298828125, 5.67718505859375, 5.8980712890625, 6.11895751953125, 6.33984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 11.0, 7.0, 14.0, 7.0, 16.0, 12.0, 18.0, 18.0, 30.0, 34.0, 25.0, 26.0, 35.0, 35.0, 31.0, 30.0, 43.0, 68.0, 840.0, 220.0, 37.0, 37.0, 46.0, 42.0, 27.0, 40.0, 36.0, 39.0, 29.0, 23.0, 24.0, 18.0, 11.0, 15.0, 17.0, 7.0, 7.0, 9.0, 6.0, 5.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.6728515625, -60.408203125, -58.1435546875, -55.87890625, -53.6142578125, -51.349609375, -49.0849609375, -46.8203125, -44.5556640625, -42.291015625, -40.0263671875, -37.76171875, -35.4970703125, -33.232421875, -30.9677734375, -28.703125, -26.4384765625, -24.173828125, -21.9091796875, -19.64453125, -17.3798828125, -15.115234375, -12.8505859375, -10.5859375, -8.3212890625, -6.056640625, -3.7919921875, -1.52734375, 0.7373046875, 3.001953125, 5.2666015625, 7.53125, 9.7958984375, 12.060546875, 14.3251953125, 16.58984375, 18.8544921875, 21.119140625, 23.3837890625, 25.6484375, 27.9130859375, 30.177734375, 32.4423828125, 34.70703125, 36.9716796875, 39.236328125, 41.5009765625, 43.765625, 46.0302734375, 48.294921875, 50.5595703125, 52.82421875, 55.0888671875, 57.353515625, 59.6181640625, 61.8828125, 64.1474609375, 66.412109375, 68.6767578125, 70.94140625, 73.2060546875, 75.470703125, 77.7353515625, 80.0]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 14.0, 15.0, 44.0, 49.0, 81.0, 115.0, 193.0, 263.0, 364.0, 604.0, 892.0, 1285.0, 1898.0, 2983.0, 4359.0, 6566.0, 10338.0, 15779.0, 25125.0, 39954.0, 65118.0, 107534.0, 185634.0, 340541.0, 775673.0, 3671455.0, 446311.0, 236934.0, 136069.0, 80606.0, 49004.0, 30258.0, 19381.0, 12369.0, 7990.0, 5183.0, 3377.0, 2288.0, 1606.0, 1035.0, 676.0, 477.0, 336.0, 223.0, 138.0, 100.0, 60.0, 47.0, 23.0, 24.0, 9.0, 3.0, 4.0, 5.0, 6.0, 3.0, 2.0], "bins": [-7.48046875, -7.24822998046875, -7.0159912109375, -6.78375244140625, -6.551513671875, -6.31927490234375, -6.0870361328125, -5.85479736328125, -5.62255859375, -5.39031982421875, -5.1580810546875, -4.92584228515625, -4.693603515625, -4.46136474609375, -4.2291259765625, -3.99688720703125, -3.7646484375, -3.53240966796875, -3.3001708984375, -3.06793212890625, -2.835693359375, -2.60345458984375, -2.3712158203125, -2.13897705078125, -1.90673828125, -1.67449951171875, -1.4422607421875, -1.21002197265625, -0.977783203125, -0.74554443359375, -0.5133056640625, -0.28106689453125, -0.048828125, 0.18341064453125, 0.4156494140625, 0.64788818359375, 0.880126953125, 1.11236572265625, 1.3446044921875, 1.57684326171875, 1.80908203125, 2.04132080078125, 2.2735595703125, 2.50579833984375, 2.738037109375, 2.97027587890625, 3.2025146484375, 3.43475341796875, 3.6669921875, 3.89923095703125, 4.1314697265625, 4.36370849609375, 4.595947265625, 4.82818603515625, 5.0604248046875, 5.29266357421875, 5.52490234375, 5.75714111328125, 5.9893798828125, 6.22161865234375, 6.453857421875, 6.68609619140625, 6.9183349609375, 7.15057373046875, 7.3828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 6.0, 9.0, 11.0, 10.0, 21.0, 19.0, 24.0, 19.0, 33.0, 41.0, 37.0, 29.0, 35.0, 41.0, 35.0, 34.0, 58.0, 161.0, 926.0, 66.0, 47.0, 35.0, 38.0, 35.0, 25.0, 29.0, 19.0, 27.0, 24.0, 18.0, 19.0, 13.0, 14.0, 7.0, 10.0, 8.0, 6.0, 6.0, 7.0, 1.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-83.3125, -80.8046875, -78.296875, -75.7890625, -73.28125, -70.7734375, -68.265625, -65.7578125, -63.25, -60.7421875, -58.234375, -55.7265625, -53.21875, -50.7109375, -48.203125, -45.6953125, -43.1875, -40.6796875, -38.171875, -35.6640625, -33.15625, -30.6484375, -28.140625, -25.6328125, -23.125, -20.6171875, -18.109375, -15.6015625, -13.09375, -10.5859375, -8.078125, -5.5703125, -3.0625, -0.5546875, 1.953125, 4.4609375, 6.96875, 9.4765625, 11.984375, 14.4921875, 17.0, 19.5078125, 22.015625, 24.5234375, 27.03125, 29.5390625, 32.046875, 34.5546875, 37.0625, 39.5703125, 42.078125, 44.5859375, 47.09375, 49.6015625, 52.109375, 54.6171875, 57.125, 59.6328125, 62.140625, 64.6484375, 67.15625, 69.6640625, 72.171875, 74.6796875, 77.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 11.0, 22.0, 22.0, 45.0, 59.0, 145.0, 204.0, 307.0, 504.0, 788.0, 1290.0, 1975.0, 3042.0, 4678.0, 7837.0, 12967.0, 21977.0, 40892.0, 86401.0, 5284123.0, 645993.0, 83728.0, 39787.0, 21402.0, 12551.0, 7712.0, 4761.0, 3032.0, 1921.0, 1279.0, 748.0, 467.0, 298.0, 157.0, 106.0, 84.0, 40.0, 24.0, 18.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.087646484375, -21.26904296875, -20.450439453125, -19.6318359375, -18.813232421875, -17.99462890625, -17.176025390625, -16.357421875, -15.538818359375, -14.72021484375, -13.901611328125, -13.0830078125, -12.264404296875, -11.44580078125, -10.627197265625, -9.80859375, -8.989990234375, -8.17138671875, -7.352783203125, -6.5341796875, -5.715576171875, -4.89697265625, -4.078369140625, -3.259765625, -2.441162109375, -1.62255859375, -0.803955078125, 0.0146484375, 0.833251953125, 1.65185546875, 2.470458984375, 3.2890625, 4.107666015625, 4.92626953125, 5.744873046875, 6.5634765625, 7.382080078125, 8.20068359375, 9.019287109375, 9.837890625, 10.656494140625, 11.47509765625, 12.293701171875, 13.1123046875, 13.930908203125, 14.74951171875, 15.568115234375, 16.38671875, 17.205322265625, 18.02392578125, 18.842529296875, 19.6611328125, 20.479736328125, 21.29833984375, 22.116943359375, 22.935546875, 23.754150390625, 24.57275390625, 25.391357421875, 26.2099609375, 27.028564453125, 27.84716796875, 28.665771484375, 29.484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 5.0, 18.0, 11.0, 18.0, 16.0, 13.0, 25.0, 37.0, 23.0, 30.0, 36.0, 30.0, 34.0, 44.0, 46.0, 36.0, 141.0, 922.0, 81.0, 45.0, 44.0, 39.0, 32.0, 23.0, 31.0, 28.0, 22.0, 25.0, 19.0, 26.0, 16.0, 13.0, 16.0, 11.0, 13.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-93.8125, -91.072265625, -88.33203125, -85.591796875, -82.8515625, -80.111328125, -77.37109375, -74.630859375, -71.890625, -69.150390625, -66.41015625, -63.669921875, -60.9296875, -58.189453125, -55.44921875, -52.708984375, -49.96875, -47.228515625, -44.48828125, -41.748046875, -39.0078125, -36.267578125, -33.52734375, -30.787109375, -28.046875, -25.306640625, -22.56640625, -19.826171875, -17.0859375, -14.345703125, -11.60546875, -8.865234375, -6.125, -3.384765625, -0.64453125, 2.095703125, 4.8359375, 7.576171875, 10.31640625, 13.056640625, 15.796875, 18.537109375, 21.27734375, 24.017578125, 26.7578125, 29.498046875, 32.23828125, 34.978515625, 37.71875, 40.458984375, 43.19921875, 45.939453125, 48.6796875, 51.419921875, 54.16015625, 56.900390625, 59.640625, 62.380859375, 65.12109375, 67.861328125, 70.6015625, 73.341796875, 76.08203125, 78.822265625, 81.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 20.0, 25.0, 72.0, 228.0, 410.0, 132.0, 49.0, 27.0, 15.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.72393798828125, -269.84014892578125, -259.95635986328125, -250.0725555419922, -240.18875122070312, -230.30496215820312, -220.42117309570312, -210.53738403320312, -200.65357971191406, -190.76979064941406, -180.885986328125, -171.002197265625, -161.118408203125, -151.23460388183594, -141.35081481933594, -131.46701049804688, -121.58322143554688, -111.69942474365234, -101.81562805175781, -91.93183898925781, -82.04804229736328, -72.16424560546875, -62.280452728271484, -52.39665985107422, -42.51286315917969, -32.629066467285156, -22.74527359008789, -12.861478805541992, -2.9776840209960938, 6.9061126708984375, 16.789905548095703, 26.67369842529297, 36.5574951171875, 46.44129180908203, 56.3250846862793, 66.20887756347656, 76.0926742553711, 85.97647094726562, 95.86026000976562, 105.74405670166016, 115.62785339355469, 125.51165008544922, 135.39544677734375, 145.27923583984375, 155.16302490234375, 165.0468292236328, 174.9306182861328, 184.81442260742188, 194.69821166992188, 204.58200073242188, 214.46580505371094, 224.34959411621094, 234.2333984375, 244.1171875, 254.0009765625, 263.884765625, 273.7685546875, 283.65234375, 293.5361328125, 303.4199523925781, 313.3037414550781, 323.1875305175781, 333.0713195800781, 342.9551086425781, 352.83892822265625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 4.0, 10.0, 5.0, 21.0, 23.0, 31.0, 39.0, 66.0, 83.0, 111.0, 112.0, 106.0, 105.0, 78.0, 56.0, 46.0, 30.0, 20.0, 17.0, 13.0, 8.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-523.0494384765625, -510.5206604003906, -497.99188232421875, -485.4631042480469, -472.934326171875, -460.405517578125, -447.8767395019531, -435.34796142578125, -422.8191833496094, -410.2904052734375, -397.7616271972656, -385.23284912109375, -372.70404052734375, -360.1752624511719, -347.646484375, -335.1177062988281, -322.58892822265625, -310.0601501464844, -297.5313720703125, -285.0025939941406, -272.47381591796875, -259.94500732421875, -247.41622924804688, -234.887451171875, -222.35867309570312, -209.82989501953125, -197.30111694335938, -184.77232360839844, -172.24354553222656, -159.7147674560547, -147.18597412109375, -134.65719604492188, -122.12841796875, -109.59963989257812, -97.07085418701172, -84.54206848144531, -72.01329040527344, -59.4845085144043, -46.955726623535156, -34.42694091796875, -21.898162841796875, -9.369380950927734, 3.1594009399414062, 15.688182830810547, 28.216964721679688, 40.74574661254883, 53.27452850341797, 65.80331420898438, 78.33209228515625, 90.86087036132812, 103.38965606689453, 115.91844177246094, 128.4472198486328, 140.9759979248047, 153.50479125976562, 166.0335693359375, 178.56234741210938, 191.09112548828125, 203.61990356445312, 216.14869689941406, 228.67747497558594, 241.2062530517578, 253.73504638671875, 266.2638244628906, 278.7926025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 5.0, 5.0, 7.0, 12.0, 8.0, 12.0, 18.0, 31.0, 39.0, 51.0, 80.0, 112.0, 137.0, 194.0, 303.0, 434.0, 776.0, 1214.0, 2176.0, 4258.0, 9604.0, 30719.0, 4017755.0, 99846.0, 15112.0, 5448.0, 2613.0, 1328.0, 753.0, 446.0, 276.0, 178.0, 110.0, 59.0, 62.0, 26.0, 26.0, 18.0, 7.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.59375, -4.475189208984375, -4.35662841796875, -4.238067626953125, -4.1195068359375, -4.000946044921875, -3.88238525390625, -3.763824462890625, -3.645263671875, -3.526702880859375, -3.40814208984375, -3.289581298828125, -3.1710205078125, -3.052459716796875, -2.93389892578125, -2.815338134765625, -2.69677734375, -2.578216552734375, -2.45965576171875, -2.341094970703125, -2.2225341796875, -2.103973388671875, -1.98541259765625, -1.866851806640625, -1.748291015625, -1.629730224609375, -1.51116943359375, -1.392608642578125, -1.2740478515625, -1.155487060546875, -1.03692626953125, -0.918365478515625, -0.7998046875, -0.681243896484375, -0.56268310546875, -0.444122314453125, -0.3255615234375, -0.207000732421875, -0.08843994140625, 0.030120849609375, 0.148681640625, 0.267242431640625, 0.38580322265625, 0.504364013671875, 0.6229248046875, 0.741485595703125, 0.86004638671875, 0.978607177734375, 1.09716796875, 1.215728759765625, 1.33428955078125, 1.452850341796875, 1.5714111328125, 1.689971923828125, 1.80853271484375, 1.927093505859375, 2.045654296875, 2.164215087890625, 2.28277587890625, 2.401336669921875, 2.5198974609375, 2.638458251953125, 2.75701904296875, 2.875579833984375, 2.994140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 6.0, 7.0, 10.0, 8.0, 12.0, 18.0, 17.0, 759.0, 33.0, 14.0, 19.0, 11.0, 11.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.537322998046875, -1.49652099609375, -1.455718994140625, -1.4149169921875, -1.374114990234375, -1.33331298828125, -1.292510986328125, -1.251708984375, -1.210906982421875, -1.17010498046875, -1.129302978515625, -1.0885009765625, -1.047698974609375, -1.00689697265625, -0.966094970703125, -0.92529296875, -0.884490966796875, -0.84368896484375, -0.802886962890625, -0.7620849609375, -0.721282958984375, -0.68048095703125, -0.639678955078125, -0.598876953125, -0.558074951171875, -0.51727294921875, -0.476470947265625, -0.4356689453125, -0.394866943359375, -0.35406494140625, -0.313262939453125, -0.2724609375, -0.231658935546875, -0.19085693359375, -0.150054931640625, -0.1092529296875, -0.068450927734375, -0.02764892578125, 0.013153076171875, 0.053955078125, 0.094757080078125, 0.13555908203125, 0.176361083984375, 0.2171630859375, 0.257965087890625, 0.29876708984375, 0.339569091796875, 0.38037109375, 0.421173095703125, 0.46197509765625, 0.502777099609375, 0.5435791015625, 0.584381103515625, 0.62518310546875, 0.665985107421875, 0.706787109375, 0.747589111328125, 0.78839111328125, 0.829193115234375, 0.8699951171875, 0.910797119140625, 0.95159912109375, 0.992401123046875, 1.033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 8.0, 18.0, 20.0, 26.0, 40.0, 88.0, 168.0, 409.0, 1278.0, 5509.0, 32517.0, 1662916.0, 2442885.0, 38660.0, 6953.0, 1703.0, 515.0, 215.0, 139.0, 69.0, 30.0, 24.0, 22.0, 13.0, 14.0, 10.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.787506103515625, -3.64727783203125, -3.507049560546875, -3.3668212890625, -3.226593017578125, -3.08636474609375, -2.946136474609375, -2.805908203125, -2.665679931640625, -2.52545166015625, -2.385223388671875, -2.2449951171875, -2.104766845703125, -1.96453857421875, -1.824310302734375, -1.68408203125, -1.543853759765625, -1.40362548828125, -1.263397216796875, -1.1231689453125, -0.982940673828125, -0.84271240234375, -0.702484130859375, -0.562255859375, -0.422027587890625, -0.28179931640625, -0.141571044921875, -0.0013427734375, 0.138885498046875, 0.27911376953125, 0.419342041015625, 0.5595703125, 0.699798583984375, 0.84002685546875, 0.980255126953125, 1.1204833984375, 1.260711669921875, 1.40093994140625, 1.541168212890625, 1.681396484375, 1.821624755859375, 1.96185302734375, 2.102081298828125, 2.2423095703125, 2.382537841796875, 2.52276611328125, 2.662994384765625, 2.80322265625, 2.943450927734375, 3.08367919921875, 3.223907470703125, 3.3641357421875, 3.504364013671875, 3.64459228515625, 3.784820556640625, 3.925048828125, 4.065277099609375, 4.20550537109375, 4.345733642578125, 4.4859619140625, 4.626190185546875, 4.76641845703125, 4.906646728515625, 5.046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 17.0, 11.0, 17.0, 28.0, 39.0, 41.0, 58.0, 99.0, 144.0, 534.0, 1966.0, 446.0, 192.0, 122.0, 80.0, 47.0, 54.0, 29.0, 23.0, 23.0, 16.0, 13.0, 8.0, 14.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.128265380859375, -1.08856201171875, -1.048858642578125, -1.0091552734375, -0.969451904296875, -0.92974853515625, -0.890045166015625, -0.850341796875, -0.810638427734375, -0.77093505859375, -0.731231689453125, -0.6915283203125, -0.651824951171875, -0.61212158203125, -0.572418212890625, -0.53271484375, -0.493011474609375, -0.45330810546875, -0.413604736328125, -0.3739013671875, -0.334197998046875, -0.29449462890625, -0.254791259765625, -0.215087890625, -0.175384521484375, -0.13568115234375, -0.095977783203125, -0.0562744140625, -0.016571044921875, 0.02313232421875, 0.062835693359375, 0.1025390625, 0.142242431640625, 0.18194580078125, 0.221649169921875, 0.2613525390625, 0.301055908203125, 0.34075927734375, 0.380462646484375, 0.420166015625, 0.459869384765625, 0.49957275390625, 0.539276123046875, 0.5789794921875, 0.618682861328125, 0.65838623046875, 0.698089599609375, 0.73779296875, 0.777496337890625, 0.81719970703125, 0.856903076171875, 0.8966064453125, 0.936309814453125, 0.97601318359375, 1.015716552734375, 1.055419921875, 1.095123291015625, 1.13482666015625, 1.174530029296875, 1.2142333984375, 1.253936767578125, 1.29364013671875, 1.333343505859375, 1.373046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 21.0, 110.0, 608.0, 186.0, 51.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8753252029418945, -4.22678279876709, -3.578240394592285, -2.9296982288360596, -2.281155824661255, -1.6326134204864502, -0.9840712547302246, -0.3355288505554199, 0.31301355361938477, 0.9615558981895447, 1.6100982427597046, 2.2586405277252197, 2.9071829319000244, 3.555725336074829, 4.204267501831055, 4.852809906005859, 5.501352310180664, 6.149894714355469, 6.798437118530273, 7.446979522705078, 8.095521926879883, 8.744064331054688, 9.392606735229492, 10.041149139404297, 10.689691543579102, 11.338233947753906, 11.986776351928711, 12.635318756103516, 13.28386116027832, 13.932403564453125, 14.58094596862793, 15.229488372802734, 15.878030776977539, 16.526573181152344, 17.17511558532715, 17.823657989501953, 18.472200393676758, 19.120742797851562, 19.769285202026367, 20.417827606201172, 21.066370010375977, 21.71491241455078, 22.363454818725586, 23.01199722290039, 23.660539627075195, 24.30908203125, 24.957624435424805, 25.60616683959961, 26.25470733642578, 26.903249740600586, 27.55179214477539, 28.200334548950195, 28.848876953125, 29.497419357299805, 30.14596176147461, 30.794504165649414, 31.44304656982422, 32.09158706665039, 32.74013137817383, 33.388671875, 34.03721618652344, 34.68575668334961, 35.33430099487305, 35.98284149169922, 36.631385803222656]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 17.0, 24.0, 39.0, 41.0, 37.0, 35.0, 54.0, 54.0, 56.0, 67.0, 66.0, 78.0, 62.0, 66.0, 53.0, 49.0, 47.0, 24.0, 29.0, 23.0, 14.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1167707443237305, -5.892937183380127, -5.669103622436523, -5.44527006149292, -5.221436500549316, -4.997602939605713, -4.773769378662109, -4.549935340881348, -4.326102256774902, -4.102268695831299, -3.8784351348876953, -3.654601573944092, -3.4307680130004883, -3.2069344520568848, -2.983100652694702, -2.7592670917510986, -2.535433292388916, -2.3115997314453125, -2.087766170501709, -1.863932490348816, -1.6400989294052124, -1.4162653684616089, -1.1924316883087158, -0.9685981273651123, -0.7447645664215088, -0.5209310054779053, -0.297097384929657, -0.07326376438140869, 0.15056979656219482, 0.37440335750579834, 0.5982370376586914, 0.8220705986022949, 1.0459041595458984, 1.269737720489502, 1.4935712814331055, 1.7174049615859985, 1.941238522529602, 2.165071964263916, 2.3889057636260986, 2.612739324569702, 2.8365728855133057, 3.060406446456909, 3.2842400074005127, 3.5080738067626953, 3.731907367706299, 3.9557409286499023, 4.179574489593506, 4.403408050537109, 4.627241611480713, 4.851075172424316, 5.07490873336792, 5.298742294311523, 5.522575855255127, 5.7464094161987305, 5.970243453979492, 6.1940765380859375, 6.417910575866699, 6.641744136810303, 6.865577697753906, 7.08941125869751, 7.313244819641113, 7.537078380584717, 7.76091194152832, 7.984745979309082, 8.208579063415527]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 19.0, 17.0, 32.0, 45.0, 56.0, 93.0, 128.0, 193.0, 300.0, 462.0, 718.0, 1205.0, 1942.0, 3326.0, 5897.0, 11600.0, 26365.0, 780442.0, 170064.0, 22340.0, 10075.0, 5343.0, 3053.0, 1786.0, 1066.0, 695.0, 400.0, 264.0, 164.0, 139.0, 91.0, 62.0, 37.0, 32.0, 21.0, 19.0, 10.0, 5.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.2850341796875, -4.113037109375, -3.9410400390625, -3.76904296875, -3.5970458984375, -3.425048828125, -3.2530517578125, -3.0810546875, -2.9090576171875, -2.737060546875, -2.5650634765625, -2.39306640625, -2.2210693359375, -2.049072265625, -1.8770751953125, -1.705078125, -1.5330810546875, -1.361083984375, -1.1890869140625, -1.01708984375, -0.8450927734375, -0.673095703125, -0.5010986328125, -0.3291015625, -0.1571044921875, 0.014892578125, 0.1868896484375, 0.35888671875, 0.5308837890625, 0.702880859375, 0.8748779296875, 1.046875, 1.2188720703125, 1.390869140625, 1.5628662109375, 1.73486328125, 1.9068603515625, 2.078857421875, 2.2508544921875, 2.4228515625, 2.5948486328125, 2.766845703125, 2.9388427734375, 3.11083984375, 3.2828369140625, 3.454833984375, 3.6268310546875, 3.798828125, 3.9708251953125, 4.142822265625, 4.3148193359375, 4.48681640625, 4.6588134765625, 4.830810546875, 5.0028076171875, 5.1748046875, 5.3468017578125, 5.518798828125, 5.6907958984375, 5.86279296875, 6.0347900390625, 6.206787109375, 6.3787841796875, 6.55078125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 9.0, 8.0, 9.0, 7.0, 8.0, 15.0, 15.0, 41.0, 548.0, 213.0, 24.0, 15.0, 16.0, 8.0, 7.0, 8.0, 4.0, 9.0, 3.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5625, -1.5210418701171875, -1.479583740234375, -1.4381256103515625, -1.39666748046875, -1.3552093505859375, -1.313751220703125, -1.2722930908203125, -1.2308349609375, -1.1893768310546875, -1.147918701171875, -1.1064605712890625, -1.06500244140625, -1.0235443115234375, -0.982086181640625, -0.9406280517578125, -0.899169921875, -0.8577117919921875, -0.816253662109375, -0.7747955322265625, -0.73333740234375, -0.6918792724609375, -0.650421142578125, -0.6089630126953125, -0.5675048828125, -0.5260467529296875, -0.484588623046875, -0.4431304931640625, -0.40167236328125, -0.3602142333984375, -0.318756103515625, -0.2772979736328125, -0.23583984375, -0.1943817138671875, -0.152923583984375, -0.1114654541015625, -0.07000732421875, -0.0285491943359375, 0.012908935546875, 0.0543670654296875, 0.0958251953125, 0.1372833251953125, 0.178741455078125, 0.2201995849609375, 0.26165771484375, 0.3031158447265625, 0.344573974609375, 0.3860321044921875, 0.427490234375, 0.4689483642578125, 0.510406494140625, 0.5518646240234375, 0.59332275390625, 0.6347808837890625, 0.676239013671875, 0.7176971435546875, 0.7591552734375, 0.8006134033203125, 0.842071533203125, 0.8835296630859375, 0.92498779296875, 0.9664459228515625, 1.007904052734375, 1.0493621826171875, 1.0908203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 13.0, 19.0, 28.0, 28.0, 56.0, 64.0, 93.0, 132.0, 172.0, 223.0, 342.0, 504.0, 996.0, 1837.0, 3951.0, 8655.0, 21315.0, 56859.0, 201747.0, 533423.0, 142441.0, 44160.0, 17028.0, 7166.0, 3335.0, 1578.0, 882.0, 427.0, 302.0, 210.0, 141.0, 110.0, 77.0, 70.0, 42.0, 39.0, 20.0, 10.0, 20.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.8828125, -2.79644775390625, -2.7100830078125, -2.62371826171875, -2.537353515625, -2.45098876953125, -2.3646240234375, -2.27825927734375, -2.19189453125, -2.10552978515625, -2.0191650390625, -1.93280029296875, -1.846435546875, -1.76007080078125, -1.6737060546875, -1.58734130859375, -1.5009765625, -1.41461181640625, -1.3282470703125, -1.24188232421875, -1.155517578125, -1.06915283203125, -0.9827880859375, -0.89642333984375, -0.81005859375, -0.72369384765625, -0.6373291015625, -0.55096435546875, -0.464599609375, -0.37823486328125, -0.2918701171875, -0.20550537109375, -0.119140625, -0.03277587890625, 0.0535888671875, 0.13995361328125, 0.226318359375, 0.31268310546875, 0.3990478515625, 0.48541259765625, 0.57177734375, 0.65814208984375, 0.7445068359375, 0.83087158203125, 0.917236328125, 1.00360107421875, 1.0899658203125, 1.17633056640625, 1.2626953125, 1.34906005859375, 1.4354248046875, 1.52178955078125, 1.608154296875, 1.69451904296875, 1.7808837890625, 1.86724853515625, 1.95361328125, 2.03997802734375, 2.1263427734375, 2.21270751953125, 2.299072265625, 2.38543701171875, 2.4718017578125, 2.55816650390625, 2.64453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 9.0, 15.0, 17.0, 17.0, 15.0, 17.0, 24.0, 19.0, 20.0, 31.0, 43.0, 39.0, 40.0, 45.0, 39.0, 40.0, 45.0, 48.0, 45.0, 42.0, 46.0, 34.0, 50.0, 28.0, 34.0, 23.0, 25.0, 21.0, 16.0, 16.0, 14.0, 19.0, 12.0, 5.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.720703125, -3.60357666015625, -3.4864501953125, -3.36932373046875, -3.252197265625, -3.13507080078125, -3.0179443359375, -2.90081787109375, -2.78369140625, -2.66656494140625, -2.5494384765625, -2.43231201171875, -2.315185546875, -2.19805908203125, -2.0809326171875, -1.96380615234375, -1.8466796875, -1.72955322265625, -1.6124267578125, -1.49530029296875, -1.378173828125, -1.26104736328125, -1.1439208984375, -1.02679443359375, -0.90966796875, -0.79254150390625, -0.6754150390625, -0.55828857421875, -0.441162109375, -0.32403564453125, -0.2069091796875, -0.08978271484375, 0.02734375, 0.14447021484375, 0.2615966796875, 0.37872314453125, 0.495849609375, 0.61297607421875, 0.7301025390625, 0.84722900390625, 0.96435546875, 1.08148193359375, 1.1986083984375, 1.31573486328125, 1.432861328125, 1.54998779296875, 1.6671142578125, 1.78424072265625, 1.9013671875, 2.01849365234375, 2.1356201171875, 2.25274658203125, 2.369873046875, 2.48699951171875, 2.6041259765625, 2.72125244140625, 2.83837890625, 2.95550537109375, 3.0726318359375, 3.18975830078125, 3.306884765625, 3.42401123046875, 3.5411376953125, 3.65826416015625, 3.775390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 24.0, 25.0, 46.0, 100.0, 204.0, 643.0, 3193.0, 178243.0, 860567.0, 4204.0, 761.0, 269.0, 119.0, 47.0, 32.0, 16.0, 11.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -12.0118408203125, -11.687744140625, -11.3636474609375, -11.03955078125, -10.7154541015625, -10.391357421875, -10.0672607421875, -9.7431640625, -9.4190673828125, -9.094970703125, -8.7708740234375, -8.44677734375, -8.1226806640625, -7.798583984375, -7.4744873046875, -7.150390625, -6.8262939453125, -6.502197265625, -6.1781005859375, -5.85400390625, -5.5299072265625, -5.205810546875, -4.8817138671875, -4.5576171875, -4.2335205078125, -3.909423828125, -3.5853271484375, -3.26123046875, -2.9371337890625, -2.613037109375, -2.2889404296875, -1.96484375, -1.6407470703125, -1.316650390625, -0.9925537109375, -0.66845703125, -0.3443603515625, -0.020263671875, 0.3038330078125, 0.6279296875, 0.9520263671875, 1.276123046875, 1.6002197265625, 1.92431640625, 2.2484130859375, 2.572509765625, 2.8966064453125, 3.220703125, 3.5447998046875, 3.868896484375, 4.1929931640625, 4.51708984375, 4.8411865234375, 5.165283203125, 5.4893798828125, 5.8134765625, 6.1375732421875, 6.461669921875, 6.7857666015625, 7.10986328125, 7.4339599609375, 7.758056640625, 8.0821533203125, 8.40625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 8.0, 13.0, 20.0, 49.0, 100.0, 287.0, 289.0, 112.0, 57.0, 19.0, 16.0, 5.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00047397613525390625, -0.0004614889621734619, -0.0004490017890930176, -0.00043651461601257324, -0.0004240274429321289, -0.00041154026985168457, -0.00039905309677124023, -0.0003865659236907959, -0.00037407875061035156, -0.0003615915775299072, -0.0003491044044494629, -0.00033661723136901855, -0.0003241300582885742, -0.0003116428852081299, -0.00029915571212768555, -0.0002866685390472412, -0.0002741813659667969, -0.00026169419288635254, -0.0002492070198059082, -0.00023671984672546387, -0.00022423267364501953, -0.0002117455005645752, -0.00019925832748413086, -0.00018677115440368652, -0.0001742839813232422, -0.00016179680824279785, -0.00014930963516235352, -0.00013682246208190918, -0.00012433528900146484, -0.00011184811592102051, -9.936094284057617e-05, -8.687376976013184e-05, -7.43865966796875e-05, -6.189942359924316e-05, -4.941225051879883e-05, -3.692507743835449e-05, -2.4437904357910156e-05, -1.195073127746582e-05, 5.364418029785156e-07, 1.3023614883422852e-05, 2.5510787963867188e-05, 3.7997961044311523e-05, 5.048513412475586e-05, 6.29723072052002e-05, 7.545948028564453e-05, 8.794665336608887e-05, 0.0001004338264465332, 0.00011292099952697754, 0.00012540817260742188, 0.0001378953456878662, 0.00015038251876831055, 0.00016286969184875488, 0.00017535686492919922, 0.00018784403800964355, 0.0002003312110900879, 0.00021281838417053223, 0.00022530555725097656, 0.0002377927303314209, 0.00025027990341186523, 0.00026276707649230957, 0.0002752542495727539, 0.00028774142265319824, 0.0003002285957336426, 0.0003127157688140869, 0.00032520294189453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 7.0, 6.0, 14.0, 31.0, 42.0, 83.0, 136.0, 257.0, 490.0, 1119.0, 3209.0, 11238.0, 77290.0, 847691.0, 88706.0, 12506.0, 3344.0, 1222.0, 539.0, 254.0, 144.0, 75.0, 50.0, 34.0, 14.0, 8.0, 7.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1953125, -3.100006103515625, -3.00469970703125, -2.909393310546875, -2.8140869140625, -2.718780517578125, -2.62347412109375, -2.528167724609375, -2.432861328125, -2.337554931640625, -2.24224853515625, -2.146942138671875, -2.0516357421875, -1.956329345703125, -1.86102294921875, -1.765716552734375, -1.67041015625, -1.575103759765625, -1.47979736328125, -1.384490966796875, -1.2891845703125, -1.193878173828125, -1.09857177734375, -1.003265380859375, -0.907958984375, -0.812652587890625, -0.71734619140625, -0.622039794921875, -0.5267333984375, -0.431427001953125, -0.33612060546875, -0.240814208984375, -0.1455078125, -0.050201416015625, 0.04510498046875, 0.140411376953125, 0.2357177734375, 0.331024169921875, 0.42633056640625, 0.521636962890625, 0.616943359375, 0.712249755859375, 0.80755615234375, 0.902862548828125, 0.9981689453125, 1.093475341796875, 1.18878173828125, 1.284088134765625, 1.37939453125, 1.474700927734375, 1.57000732421875, 1.665313720703125, 1.7606201171875, 1.855926513671875, 1.95123291015625, 2.046539306640625, 2.141845703125, 2.237152099609375, 2.33245849609375, 2.427764892578125, 2.5230712890625, 2.618377685546875, 2.71368408203125, 2.808990478515625, 2.904296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 17.0, 12.0, 14.0, 24.0, 30.0, 34.0, 39.0, 71.0, 89.0, 121.0, 100.0, 100.0, 92.0, 66.0, 52.0, 38.0, 29.0, 15.0, 8.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.12109375, -3.03253173828125, -2.9439697265625, -2.85540771484375, -2.766845703125, -2.67828369140625, -2.5897216796875, -2.50115966796875, -2.41259765625, -2.32403564453125, -2.2354736328125, -2.14691162109375, -2.058349609375, -1.96978759765625, -1.8812255859375, -1.79266357421875, -1.7041015625, -1.61553955078125, -1.5269775390625, -1.43841552734375, -1.349853515625, -1.26129150390625, -1.1727294921875, -1.08416748046875, -0.99560546875, -0.90704345703125, -0.8184814453125, -0.72991943359375, -0.641357421875, -0.55279541015625, -0.4642333984375, -0.37567138671875, -0.287109375, -0.19854736328125, -0.1099853515625, -0.02142333984375, 0.067138671875, 0.15570068359375, 0.2442626953125, 0.33282470703125, 0.42138671875, 0.50994873046875, 0.5985107421875, 0.68707275390625, 0.775634765625, 0.86419677734375, 0.9527587890625, 1.04132080078125, 1.1298828125, 1.21844482421875, 1.3070068359375, 1.39556884765625, 1.484130859375, 1.57269287109375, 1.6612548828125, 1.74981689453125, 1.83837890625, 1.92694091796875, 2.0155029296875, 2.10406494140625, 2.192626953125, 2.28118896484375, 2.3697509765625, 2.45831298828125, 2.546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 4.0, 7.0, 7.0, 18.0, 48.0, 138.0, 338.0, 269.0, 91.0, 35.0, 19.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.83209228515625, -76.24474334716797, -74.65739440917969, -73.0700454711914, -71.48269653320312, -69.89533996582031, -68.30799102783203, -66.72064208984375, -65.13329315185547, -63.54594421386719, -61.958595275878906, -60.37124252319336, -58.78389358520508, -57.1965446472168, -55.60919189453125, -54.02184295654297, -52.43449401855469, -50.847145080566406, -49.259796142578125, -47.67244338989258, -46.0850944519043, -44.497745513916016, -42.91039276123047, -41.32304382324219, -39.735694885253906, -38.148345947265625, -36.560997009277344, -34.9736442565918, -33.386295318603516, -31.798946380615234, -30.21159553527832, -28.624244689941406, -27.03689193725586, -25.449542999267578, -23.862192153930664, -22.27484130859375, -20.68749237060547, -19.100143432617188, -17.512792587280273, -15.925442695617676, -14.338092803955078, -12.75074291229248, -11.163393020629883, -9.576043128967285, -7.9886932373046875, -6.40134334564209, -4.813993453979492, -3.2266435623168945, -1.6392936706542969, -0.05194377899169922, 1.5354061126708984, 3.122756004333496, 4.710105895996094, 6.297455787658691, 7.884805679321289, 9.472155570983887, 11.059505462646484, 12.646855354309082, 14.23420524597168, 15.821555137634277, 17.408905029296875, 18.996253967285156, 20.58360481262207, 22.170955657958984, 23.758304595947266]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 11.0, 11.0, 3.0, 12.0, 22.0, 36.0, 55.0, 82.0, 103.0, 119.0, 136.0, 96.0, 80.0, 53.0, 47.0, 25.0, 20.0, 16.0, 6.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.01615905761719, -61.96639633178711, -59.91663360595703, -57.86686706542969, -55.81710433959961, -53.76734161376953, -51.71757888793945, -49.667816162109375, -47.61804962158203, -45.56828689575195, -43.518524169921875, -41.46875762939453, -39.41899490356445, -37.369232177734375, -35.3194694519043, -33.26970672607422, -31.21994400024414, -29.170181274414062, -27.12041664123535, -25.070653915405273, -23.020889282226562, -20.971126556396484, -18.921363830566406, -16.871601104736328, -14.821836471557617, -12.772072792053223, -10.722309112548828, -8.67254638671875, -6.6227827072143555, -4.573019027709961, -2.523256301879883, -0.4734926223754883, 1.5762710571289062, 3.6260344982147217, 5.675797939300537, 7.725561141967773, 9.775324821472168, 11.825088500976562, 13.87485122680664, 15.924614906311035, 17.97437858581543, 20.024141311645508, 22.07390594482422, 24.123668670654297, 26.173431396484375, 28.223196029663086, 30.272958755493164, 32.322723388671875, 34.37248611450195, 36.42224884033203, 38.47201156616211, 40.52177429199219, 42.57154083251953, 44.62130355834961, 46.67106628417969, 48.720829010009766, 50.770591735839844, 52.82035446166992, 54.8701171875, 56.919883728027344, 58.96964645385742, 61.0194091796875, 63.06917190551758, 65.11893463134766, 67.168701171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 26.0, 27.0, 31.0, 59.0, 101.0, 186.0, 363.0, 827.0, 2101.0, 7581.0, 61495.0, 4088553.0, 27178.0, 3956.0, 1086.0, 374.0, 162.0, 72.0, 34.0, 17.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.53125, -20.984375, -20.4375, -19.890625, -19.34375, -18.796875, -18.25, -17.703125, -17.15625, -16.609375, -16.0625, -15.515625, -14.96875, -14.421875, -13.875, -13.328125, -12.78125, -12.234375, -11.6875, -11.140625, -10.59375, -10.046875, -9.5, -8.953125, -8.40625, -7.859375, -7.3125, -6.765625, -6.21875, -5.671875, -5.125, -4.578125, -4.03125, -3.484375, -2.9375, -2.390625, -1.84375, -1.296875, -0.75, -0.203125, 0.34375, 0.890625, 1.4375, 1.984375, 2.53125, 3.078125, 3.625, 4.171875, 4.71875, 5.265625, 5.8125, 6.359375, 6.90625, 7.453125, 8.0, 8.546875, 9.09375, 9.640625, 10.1875, 10.734375, 11.28125, 11.828125, 12.375, 12.921875, 13.46875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 3.0, 4.0, 5.0, 9.0, 8.0, 7.0, 9.0, 24.0, 73.0, 232.0, 345.0, 149.0, 39.0, 16.0, 14.0, 15.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.48046875, -1.44268798828125, -1.4049072265625, -1.36712646484375, -1.329345703125, -1.29156494140625, -1.2537841796875, -1.21600341796875, -1.17822265625, -1.14044189453125, -1.1026611328125, -1.06488037109375, -1.027099609375, -0.98931884765625, -0.9515380859375, -0.91375732421875, -0.8759765625, -0.83819580078125, -0.8004150390625, -0.76263427734375, -0.724853515625, -0.68707275390625, -0.6492919921875, -0.61151123046875, -0.57373046875, -0.53594970703125, -0.4981689453125, -0.46038818359375, -0.422607421875, -0.38482666015625, -0.3470458984375, -0.30926513671875, -0.271484375, -0.23370361328125, -0.1959228515625, -0.15814208984375, -0.120361328125, -0.08258056640625, -0.0447998046875, -0.00701904296875, 0.03076171875, 0.06854248046875, 0.1063232421875, 0.14410400390625, 0.181884765625, 0.21966552734375, 0.2574462890625, 0.29522705078125, 0.3330078125, 0.37078857421875, 0.4085693359375, 0.44635009765625, 0.484130859375, 0.52191162109375, 0.5596923828125, 0.59747314453125, 0.63525390625, 0.67303466796875, 0.7108154296875, 0.74859619140625, 0.786376953125, 0.82415771484375, 0.8619384765625, 0.89971923828125, 0.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 17.0, 29.0, 30.0, 90.0, 143.0, 324.0, 759.0, 2175.0, 8958.0, 69429.0, 3933878.0, 158356.0, 14671.0, 3394.0, 1064.0, 488.0, 197.0, 95.0, 53.0, 39.0, 20.0, 18.0, 10.0, 10.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0572509765625, -7.794189453125, -7.5311279296875, -7.26806640625, -7.0050048828125, -6.741943359375, -6.4788818359375, -6.2158203125, -5.9527587890625, -5.689697265625, -5.4266357421875, -5.16357421875, -4.9005126953125, -4.637451171875, -4.3743896484375, -4.111328125, -3.8482666015625, -3.585205078125, -3.3221435546875, -3.05908203125, -2.7960205078125, -2.532958984375, -2.2698974609375, -2.0068359375, -1.7437744140625, -1.480712890625, -1.2176513671875, -0.95458984375, -0.6915283203125, -0.428466796875, -0.1654052734375, 0.09765625, 0.3607177734375, 0.623779296875, 0.8868408203125, 1.14990234375, 1.4129638671875, 1.676025390625, 1.9390869140625, 2.2021484375, 2.4652099609375, 2.728271484375, 2.9913330078125, 3.25439453125, 3.5174560546875, 3.780517578125, 4.0435791015625, 4.306640625, 4.5697021484375, 4.832763671875, 5.0958251953125, 5.35888671875, 5.6219482421875, 5.885009765625, 6.1480712890625, 6.4111328125, 6.6741943359375, 6.937255859375, 7.2003173828125, 7.46337890625, 7.7264404296875, 7.989501953125, 8.2525634765625, 8.515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 15.0, 14.0, 19.0, 25.0, 47.0, 52.0, 75.0, 130.0, 245.0, 725.0, 1808.0, 375.0, 158.0, 113.0, 82.0, 40.0, 30.0, 24.0, 14.0, 20.0, 9.0, 9.0, 6.0, 8.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.15625, -1.120361328125, -1.08447265625, -1.048583984375, -1.0126953125, -0.976806640625, -0.94091796875, -0.905029296875, -0.869140625, -0.833251953125, -0.79736328125, -0.761474609375, -0.7255859375, -0.689697265625, -0.65380859375, -0.617919921875, -0.58203125, -0.546142578125, -0.51025390625, -0.474365234375, -0.4384765625, -0.402587890625, -0.36669921875, -0.330810546875, -0.294921875, -0.259033203125, -0.22314453125, -0.187255859375, -0.1513671875, -0.115478515625, -0.07958984375, -0.043701171875, -0.0078125, 0.028076171875, 0.06396484375, 0.099853515625, 0.1357421875, 0.171630859375, 0.20751953125, 0.243408203125, 0.279296875, 0.315185546875, 0.35107421875, 0.386962890625, 0.4228515625, 0.458740234375, 0.49462890625, 0.530517578125, 0.56640625, 0.602294921875, 0.63818359375, 0.674072265625, 0.7099609375, 0.745849609375, 0.78173828125, 0.817626953125, 0.853515625, 0.889404296875, 0.92529296875, 0.961181640625, 0.9970703125, 1.032958984375, 1.06884765625, 1.104736328125, 1.140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 29.0, 836.0, 119.0, 10.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.163687705993652, -4.046584129333496, -2.9294800758361816, -1.8123762607574463, -0.6952724456787109, 0.4218311309814453, 1.5389351844787598, 2.656039237976074, 3.7731428146362305, 4.890246391296387, 6.007350444793701, 7.124454498291016, 8.241558074951172, 9.358661651611328, 10.475765228271484, 11.592869758605957, 12.709973335266113, 13.82707691192627, 14.944181442260742, 16.0612850189209, 17.178388595581055, 18.29549217224121, 19.412595748901367, 20.529701232910156, 21.646804809570312, 22.76390838623047, 23.881011962890625, 24.99811553955078, 26.115219116210938, 27.232322692871094, 28.349428176879883, 29.46653175354004, 30.583633422851562, 31.70073699951172, 32.817840576171875, 33.93494415283203, 35.05204772949219, 36.169151306152344, 37.2862548828125, 38.403358459472656, 39.52046203613281, 40.63756561279297, 41.754669189453125, 42.87177276611328, 43.98887634277344, 45.105979919433594, 46.22308349609375, 47.340187072753906, 48.45729446411133, 49.574398040771484, 50.69150161743164, 51.8086051940918, 52.92570877075195, 54.04281234741211, 55.159915924072266, 56.27702331542969, 57.394126892089844, 58.51123046875, 59.628334045410156, 60.74543762207031, 61.86254119873047, 62.979644775390625, 64.09674835205078, 65.21385192871094, 66.3309555053711]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 12.0, 12.0, 19.0, 22.0, 15.0, 27.0, 35.0, 42.0, 41.0, 43.0, 57.0, 75.0, 74.0, 55.0, 66.0, 58.0, 63.0, 58.0, 37.0, 43.0, 32.0, 18.0, 17.0, 12.0, 9.0, 12.0, 4.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.042205810546875, -4.890949726104736, -4.739693641662598, -4.588437557220459, -4.43718147277832, -4.285925388336182, -4.134669303894043, -3.9834132194519043, -3.8321571350097656, -3.680901050567627, -3.5296449661254883, -3.3783888816833496, -3.227132797241211, -3.0758767127990723, -2.9246206283569336, -2.773364543914795, -2.622108221054077, -2.4708521366119385, -2.3195960521698, -2.168339967727661, -2.0170838832855225, -1.8658277988433838, -1.7145715951919556, -1.563315510749817, -1.4120594263076782, -1.2608033418655396, -1.1095472574234009, -0.9582911133766174, -0.8070350289344788, -0.6557789444923401, -0.5045228004455566, -0.35326671600341797, -0.2020106315612793, -0.05075453221797943, 0.10050156712532043, 0.2517576813697815, 0.40301376581192017, 0.5542698502540588, 0.7055259943008423, 0.856782078742981, 1.0080381631851196, 1.1592942476272583, 1.310550332069397, 1.4618065357208252, 1.6130626201629639, 1.7643187046051025, 1.9155747890472412, 2.06683087348938, 2.2180869579315186, 2.3693430423736572, 2.520599126815796, 2.6718552112579346, 2.8231112957000732, 2.974367380142212, 3.1256237030029297, 3.2768797874450684, 3.428135871887207, 3.5793919563293457, 3.7306480407714844, 3.881904125213623, 4.033160209655762, 4.1844162940979, 4.335672378540039, 4.486928462982178, 4.638184547424316]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 12.0, 11.0, 24.0, 26.0, 40.0, 54.0, 65.0, 101.0, 161.0, 220.0, 390.0, 695.0, 1318.0, 2546.0, 5185.0, 12221.0, 48434.0, 871957.0, 77848.0, 14716.0, 5909.0, 2919.0, 1553.0, 836.0, 455.0, 260.0, 163.0, 116.0, 69.0, 52.0, 38.0, 37.0, 21.0, 21.0, 15.0, 11.0, 17.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.21875, -7.9586181640625, -7.698486328125, -7.4383544921875, -7.17822265625, -6.9180908203125, -6.657958984375, -6.3978271484375, -6.1376953125, -5.8775634765625, -5.617431640625, -5.3572998046875, -5.09716796875, -4.8370361328125, -4.576904296875, -4.3167724609375, -4.056640625, -3.7965087890625, -3.536376953125, -3.2762451171875, -3.01611328125, -2.7559814453125, -2.495849609375, -2.2357177734375, -1.9755859375, -1.7154541015625, -1.455322265625, -1.1951904296875, -0.93505859375, -0.6749267578125, -0.414794921875, -0.1546630859375, 0.10546875, 0.3656005859375, 0.625732421875, 0.8858642578125, 1.14599609375, 1.4061279296875, 1.666259765625, 1.9263916015625, 2.1865234375, 2.4466552734375, 2.706787109375, 2.9669189453125, 3.22705078125, 3.4871826171875, 3.747314453125, 4.0074462890625, 4.267578125, 4.5277099609375, 4.787841796875, 5.0479736328125, 5.30810546875, 5.5682373046875, 5.828369140625, 6.0885009765625, 6.3486328125, 6.6087646484375, 6.868896484375, 7.1290283203125, 7.38916015625, 7.6492919921875, 7.909423828125, 8.1695556640625, 8.4296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 12.0, 12.0, 23.0, 52.0, 173.0, 318.0, 212.0, 77.0, 30.0, 13.0, 12.0, 6.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5654296875, -1.5286026000976562, -1.4917755126953125, -1.4549484252929688, -1.418121337890625, -1.3812942504882812, -1.3444671630859375, -1.3076400756835938, -1.27081298828125, -1.2339859008789062, -1.1971588134765625, -1.1603317260742188, -1.123504638671875, -1.0866775512695312, -1.0498504638671875, -1.0130233764648438, -0.9761962890625, -0.9393692016601562, -0.9025421142578125, -0.8657150268554688, -0.828887939453125, -0.7920608520507812, -0.7552337646484375, -0.7184066772460938, -0.68157958984375, -0.6447525024414062, -0.6079254150390625, -0.5710983276367188, -0.534271240234375, -0.49744415283203125, -0.4606170654296875, -0.42378997802734375, -0.386962890625, -0.35013580322265625, -0.3133087158203125, -0.27648162841796875, -0.239654541015625, -0.20282745361328125, -0.1660003662109375, -0.12917327880859375, -0.09234619140625, -0.05551910400390625, -0.0186920166015625, 0.01813507080078125, 0.054962158203125, 0.09178924560546875, 0.1286163330078125, 0.16544342041015625, 0.2022705078125, 0.23909759521484375, 0.2759246826171875, 0.31275177001953125, 0.349578857421875, 0.38640594482421875, 0.4232330322265625, 0.46006011962890625, 0.49688720703125, 0.5337142944335938, 0.5705413818359375, 0.6073684692382812, 0.644195556640625, 0.6810226440429688, 0.7178497314453125, 0.7546768188476562, 0.79150390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 8.0, 11.0, 8.0, 18.0, 13.0, 24.0, 28.0, 38.0, 56.0, 65.0, 132.0, 194.0, 378.0, 723.0, 1588.0, 4278.0, 14141.0, 55328.0, 308039.0, 547742.0, 86044.0, 19983.0, 5811.0, 1964.0, 881.0, 397.0, 232.0, 123.0, 79.0, 57.0, 38.0, 23.0, 23.0, 14.0, 15.0, 15.0, 12.0, 7.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.9588623046875, -3.831787109375, -3.7047119140625, -3.57763671875, -3.4505615234375, -3.323486328125, -3.1964111328125, -3.0693359375, -2.9422607421875, -2.815185546875, -2.6881103515625, -2.56103515625, -2.4339599609375, -2.306884765625, -2.1798095703125, -2.052734375, -1.9256591796875, -1.798583984375, -1.6715087890625, -1.54443359375, -1.4173583984375, -1.290283203125, -1.1632080078125, -1.0361328125, -0.9090576171875, -0.781982421875, -0.6549072265625, -0.52783203125, -0.4007568359375, -0.273681640625, -0.1466064453125, -0.01953125, 0.1075439453125, 0.234619140625, 0.3616943359375, 0.48876953125, 0.6158447265625, 0.742919921875, 0.8699951171875, 0.9970703125, 1.1241455078125, 1.251220703125, 1.3782958984375, 1.50537109375, 1.6324462890625, 1.759521484375, 1.8865966796875, 2.013671875, 2.1407470703125, 2.267822265625, 2.3948974609375, 2.52197265625, 2.6490478515625, 2.776123046875, 2.9031982421875, 3.0302734375, 3.1573486328125, 3.284423828125, 3.4114990234375, 3.53857421875, 3.6656494140625, 3.792724609375, 3.9197998046875, 4.046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 14.0, 11.0, 21.0, 16.0, 21.0, 27.0, 30.0, 29.0, 26.0, 23.0, 33.0, 44.0, 35.0, 35.0, 42.0, 39.0, 41.0, 41.0, 43.0, 33.0, 38.0, 38.0, 36.0, 37.0, 22.0, 32.0, 28.0, 19.0, 16.0, 14.0, 15.0, 13.0, 15.0, 10.0, 9.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.445953369140625, -2.36846923828125, -2.290985107421875, -2.2135009765625, -2.136016845703125, -2.05853271484375, -1.981048583984375, -1.903564453125, -1.826080322265625, -1.74859619140625, -1.671112060546875, -1.5936279296875, -1.516143798828125, -1.43865966796875, -1.361175537109375, -1.28369140625, -1.206207275390625, -1.12872314453125, -1.051239013671875, -0.9737548828125, -0.896270751953125, -0.81878662109375, -0.741302490234375, -0.663818359375, -0.586334228515625, -0.50885009765625, -0.431365966796875, -0.3538818359375, -0.276397705078125, -0.19891357421875, -0.121429443359375, -0.0439453125, 0.033538818359375, 0.11102294921875, 0.188507080078125, 0.2659912109375, 0.343475341796875, 0.42095947265625, 0.498443603515625, 0.575927734375, 0.653411865234375, 0.73089599609375, 0.808380126953125, 0.8858642578125, 0.963348388671875, 1.04083251953125, 1.118316650390625, 1.19580078125, 1.273284912109375, 1.35076904296875, 1.428253173828125, 1.5057373046875, 1.583221435546875, 1.66070556640625, 1.738189697265625, 1.815673828125, 1.893157958984375, 1.97064208984375, 2.048126220703125, 2.1256103515625, 2.203094482421875, 2.28057861328125, 2.358062744140625, 2.435546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 4.0, 11.0, 14.0, 17.0, 26.0, 48.0, 73.0, 130.0, 288.0, 721.0, 2048.0, 12330.0, 971291.0, 56229.0, 3400.0, 1054.0, 374.0, 223.0, 110.0, 48.0, 30.0, 19.0, 17.0, 9.0, 8.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.94921875, -7.73260498046875, -7.5159912109375, -7.29937744140625, -7.082763671875, -6.86614990234375, -6.6495361328125, -6.43292236328125, -6.21630859375, -5.99969482421875, -5.7830810546875, -5.56646728515625, -5.349853515625, -5.13323974609375, -4.9166259765625, -4.70001220703125, -4.4833984375, -4.26678466796875, -4.0501708984375, -3.83355712890625, -3.616943359375, -3.40032958984375, -3.1837158203125, -2.96710205078125, -2.75048828125, -2.53387451171875, -2.3172607421875, -2.10064697265625, -1.884033203125, -1.66741943359375, -1.4508056640625, -1.23419189453125, -1.017578125, -0.80096435546875, -0.5843505859375, -0.36773681640625, -0.151123046875, 0.06549072265625, 0.2821044921875, 0.49871826171875, 0.71533203125, 0.93194580078125, 1.1485595703125, 1.36517333984375, 1.581787109375, 1.79840087890625, 2.0150146484375, 2.23162841796875, 2.4482421875, 2.66485595703125, 2.8814697265625, 3.09808349609375, 3.314697265625, 3.53131103515625, 3.7479248046875, 3.96453857421875, 4.18115234375, 4.39776611328125, 4.6143798828125, 4.83099365234375, 5.047607421875, 5.26422119140625, 5.4808349609375, 5.69744873046875, 5.9140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 10.0, 20.0, 36.0, 64.0, 208.0, 354.0, 161.0, 78.0, 31.0, 16.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042366981506347656, -0.00041138753294944763, -0.0003991052508354187, -0.00038682296872138977, -0.00037454068660736084, -0.0003622584044933319, -0.000349976122379303, -0.00033769384026527405, -0.0003254115581512451, -0.0003131292760372162, -0.00030084699392318726, -0.0002885647118091583, -0.0002762824296951294, -0.00026400014758110046, -0.00025171786546707153, -0.0002394355833530426, -0.00022715330123901367, -0.00021487101912498474, -0.0002025887370109558, -0.00019030645489692688, -0.00017802417278289795, -0.00016574189066886902, -0.0001534596085548401, -0.00014117732644081116, -0.00012889504432678223, -0.0001166127622127533, -0.00010433048009872437, -9.204819798469543e-05, -7.97659158706665e-05, -6.748363375663757e-05, -5.520135164260864e-05, -4.291906952857971e-05, -3.063678741455078e-05, -1.835450530052185e-05, -6.07222318649292e-06, 6.210058927536011e-06, 1.849234104156494e-05, 3.077462315559387e-05, 4.30569052696228e-05, 5.5339187383651733e-05, 6.762146949768066e-05, 7.99037516117096e-05, 9.218603372573853e-05, 0.00010446831583976746, 0.00011675059795379639, 0.00012903288006782532, 0.00014131516218185425, 0.00015359744429588318, 0.0001658797264099121, 0.00017816200852394104, 0.00019044429063796997, 0.0002027265727519989, 0.00021500885486602783, 0.00022729113698005676, 0.0002395734190940857, 0.0002518557012081146, 0.00026413798332214355, 0.0002764202654361725, 0.0002887025475502014, 0.00030098482966423035, 0.0003132671117782593, 0.0003255493938922882, 0.00033783167600631714, 0.00035011395812034607, 0.000362396240234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 7.0, 13.0, 23.0, 41.0, 102.0, 159.0, 307.0, 759.0, 2196.0, 11191.0, 227269.0, 777313.0, 23912.0, 3438.0, 1013.0, 426.0, 182.0, 75.0, 38.0, 26.0, 18.0, 12.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.21661376953125, -4.0894775390625, -3.96234130859375, -3.835205078125, -3.70806884765625, -3.5809326171875, -3.45379638671875, -3.32666015625, -3.19952392578125, -3.0723876953125, -2.94525146484375, -2.818115234375, -2.69097900390625, -2.5638427734375, -2.43670654296875, -2.3095703125, -2.18243408203125, -2.0552978515625, -1.92816162109375, -1.801025390625, -1.67388916015625, -1.5467529296875, -1.41961669921875, -1.29248046875, -1.16534423828125, -1.0382080078125, -0.91107177734375, -0.783935546875, -0.65679931640625, -0.5296630859375, -0.40252685546875, -0.275390625, -0.14825439453125, -0.0211181640625, 0.10601806640625, 0.233154296875, 0.36029052734375, 0.4874267578125, 0.61456298828125, 0.74169921875, 0.86883544921875, 0.9959716796875, 1.12310791015625, 1.250244140625, 1.37738037109375, 1.5045166015625, 1.63165283203125, 1.7587890625, 1.88592529296875, 2.0130615234375, 2.14019775390625, 2.267333984375, 2.39447021484375, 2.5216064453125, 2.64874267578125, 2.77587890625, 2.90301513671875, 3.0301513671875, 3.15728759765625, 3.284423828125, 3.41156005859375, 3.5386962890625, 3.66583251953125, 3.79296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 10.0, 8.0, 24.0, 26.0, 40.0, 49.0, 72.0, 69.0, 110.0, 170.0, 117.0, 89.0, 77.0, 43.0, 31.0, 20.0, 12.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.728515625, -2.649261474609375, -2.57000732421875, -2.490753173828125, -2.4114990234375, -2.332244873046875, -2.25299072265625, -2.173736572265625, -2.094482421875, -2.015228271484375, -1.93597412109375, -1.856719970703125, -1.7774658203125, -1.698211669921875, -1.61895751953125, -1.539703369140625, -1.46044921875, -1.381195068359375, -1.30194091796875, -1.222686767578125, -1.1434326171875, -1.064178466796875, -0.98492431640625, -0.905670166015625, -0.826416015625, -0.747161865234375, -0.66790771484375, -0.588653564453125, -0.5093994140625, -0.430145263671875, -0.35089111328125, -0.271636962890625, -0.1923828125, -0.113128662109375, -0.03387451171875, 0.045379638671875, 0.1246337890625, 0.203887939453125, 0.28314208984375, 0.362396240234375, 0.441650390625, 0.520904541015625, 0.60015869140625, 0.679412841796875, 0.7586669921875, 0.837921142578125, 0.91717529296875, 0.996429443359375, 1.07568359375, 1.154937744140625, 1.23419189453125, 1.313446044921875, 1.3927001953125, 1.471954345703125, 1.55120849609375, 1.630462646484375, 1.709716796875, 1.788970947265625, 1.86822509765625, 1.947479248046875, 2.0267333984375, 2.105987548828125, 2.18524169921875, 2.264495849609375, 2.34375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 19.0, 44.0, 132.0, 487.0, 232.0, 52.0, 18.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.1846923828125, -64.59866333007812, -63.012638092041016, -61.426612854003906, -59.84058380126953, -58.25455856323242, -56.66852951049805, -55.08250427246094, -53.49647521972656, -51.91044998168945, -50.32442092895508, -48.73839569091797, -47.152366638183594, -45.566341400146484, -43.98031234741211, -42.394287109375, -40.808258056640625, -39.222232818603516, -37.63620376586914, -36.05017852783203, -34.464149475097656, -32.87812423706055, -31.292095184326172, -29.706069946289062, -28.120044708251953, -26.53401756286621, -24.94799041748047, -23.361963272094727, -21.775936126708984, -20.189908981323242, -18.6038818359375, -17.01785659790039, -15.431827545166016, -13.845800399780273, -12.259773254394531, -10.673746109008789, -9.087718963623047, -7.501692295074463, -5.915665626525879, -4.329638481140137, -2.7436113357543945, -1.157584309577942, 0.42844271659851074, 2.014469623565674, 3.600496768951416, 5.186523914337158, 6.772550582885742, 8.358577728271484, 9.944604873657227, 11.530632019042969, 13.116659164428711, 14.702686309814453, 16.288713455200195, 17.874740600585938, 19.460765838623047, 21.046794891357422, 22.63282012939453, 24.218847274780273, 25.804874420166016, 27.390901565551758, 28.9769287109375, 30.562955856323242, 32.148983001708984, 33.735008239746094, 35.32103729248047]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 7.0, 9.0, 27.0, 34.0, 40.0, 48.0, 54.0, 83.0, 70.0, 95.0, 91.0, 85.0, 77.0, 55.0, 46.0, 30.0, 29.0, 18.0, 21.0, 9.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.79064178466797, -34.79438400268555, -33.79812240600586, -32.80186462402344, -31.80560302734375, -30.809343338012695, -29.81308364868164, -28.81682586669922, -27.82056427001953, -26.824304580688477, -25.828044891357422, -24.831785202026367, -23.835525512695312, -22.839265823364258, -21.843006134033203, -20.84674835205078, -19.850488662719727, -18.854228973388672, -17.857969284057617, -16.861709594726562, -15.865449905395508, -14.869190216064453, -13.872931480407715, -12.87667179107666, -11.880412101745605, -10.88415241241455, -9.887892723083496, -8.891633987426758, -7.895373821258545, -6.89911413192749, -5.902854919433594, -4.906595230102539, -3.9103355407714844, -2.9140758514404297, -1.917816400527954, -0.9215569496154785, 0.07470273971557617, 1.0709624290466309, 2.0672216415405273, 3.063481330871582, 4.059741020202637, 5.056000709533691, 6.052260398864746, 7.048519611358643, 8.044778823852539, 9.041038513183594, 10.037298202514648, 11.033557891845703, 12.029817581176758, 13.026077270507812, 14.022336959838867, 15.018596649169922, 16.014856338500977, 17.01111602783203, 18.007373809814453, 19.00363540649414, 19.999893188476562, 20.996152877807617, 21.992412567138672, 22.988672256469727, 23.98493194580078, 24.981191635131836, 25.97745132446289, 26.973709106445312, 27.969970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 3.0, 7.0, 4.0, 8.0, 8.0, 6.0, 6.0, 11.0, 10.0, 21.0, 26.0, 27.0, 32.0, 34.0, 44.0, 60.0, 89.0, 80.0, 98.0, 152.0, 172.0, 220.0, 291.0, 448.0, 883.0, 1711.0, 3578.0, 11374.0, 139544.0, 4002693.0, 22634.0, 5071.0, 2162.0, 1084.0, 606.0, 342.0, 238.0, 153.0, 87.0, 67.0, 56.0, 44.0, 22.0, 16.0, 12.0, 12.0, 10.0, 5.0, 5.0], "bins": [-20.15625, -19.7000732421875, -19.243896484375, -18.7877197265625, -18.33154296875, -17.8753662109375, -17.419189453125, -16.9630126953125, -16.5068359375, -16.0506591796875, -15.594482421875, -15.1383056640625, -14.68212890625, -14.2259521484375, -13.769775390625, -13.3135986328125, -12.857421875, -12.4012451171875, -11.945068359375, -11.4888916015625, -11.03271484375, -10.5765380859375, -10.120361328125, -9.6641845703125, -9.2080078125, -8.7518310546875, -8.295654296875, -7.8394775390625, -7.38330078125, -6.9271240234375, -6.470947265625, -6.0147705078125, -5.55859375, -5.1024169921875, -4.646240234375, -4.1900634765625, -3.73388671875, -3.2777099609375, -2.821533203125, -2.3653564453125, -1.9091796875, -1.4530029296875, -0.996826171875, -0.5406494140625, -0.08447265625, 0.3717041015625, 0.827880859375, 1.2840576171875, 1.740234375, 2.1964111328125, 2.652587890625, 3.1087646484375, 3.56494140625, 4.0211181640625, 4.477294921875, 4.9334716796875, 5.3896484375, 5.8458251953125, 6.302001953125, 6.7581787109375, 7.21435546875, 7.6705322265625, 8.126708984375, 8.5828857421875, 9.0390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 13.0, 16.0, 14.0, 34.0, 96.0, 215.0, 266.0, 170.0, 75.0, 32.0, 17.0, 12.0, 11.0, 11.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.736328125, -1.6971435546875, -1.657958984375, -1.6187744140625, -1.57958984375, -1.5404052734375, -1.501220703125, -1.4620361328125, -1.4228515625, -1.3836669921875, -1.344482421875, -1.3052978515625, -1.26611328125, -1.2269287109375, -1.187744140625, -1.1485595703125, -1.109375, -1.0701904296875, -1.031005859375, -0.9918212890625, -0.95263671875, -0.9134521484375, -0.874267578125, -0.8350830078125, -0.7958984375, -0.7567138671875, -0.717529296875, -0.6783447265625, -0.63916015625, -0.5999755859375, -0.560791015625, -0.5216064453125, -0.482421875, -0.4432373046875, -0.404052734375, -0.3648681640625, -0.32568359375, -0.2864990234375, -0.247314453125, -0.2081298828125, -0.1689453125, -0.1297607421875, -0.090576171875, -0.0513916015625, -0.01220703125, 0.0269775390625, 0.066162109375, 0.1053466796875, 0.14453125, 0.1837158203125, 0.222900390625, 0.2620849609375, 0.30126953125, 0.3404541015625, 0.379638671875, 0.4188232421875, 0.4580078125, 0.4971923828125, 0.536376953125, 0.5755615234375, 0.61474609375, 0.6539306640625, 0.693115234375, 0.7322998046875, 0.771484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 10.0, 19.0, 20.0, 45.0, 69.0, 110.0, 275.0, 1014.0, 8852.0, 1870234.0, 2303047.0, 8938.0, 1082.0, 239.0, 87.0, 65.0, 47.0, 29.0, 17.0, 13.0, 8.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.1385498046875, -12.613037109375, -12.0875244140625, -11.56201171875, -11.0364990234375, -10.510986328125, -9.9854736328125, -9.4599609375, -8.9344482421875, -8.408935546875, -7.8834228515625, -7.35791015625, -6.8323974609375, -6.306884765625, -5.7813720703125, -5.255859375, -4.7303466796875, -4.204833984375, -3.6793212890625, -3.15380859375, -2.6282958984375, -2.102783203125, -1.5772705078125, -1.0517578125, -0.5262451171875, -0.000732421875, 0.5247802734375, 1.05029296875, 1.5758056640625, 2.101318359375, 2.6268310546875, 3.15234375, 3.6778564453125, 4.203369140625, 4.7288818359375, 5.25439453125, 5.7799072265625, 6.305419921875, 6.8309326171875, 7.3564453125, 7.8819580078125, 8.407470703125, 8.9329833984375, 9.45849609375, 9.9840087890625, 10.509521484375, 11.0350341796875, 11.560546875, 12.0860595703125, 12.611572265625, 13.1370849609375, 13.66259765625, 14.1881103515625, 14.713623046875, 15.2391357421875, 15.7646484375, 16.2901611328125, 16.815673828125, 17.3411865234375, 17.86669921875, 18.3922119140625, 18.917724609375, 19.4432373046875, 19.96875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 4.0, 11.0, 13.0, 18.0, 20.0, 28.0, 38.0, 62.0, 129.0, 346.0, 2299.0, 652.0, 179.0, 87.0, 47.0, 35.0, 30.0, 9.0, 11.0, 9.0, 9.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.068359375, -2.018768310546875, -1.96917724609375, -1.919586181640625, -1.8699951171875, -1.820404052734375, -1.77081298828125, -1.721221923828125, -1.671630859375, -1.622039794921875, -1.57244873046875, -1.522857666015625, -1.4732666015625, -1.423675537109375, -1.37408447265625, -1.324493408203125, -1.27490234375, -1.225311279296875, -1.17572021484375, -1.126129150390625, -1.0765380859375, -1.026947021484375, -0.97735595703125, -0.927764892578125, -0.878173828125, -0.828582763671875, -0.77899169921875, -0.729400634765625, -0.6798095703125, -0.630218505859375, -0.58062744140625, -0.531036376953125, -0.4814453125, -0.431854248046875, -0.38226318359375, -0.332672119140625, -0.2830810546875, -0.233489990234375, -0.18389892578125, -0.134307861328125, -0.084716796875, -0.035125732421875, 0.01446533203125, 0.064056396484375, 0.1136474609375, 0.163238525390625, 0.21282958984375, 0.262420654296875, 0.31201171875, 0.361602783203125, 0.41119384765625, 0.460784912109375, 0.5103759765625, 0.559967041015625, 0.60955810546875, 0.659149169921875, 0.708740234375, 0.758331298828125, 0.80792236328125, 0.857513427734375, 0.9071044921875, 0.956695556640625, 1.00628662109375, 1.055877685546875, 1.10546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 10.0, 35.0, 159.0, 571.0, 183.0, 34.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5868446826934814, -3.0413684844970703, -2.495892286300659, -1.950416088104248, -1.404939889907837, -0.8594636917114258, -0.31398749351501465, 0.23148870468139648, 0.7769649028778076, 1.3224411010742188, 1.8679172992706299, 2.413393497467041, 2.958869695663452, 3.5043458938598633, 4.049821853637695, 4.5952982902526855, 5.140774726867676, 5.686250686645508, 6.231727123260498, 6.777203559875488, 7.32267951965332, 7.868155479431152, 8.413631439208984, 8.959108352661133, 9.504584312438965, 10.050060272216797, 10.595537185668945, 11.141013145446777, 11.68648910522461, 12.231965065002441, 12.777441024780273, 13.322917938232422, 13.86839485168457, 14.413870811462402, 14.959346771240234, 15.504823684692383, 16.05030059814453, 16.595775604248047, 17.141252517700195, 17.68672752380371, 18.23220443725586, 18.777681350708008, 19.323156356811523, 19.868633270263672, 20.414108276367188, 20.959585189819336, 21.505062103271484, 22.050537109375, 22.59601402282715, 23.141490936279297, 23.686965942382812, 24.23244285583496, 24.77791976928711, 25.323394775390625, 25.868871688842773, 26.41434669494629, 26.959823608398438, 27.505300521850586, 28.0507755279541, 28.59625244140625, 29.141727447509766, 29.687204360961914, 30.232681274414062, 30.778156280517578, 31.323633193969727]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 4.0, 15.0, 17.0, 12.0, 22.0, 25.0, 32.0, 26.0, 40.0, 43.0, 54.0, 45.0, 62.0, 51.0, 66.0, 63.0, 51.0, 57.0, 60.0, 32.0, 38.0, 29.0, 26.0, 22.0, 17.0, 23.0, 8.0, 6.0, 8.0, 8.0, 3.0, 2.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2804365158081055, -5.115255355834961, -4.950074672698975, -4.78489351272583, -4.619712829589844, -4.454531669616699, -4.289350509643555, -4.124169826507568, -3.958988666534424, -3.7938077449798584, -3.628626823425293, -3.4634456634521484, -3.298264741897583, -3.1330838203430176, -2.967902898788452, -2.8027219772338867, -2.6375410556793213, -2.472360134124756, -2.3071792125701904, -2.141998291015625, -1.9768171310424805, -1.811636209487915, -1.6464552879333496, -1.4812742471694946, -1.3160933256149292, -1.1509124040603638, -0.9857313632965088, -0.8205504417419434, -0.6553694605827332, -0.49018847942352295, -0.3250075578689575, -0.15982651710510254, 0.005354404449462891, 0.1705353707075119, 0.3357163369655609, 0.5008972883224487, 0.6660782694816589, 0.8312592506408691, 0.9964401721954346, 1.1616212129592896, 1.326802134513855, 1.4919830560684204, 1.6571640968322754, 1.8223450183868408, 1.9875259399414062, 2.152707099914551, 2.317887783050537, 2.4830689430236816, 2.648249864578247, 2.8134307861328125, 2.978611707687378, 3.1437926292419434, 3.308973789215088, 3.4741547107696533, 3.6393356323242188, 3.8045167922973633, 3.9696974754333496, 4.134878635406494, 4.3000593185424805, 4.465240478515625, 4.630421161651611, 4.795602321624756, 4.960783004760742, 5.125964164733887, 5.291145324707031]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 8.0, 8.0, 12.0, 22.0, 29.0, 34.0, 65.0, 102.0, 171.0, 339.0, 617.0, 1259.0, 3605.0, 26275.0, 948354.0, 59387.0, 5136.0, 1597.0, 666.0, 375.0, 193.0, 103.0, 59.0, 43.0, 28.0, 18.0, 18.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.237548828125, -12.81884765625, -12.400146484375, -11.9814453125, -11.562744140625, -11.14404296875, -10.725341796875, -10.306640625, -9.887939453125, -9.46923828125, -9.050537109375, -8.6318359375, -8.213134765625, -7.79443359375, -7.375732421875, -6.95703125, -6.538330078125, -6.11962890625, -5.700927734375, -5.2822265625, -4.863525390625, -4.44482421875, -4.026123046875, -3.607421875, -3.188720703125, -2.77001953125, -2.351318359375, -1.9326171875, -1.513916015625, -1.09521484375, -0.676513671875, -0.2578125, 0.160888671875, 0.57958984375, 0.998291015625, 1.4169921875, 1.835693359375, 2.25439453125, 2.673095703125, 3.091796875, 3.510498046875, 3.92919921875, 4.347900390625, 4.7666015625, 5.185302734375, 5.60400390625, 6.022705078125, 6.44140625, 6.860107421875, 7.27880859375, 7.697509765625, 8.1162109375, 8.534912109375, 8.95361328125, 9.372314453125, 9.791015625, 10.209716796875, 10.62841796875, 11.047119140625, 11.4658203125, 11.884521484375, 12.30322265625, 12.721923828125, 13.140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 18.0, 39.0, 87.0, 200.0, 214.0, 192.0, 136.0, 48.0, 24.0, 4.0, 12.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.6535186767578125, -1.614654541015625, -1.5757904052734375, -1.53692626953125, -1.4980621337890625, -1.459197998046875, -1.4203338623046875, -1.3814697265625, -1.3426055908203125, -1.303741455078125, -1.2648773193359375, -1.22601318359375, -1.1871490478515625, -1.148284912109375, -1.1094207763671875, -1.070556640625, -1.0316925048828125, -0.992828369140625, -0.9539642333984375, -0.91510009765625, -0.8762359619140625, -0.837371826171875, -0.7985076904296875, -0.7596435546875, -0.7207794189453125, -0.681915283203125, -0.6430511474609375, -0.60418701171875, -0.5653228759765625, -0.526458740234375, -0.4875946044921875, -0.44873046875, -0.4098663330078125, -0.371002197265625, -0.3321380615234375, -0.29327392578125, -0.2544097900390625, -0.215545654296875, -0.1766815185546875, -0.1378173828125, -0.0989532470703125, -0.060089111328125, -0.0212249755859375, 0.01763916015625, 0.0565032958984375, 0.095367431640625, 0.1342315673828125, 0.173095703125, 0.2119598388671875, 0.250823974609375, 0.2896881103515625, 0.32855224609375, 0.3674163818359375, 0.406280517578125, 0.4451446533203125, 0.4840087890625, 0.5228729248046875, 0.561737060546875, 0.6006011962890625, 0.63946533203125, 0.6783294677734375, 0.717193603515625, 0.7560577392578125, 0.794921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 13.0, 17.0, 25.0, 34.0, 39.0, 79.0, 125.0, 200.0, 414.0, 1024.0, 2709.0, 13348.0, 152380.0, 803582.0, 63178.0, 7733.0, 1910.0, 724.0, 364.0, 198.0, 131.0, 71.0, 43.0, 32.0, 19.0, 15.0, 18.0, 17.0, 13.0, 7.0, 15.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.66015625, -7.41571044921875, -7.1712646484375, -6.92681884765625, -6.682373046875, -6.43792724609375, -6.1934814453125, -5.94903564453125, -5.70458984375, -5.46014404296875, -5.2156982421875, -4.97125244140625, -4.726806640625, -4.48236083984375, -4.2379150390625, -3.99346923828125, -3.7490234375, -3.50457763671875, -3.2601318359375, -3.01568603515625, -2.771240234375, -2.52679443359375, -2.2823486328125, -2.03790283203125, -1.79345703125, -1.54901123046875, -1.3045654296875, -1.06011962890625, -0.815673828125, -0.57122802734375, -0.3267822265625, -0.08233642578125, 0.162109375, 0.40655517578125, 0.6510009765625, 0.89544677734375, 1.139892578125, 1.38433837890625, 1.6287841796875, 1.87322998046875, 2.11767578125, 2.36212158203125, 2.6065673828125, 2.85101318359375, 3.095458984375, 3.33990478515625, 3.5843505859375, 3.82879638671875, 4.0732421875, 4.31768798828125, 4.5621337890625, 4.80657958984375, 5.051025390625, 5.29547119140625, 5.5399169921875, 5.78436279296875, 6.02880859375, 6.27325439453125, 6.5177001953125, 6.76214599609375, 7.006591796875, 7.25103759765625, 7.4954833984375, 7.73992919921875, 7.984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 8.0, 7.0, 14.0, 15.0, 22.0, 19.0, 25.0, 26.0, 24.0, 26.0, 28.0, 26.0, 38.0, 38.0, 39.0, 48.0, 41.0, 51.0, 48.0, 40.0, 38.0, 30.0, 38.0, 32.0, 38.0, 25.0, 25.0, 30.0, 16.0, 14.0, 28.0, 15.0, 15.0, 12.0, 11.0, 5.0, 9.0, 7.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.470703125, -2.390838623046875, -2.31097412109375, -2.231109619140625, -2.1512451171875, -2.071380615234375, -1.99151611328125, -1.911651611328125, -1.831787109375, -1.751922607421875, -1.67205810546875, -1.592193603515625, -1.5123291015625, -1.432464599609375, -1.35260009765625, -1.272735595703125, -1.19287109375, -1.113006591796875, -1.03314208984375, -0.953277587890625, -0.8734130859375, -0.793548583984375, -0.71368408203125, -0.633819580078125, -0.553955078125, -0.474090576171875, -0.39422607421875, -0.314361572265625, -0.2344970703125, -0.154632568359375, -0.07476806640625, 0.005096435546875, 0.0849609375, 0.164825439453125, 0.24468994140625, 0.324554443359375, 0.4044189453125, 0.484283447265625, 0.56414794921875, 0.644012451171875, 0.723876953125, 0.803741455078125, 0.88360595703125, 0.963470458984375, 1.0433349609375, 1.123199462890625, 1.20306396484375, 1.282928466796875, 1.36279296875, 1.442657470703125, 1.52252197265625, 1.602386474609375, 1.6822509765625, 1.762115478515625, 1.84197998046875, 1.921844482421875, 2.001708984375, 2.081573486328125, 2.16143798828125, 2.241302490234375, 2.3211669921875, 2.401031494140625, 2.48089599609375, 2.560760498046875, 2.640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 16.0, 15.0, 28.0, 38.0, 73.0, 140.0, 301.0, 652.0, 1776.0, 10689.0, 426258.0, 592424.0, 12791.0, 2014.0, 672.0, 290.0, 141.0, 82.0, 49.0, 32.0, 22.0, 6.0, 8.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.96124267578125, -3.8248291015625, -3.68841552734375, -3.552001953125, -3.41558837890625, -3.2791748046875, -3.14276123046875, -3.00634765625, -2.86993408203125, -2.7335205078125, -2.59710693359375, -2.460693359375, -2.32427978515625, -2.1878662109375, -2.05145263671875, -1.9150390625, -1.77862548828125, -1.6422119140625, -1.50579833984375, -1.369384765625, -1.23297119140625, -1.0965576171875, -0.96014404296875, -0.82373046875, -0.68731689453125, -0.5509033203125, -0.41448974609375, -0.278076171875, -0.14166259765625, -0.0052490234375, 0.13116455078125, 0.267578125, 0.40399169921875, 0.5404052734375, 0.67681884765625, 0.813232421875, 0.94964599609375, 1.0860595703125, 1.22247314453125, 1.35888671875, 1.49530029296875, 1.6317138671875, 1.76812744140625, 1.904541015625, 2.04095458984375, 2.1773681640625, 2.31378173828125, 2.4501953125, 2.58660888671875, 2.7230224609375, 2.85943603515625, 2.995849609375, 3.13226318359375, 3.2686767578125, 3.40509033203125, 3.54150390625, 3.67791748046875, 3.8143310546875, 3.95074462890625, 4.087158203125, 4.22357177734375, 4.3599853515625, 4.49639892578125, 4.6328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 9.0, 12.0, 7.0, 19.0, 27.0, 26.0, 39.0, 48.0, 47.0, 104.0, 134.0, 121.0, 95.0, 83.0, 55.0, 43.0, 35.0, 18.0, 21.0, 15.0, 8.0, 12.0, 4.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013848207890987396, -0.00013248249888420105, -0.00012648291885852814, -0.00012048333883285522, -0.00011448375880718231, -0.0001084841787815094, -0.00010248459875583649, -9.648501873016357e-05, -9.048543870449066e-05, -8.448585867881775e-05, -7.848627865314484e-05, -7.248669862747192e-05, -6.648711860179901e-05, -6.04875385761261e-05, -5.4487958550453186e-05, -4.8488378524780273e-05, -4.248879849910736e-05, -3.648921847343445e-05, -3.0489638447761536e-05, -2.4490058422088623e-05, -1.849047839641571e-05, -1.2490898370742798e-05, -6.491318345069885e-06, -4.917383193969727e-07, 5.50784170627594e-06, 1.1507421731948853e-05, 1.7507001757621765e-05, 2.3506581783294678e-05, 2.950616180896759e-05, 3.55057418346405e-05, 4.1505321860313416e-05, 4.750490188598633e-05, 5.350448191165924e-05, 5.950406193733215e-05, 6.550364196300507e-05, 7.150322198867798e-05, 7.750280201435089e-05, 8.35023820400238e-05, 8.950196206569672e-05, 9.550154209136963e-05, 0.00010150112211704254, 0.00010750070214271545, 0.00011350028216838837, 0.00011949986219406128, 0.0001254994422197342, 0.0001314990222454071, 0.00013749860227108002, 0.00014349818229675293, 0.00014949776232242584, 0.00015549734234809875, 0.00016149692237377167, 0.00016749650239944458, 0.0001734960824251175, 0.0001794956624507904, 0.00018549524247646332, 0.00019149482250213623, 0.00019749440252780914, 0.00020349398255348206, 0.00020949356257915497, 0.00021549314260482788, 0.0002214927226305008, 0.0002274923026561737, 0.00023349188268184662, 0.00023949146270751953]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 11.0, 30.0, 35.0, 62.0, 82.0, 142.0, 352.0, 867.0, 3336.0, 26340.0, 852579.0, 153768.0, 8032.0, 1737.0, 566.0, 257.0, 119.0, 65.0, 43.0, 38.0, 22.0, 11.0, 10.0, 4.0, 8.0, 8.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 11.0, 21.0, 20.0, 37.0, 39.0, 59.0, 55.0, 84.0, 89.0, 107.0, 106.0, 76.0, 74.0, 50.0, 36.0, 39.0, 14.0, 9.0, 20.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4523773193359375, -1.399871826171875, -1.3473663330078125, -1.29486083984375, -1.2423553466796875, -1.189849853515625, -1.1373443603515625, -1.0848388671875, -1.0323333740234375, -0.979827880859375, -0.9273223876953125, -0.87481689453125, -0.8223114013671875, -0.769805908203125, -0.7173004150390625, -0.664794921875, -0.6122894287109375, -0.559783935546875, -0.5072784423828125, -0.45477294921875, -0.4022674560546875, -0.349761962890625, -0.2972564697265625, -0.2447509765625, -0.1922454833984375, -0.139739990234375, -0.0872344970703125, -0.03472900390625, 0.0177764892578125, 0.070281982421875, 0.1227874755859375, 0.17529296875, 0.2277984619140625, 0.280303955078125, 0.3328094482421875, 0.38531494140625, 0.4378204345703125, 0.490325927734375, 0.5428314208984375, 0.5953369140625, 0.6478424072265625, 0.700347900390625, 0.7528533935546875, 0.80535888671875, 0.8578643798828125, 0.910369873046875, 0.9628753662109375, 1.015380859375, 1.0678863525390625, 1.120391845703125, 1.1728973388671875, 1.22540283203125, 1.2779083251953125, 1.330413818359375, 1.3829193115234375, 1.4354248046875, 1.4879302978515625, 1.540435791015625, 1.5929412841796875, 1.64544677734375, 1.6979522705078125, 1.750457763671875, 1.8029632568359375, 1.85546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 9.0, 17.0, 119.0, 577.0, 236.0, 33.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.367431640625, -17.71942901611328, -15.07142448425293, -12.423420906066895, -9.77541732788086, -7.127413749694824, -4.479410171508789, -1.8314056396484375, 0.8165969848632812, 3.4646005630493164, 6.112604141235352, 8.760607719421387, 11.408611297607422, 14.056614875793457, 16.704618453979492, 19.352622985839844, 22.000625610351562, 24.64862823486328, 27.296632766723633, 29.944637298583984, 32.5926399230957, 35.24064254760742, 37.888648986816406, 40.536651611328125, 43.184654235839844, 45.83265686035156, 48.48065948486328, 51.128665924072266, 53.776668548583984, 56.4246711730957, 59.07267761230469, 61.720680236816406, 64.36868286132812, 67.01668548583984, 69.66468811035156, 72.31269073486328, 74.960693359375, 77.60870361328125, 80.25670623779297, 82.90470886230469, 85.5527114868164, 88.20071411132812, 90.84871673583984, 93.49671936035156, 96.14472961425781, 98.79273223876953, 101.44073486328125, 104.08873748779297, 106.73674011230469, 109.3847427368164, 112.03274536132812, 114.68074798583984, 117.32875061035156, 119.97676086425781, 122.62476348876953, 125.27276611328125, 127.92076873779297, 130.5687713623047, 133.21678161621094, 135.86477661132812, 138.51278686523438, 141.16078186035156, 143.8087921142578, 146.456787109375, 149.10479736328125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 5.0, 16.0, 16.0, 16.0, 30.0, 48.0, 52.0, 51.0, 68.0, 73.0, 76.0, 66.0, 61.0, 56.0, 67.0, 48.0, 46.0, 37.0, 38.0, 27.0, 17.0, 18.0, 10.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.94731521606445, -34.030887603759766, -33.11445617675781, -32.198028564453125, -31.281600952148438, -30.365171432495117, -29.44874382019043, -28.53231430053711, -27.615886688232422, -26.6994571685791, -25.783029556274414, -24.866600036621094, -23.950172424316406, -23.033742904663086, -22.1173152923584, -21.200885772705078, -20.28445816040039, -19.36802864074707, -18.451601028442383, -17.535171508789062, -16.618743896484375, -15.702314376831055, -14.785886764526367, -13.869457244873047, -12.953027725219727, -12.036599159240723, -11.120170593261719, -10.203742027282715, -9.287313461303711, -8.37088394165039, -7.454455852508545, -6.538027286529541, -5.621599197387695, -4.705170631408691, -3.7887420654296875, -2.8723132610321045, -1.9558846950531006, -1.0394558906555176, -0.12302732467651367, 0.7934012413024902, 1.7098298072814941, 2.626258373260498, 3.542686939239502, 4.459115982055664, 5.375544548034668, 6.291973114013672, 7.208401679992676, 8.12483024597168, 9.041258811950684, 9.957687377929688, 10.874115943908691, 11.790544509887695, 12.7069730758667, 13.623401641845703, 14.539831161499023, 15.456258773803711, 16.37268829345703, 17.28911781311035, 18.20554542541504, 19.12197494506836, 20.038402557373047, 20.954832077026367, 21.871259689331055, 22.787689208984375, 23.704116821289062]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 11.0, 18.0, 41.0, 96.0, 203.0, 594.0, 3567.0, 4179329.0, 9745.0, 438.0, 140.0, 48.0, 29.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-79.6875, -77.90283203125, -76.1181640625, -74.33349609375, -72.548828125, -70.76416015625, -68.9794921875, -67.19482421875, -65.41015625, -63.62548828125, -61.8408203125, -60.05615234375, -58.271484375, -56.48681640625, -54.7021484375, -52.91748046875, -51.1328125, -49.34814453125, -47.5634765625, -45.77880859375, -43.994140625, -42.20947265625, -40.4248046875, -38.64013671875, -36.85546875, -35.07080078125, -33.2861328125, -31.50146484375, -29.716796875, -27.93212890625, -26.1474609375, -24.36279296875, -22.578125, -20.79345703125, -19.0087890625, -17.22412109375, -15.439453125, -13.65478515625, -11.8701171875, -10.08544921875, -8.30078125, -6.51611328125, -4.7314453125, -2.94677734375, -1.162109375, 0.62255859375, 2.4072265625, 4.19189453125, 5.9765625, 7.76123046875, 9.5458984375, 11.33056640625, 13.115234375, 14.89990234375, 16.6845703125, 18.46923828125, 20.25390625, 22.03857421875, 23.8232421875, 25.60791015625, 27.392578125, 29.17724609375, 30.9619140625, 32.74658203125, 34.53125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 37.0, 78.0, 158.0, 197.0, 207.0, 140.0, 79.0, 29.0, 26.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.294921875, -2.24371337890625, -2.1925048828125, -2.14129638671875, -2.090087890625, -2.03887939453125, -1.9876708984375, -1.93646240234375, -1.88525390625, -1.83404541015625, -1.7828369140625, -1.73162841796875, -1.680419921875, -1.62921142578125, -1.5780029296875, -1.52679443359375, -1.4755859375, -1.42437744140625, -1.3731689453125, -1.32196044921875, -1.270751953125, -1.21954345703125, -1.1683349609375, -1.11712646484375, -1.06591796875, -1.01470947265625, -0.9635009765625, -0.91229248046875, -0.861083984375, -0.80987548828125, -0.7586669921875, -0.70745849609375, -0.65625, -0.60504150390625, -0.5538330078125, -0.50262451171875, -0.451416015625, -0.40020751953125, -0.3489990234375, -0.29779052734375, -0.24658203125, -0.19537353515625, -0.1441650390625, -0.09295654296875, -0.041748046875, 0.00946044921875, 0.0606689453125, 0.11187744140625, 0.1630859375, 0.21429443359375, 0.2655029296875, 0.31671142578125, 0.367919921875, 0.41912841796875, 0.4703369140625, 0.52154541015625, 0.57275390625, 0.62396240234375, 0.6751708984375, 0.72637939453125, 0.777587890625, 0.82879638671875, 0.8800048828125, 0.93121337890625, 0.982421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 16.0, 12.0, 9.0, 24.0, 43.0, 50.0, 108.0, 212.0, 447.0, 1626.0, 10193.0, 1577217.0, 2592209.0, 9945.0, 1516.0, 345.0, 133.0, 65.0, 41.0, 29.0, 17.0, 7.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.8814697265625, -19.419189453125, -18.9569091796875, -18.49462890625, -18.0323486328125, -17.570068359375, -17.1077880859375, -16.6455078125, -16.1832275390625, -15.720947265625, -15.2586669921875, -14.79638671875, -14.3341064453125, -13.871826171875, -13.4095458984375, -12.947265625, -12.4849853515625, -12.022705078125, -11.5604248046875, -11.09814453125, -10.6358642578125, -10.173583984375, -9.7113037109375, -9.2490234375, -8.7867431640625, -8.324462890625, -7.8621826171875, -7.39990234375, -6.9376220703125, -6.475341796875, -6.0130615234375, -5.55078125, -5.0885009765625, -4.626220703125, -4.1639404296875, -3.70166015625, -3.2393798828125, -2.777099609375, -2.3148193359375, -1.8525390625, -1.3902587890625, -0.927978515625, -0.4656982421875, -0.00341796875, 0.4588623046875, 0.921142578125, 1.3834228515625, 1.845703125, 2.3079833984375, 2.770263671875, 3.2325439453125, 3.69482421875, 4.1571044921875, 4.619384765625, 5.0816650390625, 5.5439453125, 6.0062255859375, 6.468505859375, 6.9307861328125, 7.39306640625, 7.8553466796875, 8.317626953125, 8.7799072265625, 9.2421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 10.0, 25.0, 36.0, 46.0, 95.0, 247.0, 2262.0, 976.0, 172.0, 89.0, 41.0, 21.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.75390625, -3.6738433837890625, -3.593780517578125, -3.5137176513671875, -3.43365478515625, -3.3535919189453125, -3.273529052734375, -3.1934661865234375, -3.1134033203125, -3.0333404541015625, -2.953277587890625, -2.8732147216796875, -2.79315185546875, -2.7130889892578125, -2.633026123046875, -2.5529632568359375, -2.472900390625, -2.3928375244140625, -2.312774658203125, -2.2327117919921875, -2.15264892578125, -2.0725860595703125, -1.992523193359375, -1.9124603271484375, -1.8323974609375, -1.7523345947265625, -1.672271728515625, -1.5922088623046875, -1.51214599609375, -1.4320831298828125, -1.352020263671875, -1.2719573974609375, -1.19189453125, -1.1118316650390625, -1.031768798828125, -0.9517059326171875, -0.87164306640625, -0.7915802001953125, -0.711517333984375, -0.6314544677734375, -0.5513916015625, -0.4713287353515625, -0.391265869140625, -0.3112030029296875, -0.23114013671875, -0.1510772705078125, -0.071014404296875, 0.0090484619140625, 0.089111328125, 0.1691741943359375, 0.249237060546875, 0.3292999267578125, 0.40936279296875, 0.4894256591796875, 0.569488525390625, 0.6495513916015625, 0.7296142578125, 0.8096771240234375, 0.889739990234375, 0.9698028564453125, 1.04986572265625, 1.1299285888671875, 1.209991455078125, 1.2900543212890625, 1.3701171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 8.0, 14.0, 42.0, 92.0, 300.0, 343.0, 132.0, 40.0, 19.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.79538917541504, -20.381046295166016, -19.96670150756836, -19.552358627319336, -19.138015747070312, -18.723670959472656, -18.309328079223633, -17.89498519897461, -17.480640411376953, -17.06629753112793, -16.651952743530273, -16.23760986328125, -15.82326602935791, -15.408923149108887, -14.994579315185547, -14.580236434936523, -14.1658935546875, -13.75154972076416, -13.337206840515137, -12.922863006591797, -12.508519172668457, -12.094176292419434, -11.679832458496094, -11.26548957824707, -10.851144790649414, -10.436800956726074, -10.02245807647705, -9.608114242553711, -9.193770408630371, -8.779427528381348, -8.365083694458008, -7.950740337371826, -7.536397457122803, -7.122054100036621, -6.707710266113281, -6.2933669090271, -5.879023551940918, -5.464679718017578, -5.0503363609313965, -4.635993003845215, -4.221649169921875, -3.8073055744171143, -3.3929622173309326, -2.978618621826172, -2.5642752647399902, -2.1499316692352295, -1.7355880737304688, -1.321244716644287, -0.9069013595581055, -0.4925578534603119, -0.07821434736251831, 0.33612918853759766, 0.7504726648330688, 1.16481614112854, 1.5791597366333008, 1.9935030937194824, 2.407846689224243, 2.822190284729004, 3.2365336418151855, 3.6508772373199463, 4.065220832824707, 4.479564189910889, 4.89390754699707, 5.30825138092041, 5.722594738006592]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 8.0, 8.0, 16.0, 17.0, 20.0, 27.0, 21.0, 33.0, 39.0, 40.0, 41.0, 37.0, 36.0, 51.0, 41.0, 45.0, 48.0, 65.0, 48.0, 39.0, 34.0, 34.0, 33.0, 34.0, 23.0, 26.0, 28.0, 9.0, 13.0, 17.0, 11.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.436602592468262, -5.275496482849121, -5.1143903732299805, -4.95328426361084, -4.792178153991699, -4.631072521209717, -4.469966411590576, -4.3088603019714355, -4.147754192352295, -3.9866480827331543, -3.8255419731140137, -3.664436101913452, -3.5033299922943115, -3.342223882675171, -3.1811180114746094, -3.0200119018554688, -2.858905792236328, -2.6977996826171875, -2.536693572998047, -2.3755877017974854, -2.2144815921783447, -2.053375482559204, -1.892269492149353, -1.731163501739502, -1.5700573921203613, -1.4089512825012207, -1.2478452920913696, -1.0867393016815186, -0.9256331920623779, -0.7645271420478821, -0.6034210920333862, -0.44231510162353516, -0.28120899200439453, -0.12010294198989868, 0.04100310802459717, 0.20210915803909302, 0.36321520805358887, 0.5243212580680847, 0.6854273080825806, 0.8465332984924316, 1.0076394081115723, 1.168745517730713, 1.329851508140564, 1.490957498550415, 1.6520636081695557, 1.8131697177886963, 1.9742757081985474, 2.1353816986083984, 2.296487808227539, 2.4575939178466797, 2.6187000274658203, 2.779805898666382, 2.9409120082855225, 3.102018117904663, 3.2631239891052246, 3.4242300987243652, 3.585336208343506, 3.7464423179626465, 3.907548427581787, 4.068654537200928, 4.22976016998291, 4.390866279602051, 4.551972389221191, 4.713078498840332, 4.874184608459473]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 9.0, 11.0, 16.0, 22.0, 18.0, 36.0, 61.0, 96.0, 179.0, 337.0, 666.0, 1645.0, 5504.0, 98169.0, 918031.0, 18741.0, 3037.0, 1000.0, 431.0, 205.0, 104.0, 83.0, 46.0, 18.0, 28.0, 17.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.953125, -12.56396484375, -12.1748046875, -11.78564453125, -11.396484375, -11.00732421875, -10.6181640625, -10.22900390625, -9.83984375, -9.45068359375, -9.0615234375, -8.67236328125, -8.283203125, -7.89404296875, -7.5048828125, -7.11572265625, -6.7265625, -6.33740234375, -5.9482421875, -5.55908203125, -5.169921875, -4.78076171875, -4.3916015625, -4.00244140625, -3.61328125, -3.22412109375, -2.8349609375, -2.44580078125, -2.056640625, -1.66748046875, -1.2783203125, -0.88916015625, -0.5, -0.11083984375, 0.2783203125, 0.66748046875, 1.056640625, 1.44580078125, 1.8349609375, 2.22412109375, 2.61328125, 3.00244140625, 3.3916015625, 3.78076171875, 4.169921875, 4.55908203125, 4.9482421875, 5.33740234375, 5.7265625, 6.11572265625, 6.5048828125, 6.89404296875, 7.283203125, 7.67236328125, 8.0615234375, 8.45068359375, 8.83984375, 9.22900390625, 9.6181640625, 10.00732421875, 10.396484375, 10.78564453125, 11.1748046875, 11.56396484375, 11.953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 11.0, 21.0, 55.0, 114.0, 164.0, 191.0, 191.0, 116.0, 69.0, 40.0, 11.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.1287765502929688, -2.0798187255859375, -2.0308609008789062, -1.981903076171875, -1.9329452514648438, -1.8839874267578125, -1.8350296020507812, -1.78607177734375, -1.7371139526367188, -1.6881561279296875, -1.6391983032226562, -1.590240478515625, -1.5412826538085938, -1.4923248291015625, -1.4433670043945312, -1.3944091796875, -1.3454513549804688, -1.2964935302734375, -1.2475357055664062, -1.198577880859375, -1.1496200561523438, -1.1006622314453125, -1.0517044067382812, -1.00274658203125, -0.9537887573242188, -0.9048309326171875, -0.8558731079101562, -0.806915283203125, -0.7579574584960938, -0.7089996337890625, -0.6600418090820312, -0.611083984375, -0.5621261596679688, -0.5131683349609375, -0.46421051025390625, -0.415252685546875, -0.36629486083984375, -0.3173370361328125, -0.26837921142578125, -0.21942138671875, -0.17046356201171875, -0.1215057373046875, -0.07254791259765625, -0.023590087890625, 0.02536773681640625, 0.0743255615234375, 0.12328338623046875, 0.1722412109375, 0.22119903564453125, 0.2701568603515625, 0.31911468505859375, 0.368072509765625, 0.41703033447265625, 0.4659881591796875, 0.5149459838867188, 0.56390380859375, 0.6128616333007812, 0.6618194580078125, 0.7107772827148438, 0.759735107421875, 0.8086929321289062, 0.8576507568359375, 0.9066085815429688, 0.95556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 7.0, 3.0, 4.0, 9.0, 4.0, 10.0, 4.0, 9.0, 21.0, 23.0, 23.0, 26.0, 43.0, 58.0, 80.0, 129.0, 221.0, 374.0, 767.0, 2012.0, 7279.0, 41879.0, 538411.0, 414507.0, 33242.0, 6052.0, 1700.0, 736.0, 319.0, 208.0, 107.0, 79.0, 50.0, 24.0, 28.0, 19.0, 17.0, 10.0, 9.0, 10.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.33203125, -7.1025390625, -6.873046875, -6.6435546875, -6.4140625, -6.1845703125, -5.955078125, -5.7255859375, -5.49609375, -5.2666015625, -5.037109375, -4.8076171875, -4.578125, -4.3486328125, -4.119140625, -3.8896484375, -3.66015625, -3.4306640625, -3.201171875, -2.9716796875, -2.7421875, -2.5126953125, -2.283203125, -2.0537109375, -1.82421875, -1.5947265625, -1.365234375, -1.1357421875, -0.90625, -0.6767578125, -0.447265625, -0.2177734375, 0.01171875, 0.2412109375, 0.470703125, 0.7001953125, 0.9296875, 1.1591796875, 1.388671875, 1.6181640625, 1.84765625, 2.0771484375, 2.306640625, 2.5361328125, 2.765625, 2.9951171875, 3.224609375, 3.4541015625, 3.68359375, 3.9130859375, 4.142578125, 4.3720703125, 4.6015625, 4.8310546875, 5.060546875, 5.2900390625, 5.51953125, 5.7490234375, 5.978515625, 6.2080078125, 6.4375, 6.6669921875, 6.896484375, 7.1259765625, 7.35546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 3.0, 7.0, 7.0, 15.0, 8.0, 12.0, 16.0, 17.0, 28.0, 28.0, 29.0, 41.0, 33.0, 30.0, 49.0, 46.0, 52.0, 37.0, 53.0, 48.0, 44.0, 52.0, 46.0, 35.0, 45.0, 26.0, 40.0, 22.0, 23.0, 17.0, 22.0, 16.0, 9.0, 10.0, 6.0, 5.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.421478271484375, -3.30389404296875, -3.186309814453125, -3.0687255859375, -2.951141357421875, -2.83355712890625, -2.715972900390625, -2.598388671875, -2.480804443359375, -2.36322021484375, -2.245635986328125, -2.1280517578125, -2.010467529296875, -1.89288330078125, -1.775299072265625, -1.65771484375, -1.540130615234375, -1.42254638671875, -1.304962158203125, -1.1873779296875, -1.069793701171875, -0.95220947265625, -0.834625244140625, -0.717041015625, -0.599456787109375, -0.48187255859375, -0.364288330078125, -0.2467041015625, -0.129119873046875, -0.01153564453125, 0.106048583984375, 0.2236328125, 0.341217041015625, 0.45880126953125, 0.576385498046875, 0.6939697265625, 0.811553955078125, 0.92913818359375, 1.046722412109375, 1.164306640625, 1.281890869140625, 1.39947509765625, 1.517059326171875, 1.6346435546875, 1.752227783203125, 1.86981201171875, 1.987396240234375, 2.10498046875, 2.222564697265625, 2.34014892578125, 2.457733154296875, 2.5753173828125, 2.692901611328125, 2.81048583984375, 2.928070068359375, 3.045654296875, 3.163238525390625, 3.28082275390625, 3.398406982421875, 3.5159912109375, 3.633575439453125, 3.75115966796875, 3.868743896484375, 3.986328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 6.0, 8.0, 8.0, 26.0, 35.0, 69.0, 150.0, 354.0, 1057.0, 5428.0, 176480.0, 845112.0, 16939.0, 1881.0, 539.0, 202.0, 123.0, 59.0, 33.0, 14.0, 14.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.36083984375, -4.2333984375, -4.10595703125, -3.978515625, -3.85107421875, -3.7236328125, -3.59619140625, -3.46875, -3.34130859375, -3.2138671875, -3.08642578125, -2.958984375, -2.83154296875, -2.7041015625, -2.57666015625, -2.44921875, -2.32177734375, -2.1943359375, -2.06689453125, -1.939453125, -1.81201171875, -1.6845703125, -1.55712890625, -1.4296875, -1.30224609375, -1.1748046875, -1.04736328125, -0.919921875, -0.79248046875, -0.6650390625, -0.53759765625, -0.41015625, -0.28271484375, -0.1552734375, -0.02783203125, 0.099609375, 0.22705078125, 0.3544921875, 0.48193359375, 0.609375, 0.73681640625, 0.8642578125, 0.99169921875, 1.119140625, 1.24658203125, 1.3740234375, 1.50146484375, 1.62890625, 1.75634765625, 1.8837890625, 2.01123046875, 2.138671875, 2.26611328125, 2.3935546875, 2.52099609375, 2.6484375, 2.77587890625, 2.9033203125, 3.03076171875, 3.158203125, 3.28564453125, 3.4130859375, 3.54052734375, 3.66796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 11.0, 16.0, 18.0, 20.0, 32.0, 40.0, 56.0, 55.0, 89.0, 107.0, 110.0, 100.0, 85.0, 53.0, 49.0, 25.0, 23.0, 20.0, 16.0, 9.0, 11.0, 7.0, 8.0, 2.0, 4.0, 3.0, 9.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001691579818725586, -0.00016393326222896576, -0.00015870854258537292, -0.0001534838229417801, -0.00014825910329818726, -0.00014303438365459442, -0.0001378096640110016, -0.00013258494436740875, -0.00012736022472381592, -0.00012213550508022308, -0.00011691078543663025, -0.00011168606579303741, -0.00010646134614944458, -0.00010123662650585175, -9.601190686225891e-05, -9.078718721866608e-05, -8.556246757507324e-05, -8.033774793148041e-05, -7.511302828788757e-05, -6.988830864429474e-05, -6.46635890007019e-05, -5.943886935710907e-05, -5.4214149713516235e-05, -4.89894300699234e-05, -4.3764710426330566e-05, -3.853999078273773e-05, -3.33152711391449e-05, -2.8090551495552063e-05, -2.286583185195923e-05, -1.7641112208366394e-05, -1.241639256477356e-05, -7.191672921180725e-06, -1.9669532775878906e-06, 3.257766366004944e-06, 8.482486009597778e-06, 1.3707205653190613e-05, 1.8931925296783447e-05, 2.4156644940376282e-05, 2.9381364583969116e-05, 3.460608422756195e-05, 3.9830803871154785e-05, 4.505552351474762e-05, 5.0280243158340454e-05, 5.550496280193329e-05, 6.072968244552612e-05, 6.595440208911896e-05, 7.117912173271179e-05, 7.640384137630463e-05, 8.162856101989746e-05, 8.68532806634903e-05, 9.207800030708313e-05, 9.730271995067596e-05, 0.0001025274395942688, 0.00010775215923786163, 0.00011297687888145447, 0.0001182015985250473, 0.00012342631816864014, 0.00012865103781223297, 0.0001338757574558258, 0.00013910047709941864, 0.00014432519674301147, 0.0001495499163866043, 0.00015477463603019714, 0.00015999935567378998, 0.0001652240753173828]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 10.0, 10.0, 15.0, 26.0, 50.0, 100.0, 276.0, 836.0, 4815.0, 296575.0, 736439.0, 7674.0, 1136.0, 315.0, 135.0, 55.0, 34.0, 23.0, 7.0, 9.0, 13.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.6763916015625, -3.493408203125, -3.3104248046875, -3.12744140625, -2.9444580078125, -2.761474609375, -2.5784912109375, -2.3955078125, -2.2125244140625, -2.029541015625, -1.8465576171875, -1.66357421875, -1.4805908203125, -1.297607421875, -1.1146240234375, -0.931640625, -0.7486572265625, -0.565673828125, -0.3826904296875, -0.19970703125, -0.0167236328125, 0.166259765625, 0.3492431640625, 0.5322265625, 0.7152099609375, 0.898193359375, 1.0811767578125, 1.26416015625, 1.4471435546875, 1.630126953125, 1.8131103515625, 1.99609375, 2.1790771484375, 2.362060546875, 2.5450439453125, 2.72802734375, 2.9110107421875, 3.093994140625, 3.2769775390625, 3.4599609375, 3.6429443359375, 3.825927734375, 4.0089111328125, 4.19189453125, 4.3748779296875, 4.557861328125, 4.7408447265625, 4.923828125, 5.1068115234375, 5.289794921875, 5.4727783203125, 5.65576171875, 5.8387451171875, 6.021728515625, 6.2047119140625, 6.3876953125, 6.5706787109375, 6.753662109375, 6.9366455078125, 7.11962890625, 7.3026123046875, 7.485595703125, 7.6685791015625, 7.8515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 4.0, 8.0, 12.0, 21.0, 28.0, 54.0, 61.0, 91.0, 151.0, 147.0, 127.0, 105.0, 72.0, 45.0, 28.0, 21.0, 15.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.50323486328125, -1.4263916015625, -1.34954833984375, -1.272705078125, -1.19586181640625, -1.1190185546875, -1.04217529296875, -0.96533203125, -0.88848876953125, -0.8116455078125, -0.73480224609375, -0.657958984375, -0.58111572265625, -0.5042724609375, -0.42742919921875, -0.3505859375, -0.27374267578125, -0.1968994140625, -0.12005615234375, -0.043212890625, 0.03363037109375, 0.1104736328125, 0.18731689453125, 0.26416015625, 0.34100341796875, 0.4178466796875, 0.49468994140625, 0.571533203125, 0.64837646484375, 0.7252197265625, 0.80206298828125, 0.87890625, 0.95574951171875, 1.0325927734375, 1.10943603515625, 1.186279296875, 1.26312255859375, 1.3399658203125, 1.41680908203125, 1.49365234375, 1.57049560546875, 1.6473388671875, 1.72418212890625, 1.801025390625, 1.87786865234375, 1.9547119140625, 2.03155517578125, 2.1083984375, 2.18524169921875, 2.2620849609375, 2.33892822265625, 2.415771484375, 2.49261474609375, 2.5694580078125, 2.64630126953125, 2.72314453125, 2.79998779296875, 2.8768310546875, 2.95367431640625, 3.030517578125, 3.10736083984375, 3.1842041015625, 3.26104736328125, 3.337890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 9.0, 52.0, 472.0, 431.0, 37.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.870460510253906, -30.08580780029297, -26.30115509033203, -22.516504287719727, -18.73185157775879, -14.947198867797852, -11.162548065185547, -7.377895355224609, -3.593242645263672, 0.19140958786010742, 3.9760618209838867, 7.760713577270508, 11.545366287231445, 15.330018997192383, 19.114669799804688, 22.899322509765625, 26.683975219726562, 30.4686279296875, 34.25328063964844, 38.037933349609375, 41.82258605957031, 45.60723876953125, 49.39188766479492, 53.17654037475586, 56.9611930847168, 60.745845794677734, 64.5304946899414, 68.31514739990234, 72.09980010986328, 75.88445281982422, 79.66910552978516, 83.4537582397461, 87.2384033203125, 91.02305603027344, 94.80770874023438, 98.59236145019531, 102.37701416015625, 106.16166687011719, 109.94631958007812, 113.73097229003906, 117.515625, 121.30027770996094, 125.08493041992188, 128.8695831298828, 132.65423583984375, 136.4388885498047, 140.22354125976562, 144.00819396972656, 147.7928466796875, 151.57749938964844, 155.36215209960938, 159.1468048095703, 162.93145751953125, 166.7161102294922, 170.50076293945312, 174.28541564941406, 178.07005310058594, 181.85470581054688, 185.6393585205078, 189.42401123046875, 193.2086639404297, 196.99331665039062, 200.77796936035156, 204.5626220703125, 208.34727478027344]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 22.0, 23.0, 20.0, 30.0, 32.0, 41.0, 39.0, 27.0, 46.0, 61.0, 57.0, 65.0, 41.0, 41.0, 41.0, 46.0, 38.0, 39.0, 23.0, 39.0, 36.0, 25.0, 19.0, 23.0, 23.0, 12.0, 11.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.824403762817383, -21.04537582397461, -20.266345977783203, -19.48731803894043, -18.708288192749023, -17.92926025390625, -17.150230407714844, -16.37120246887207, -15.592172622680664, -14.813143730163574, -14.034114837646484, -13.255085945129395, -12.476057052612305, -11.697028160095215, -10.917999267578125, -10.138971328735352, -9.359942436218262, -8.580913543701172, -7.801884651184082, -7.022855758666992, -6.243826866149902, -5.4647979736328125, -4.685769557952881, -3.906740665435791, -3.127711772918701, -2.3486828804016113, -1.569654107093811, -0.7906253337860107, -0.011596441268920898, 0.767432451248169, 1.5464611053466797, 2.3254899978637695, 3.1045188903808594, 3.883547782897949, 4.662576675415039, 5.441605567932129, 6.220634460449219, 6.999663352966309, 7.77869176864624, 8.557720184326172, 9.336750030517578, 10.115778923034668, 10.894807815551758, 11.673836708068848, 12.452865600585938, 13.231894493103027, 14.010923385620117, 14.78995132446289, 15.56898021697998, 16.34800910949707, 17.127037048339844, 17.90606689453125, 18.685094833374023, 19.46412467956543, 20.243152618408203, 21.02218246459961, 21.801210403442383, 22.580238342285156, 23.359268188476562, 24.138296127319336, 24.917325973510742, 25.696353912353516, 26.475383758544922, 27.254411697387695, 28.0334415435791]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 5.0, 2.0, 4.0, 9.0, 7.0, 18.0, 20.0, 21.0, 28.0, 30.0, 34.0, 59.0, 99.0, 128.0, 248.0, 341.0, 745.0, 1533.0, 3721.0, 17996.0, 3418532.0, 731802.0, 14593.0, 2715.0, 893.0, 350.0, 166.0, 65.0, 31.0, 26.0, 14.0, 11.0, 7.0, 8.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0], "bins": [-15.0859375, -14.7503662109375, -14.414794921875, -14.0792236328125, -13.74365234375, -13.4080810546875, -13.072509765625, -12.7369384765625, -12.4013671875, -12.0657958984375, -11.730224609375, -11.3946533203125, -11.05908203125, -10.7235107421875, -10.387939453125, -10.0523681640625, -9.716796875, -9.3812255859375, -9.045654296875, -8.7100830078125, -8.37451171875, -8.0389404296875, -7.703369140625, -7.3677978515625, -7.0322265625, -6.6966552734375, -6.361083984375, -6.0255126953125, -5.68994140625, -5.3543701171875, -5.018798828125, -4.6832275390625, -4.34765625, -4.0120849609375, -3.676513671875, -3.3409423828125, -3.00537109375, -2.6697998046875, -2.334228515625, -1.9986572265625, -1.6630859375, -1.3275146484375, -0.991943359375, -0.6563720703125, -0.32080078125, 0.0147705078125, 0.350341796875, 0.6859130859375, 1.021484375, 1.3570556640625, 1.692626953125, 2.0281982421875, 2.36376953125, 2.6993408203125, 3.034912109375, 3.3704833984375, 3.7060546875, 4.0416259765625, 4.377197265625, 4.7127685546875, 5.04833984375, 5.3839111328125, 5.719482421875, 6.0550537109375, 6.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 16.0, 29.0, 40.0, 69.0, 115.0, 132.0, 148.0, 139.0, 124.0, 82.0, 38.0, 31.0, 14.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.251953125, -2.2012100219726562, -2.1504669189453125, -2.0997238159179688, -2.048980712890625, -1.9982376098632812, -1.9474945068359375, -1.8967514038085938, -1.84600830078125, -1.7952651977539062, -1.7445220947265625, -1.6937789916992188, -1.643035888671875, -1.5922927856445312, -1.5415496826171875, -1.4908065795898438, -1.4400634765625, -1.3893203735351562, -1.3385772705078125, -1.2878341674804688, -1.237091064453125, -1.1863479614257812, -1.1356048583984375, -1.0848617553710938, -1.03411865234375, -0.9833755493164062, -0.9326324462890625, -0.8818893432617188, -0.831146240234375, -0.7804031372070312, -0.7296600341796875, -0.6789169311523438, -0.628173828125, -0.5774307250976562, -0.5266876220703125, -0.47594451904296875, -0.425201416015625, -0.37445831298828125, -0.3237152099609375, -0.27297210693359375, -0.22222900390625, -0.17148590087890625, -0.1207427978515625, -0.06999969482421875, -0.019256591796875, 0.03148651123046875, 0.0822296142578125, 0.13297271728515625, 0.1837158203125, 0.23445892333984375, 0.2852020263671875, 0.33594512939453125, 0.386688232421875, 0.43743133544921875, 0.4881744384765625, 0.5389175415039062, 0.58966064453125, 0.6404037475585938, 0.6911468505859375, 0.7418899536132812, 0.792633056640625, 0.8433761596679688, 0.8941192626953125, 0.9448623657226562, 0.99560546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 11.0, 22.0, 28.0, 62.0, 97.0, 196.0, 432.0, 971.0, 2644.0, 11263.0, 135526.0, 3972864.0, 59594.0, 7257.0, 1894.0, 735.0, 325.0, 163.0, 80.0, 44.0, 23.0, 11.0, 9.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.182373046875, -7.90380859375, -7.625244140625, -7.3466796875, -7.068115234375, -6.78955078125, -6.510986328125, -6.232421875, -5.953857421875, -5.67529296875, -5.396728515625, -5.1181640625, -4.839599609375, -4.56103515625, -4.282470703125, -4.00390625, -3.725341796875, -3.44677734375, -3.168212890625, -2.8896484375, -2.611083984375, -2.33251953125, -2.053955078125, -1.775390625, -1.496826171875, -1.21826171875, -0.939697265625, -0.6611328125, -0.382568359375, -0.10400390625, 0.174560546875, 0.453125, 0.731689453125, 1.01025390625, 1.288818359375, 1.5673828125, 1.845947265625, 2.12451171875, 2.403076171875, 2.681640625, 2.960205078125, 3.23876953125, 3.517333984375, 3.7958984375, 4.074462890625, 4.35302734375, 4.631591796875, 4.91015625, 5.188720703125, 5.46728515625, 5.745849609375, 6.0244140625, 6.302978515625, 6.58154296875, 6.860107421875, 7.138671875, 7.417236328125, 7.69580078125, 7.974365234375, 8.2529296875, 8.531494140625, 8.81005859375, 9.088623046875, 9.3671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 3.0, 6.0, 13.0, 18.0, 19.0, 31.0, 40.0, 74.0, 158.0, 450.0, 2375.0, 492.0, 152.0, 73.0, 57.0, 37.0, 17.0, 13.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9271240234375, -1.864013671875, -1.8009033203125, -1.73779296875, -1.6746826171875, -1.611572265625, -1.5484619140625, -1.4853515625, -1.4222412109375, -1.359130859375, -1.2960205078125, -1.23291015625, -1.1697998046875, -1.106689453125, -1.0435791015625, -0.98046875, -0.9173583984375, -0.854248046875, -0.7911376953125, -0.72802734375, -0.6649169921875, -0.601806640625, -0.5386962890625, -0.4755859375, -0.4124755859375, -0.349365234375, -0.2862548828125, -0.22314453125, -0.1600341796875, -0.096923828125, -0.0338134765625, 0.029296875, 0.0924072265625, 0.155517578125, 0.2186279296875, 0.28173828125, 0.3448486328125, 0.407958984375, 0.4710693359375, 0.5341796875, 0.5972900390625, 0.660400390625, 0.7235107421875, 0.78662109375, 0.8497314453125, 0.912841796875, 0.9759521484375, 1.0390625, 1.1021728515625, 1.165283203125, 1.2283935546875, 1.29150390625, 1.3546142578125, 1.417724609375, 1.4808349609375, 1.5439453125, 1.6070556640625, 1.670166015625, 1.7332763671875, 1.79638671875, 1.8594970703125, 1.922607421875, 1.9857177734375, 2.048828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 13.0, 20.0, 29.0, 66.0, 159.0, 216.0, 228.0, 140.0, 62.0, 25.0, 13.0, 17.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.367212295532227, -6.088510990142822, -5.80980920791626, -5.5311079025268555, -5.252406597137451, -4.973705291748047, -4.695003509521484, -4.41630220413208, -4.137600898742676, -3.8588993549346924, -3.580198049545288, -3.3014965057373047, -3.0227952003479004, -2.744093656539917, -2.4653921127319336, -2.1866908073425293, -1.9079890251159668, -1.629287600517273, -1.350586175918579, -1.0718846321105957, -0.7931832075119019, -0.514481782913208, -0.2357802391052246, 0.04292118549346924, 0.3216226100921631, 0.6003240346908569, 0.8790255188941956, 1.1577270030975342, 1.436428427696228, 1.7151298522949219, 1.9938313961029053, 2.2725329399108887, 2.551234245300293, 2.8299357891082764, 3.1086370944976807, 3.387338638305664, 3.6660399436950684, 3.9447414875030518, 4.223443031311035, 4.5021443367004395, 4.780845642089844, 5.059546947479248, 5.3382487297058105, 5.616950035095215, 5.895651340484619, 6.174352645874023, 6.453054428100586, 6.73175573348999, 7.010457515716553, 7.289158821105957, 7.5678606033325195, 7.846561908721924, 8.125263214111328, 8.40396499633789, 8.682666778564453, 8.9613676071167, 9.240069389343262, 9.518771171569824, 9.79747200012207, 10.076173782348633, 10.354875564575195, 10.633576393127441, 10.912278175354004, 11.190979957580566, 11.469680786132812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 10.0, 6.0, 14.0, 9.0, 17.0, 13.0, 19.0, 21.0, 30.0, 27.0, 30.0, 42.0, 39.0, 31.0, 48.0, 35.0, 27.0, 34.0, 27.0, 44.0, 39.0, 37.0, 34.0, 31.0, 33.0, 39.0, 33.0, 28.0, 30.0, 30.0, 19.0, 13.0, 16.0, 18.0, 10.0, 15.0, 8.0, 10.0, 9.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.42619514465332, -4.284749984741211, -4.143304824829102, -4.001859188079834, -3.8604140281677246, -3.7189688682556152, -3.5775234699249268, -3.4360780715942383, -3.294632911682129, -3.1531877517700195, -3.011742353439331, -2.8702969551086426, -2.728851795196533, -2.587406635284424, -2.4459612369537354, -2.304515838623047, -2.1630706787109375, -2.021625518798828, -1.8801801204681396, -1.7387348413467407, -1.5972895622253418, -1.4558442831039429, -1.314399003982544, -1.172953724861145, -1.031508445739746, -0.8900631666183472, -0.7486178874969482, -0.6071726083755493, -0.4657273292541504, -0.32428205013275146, -0.18283677101135254, -0.04139149188995361, 0.10005378723144531, 0.24149906635284424, 0.38294434547424316, 0.5243896245956421, 0.665834903717041, 0.8072801828384399, 0.9487254619598389, 1.0901707410812378, 1.2316160202026367, 1.3730612993240356, 1.5145065784454346, 1.6559518575668335, 1.7973971366882324, 1.9388424158096313, 2.0802876949310303, 2.2217330932617188, 2.363178253173828, 2.5046234130859375, 2.646068811416626, 2.7875142097473145, 2.928959369659424, 3.070404529571533, 3.2118499279022217, 3.35329532623291, 3.4947404861450195, 3.636185646057129, 3.7776310443878174, 3.919076442718506, 4.060521602630615, 4.201966762542725, 4.343412399291992, 4.484857559204102, 4.626302719116211]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 10.0, 6.0, 12.0, 13.0, 9.0, 26.0, 21.0, 37.0, 44.0, 57.0, 103.0, 146.0, 195.0, 278.0, 467.0, 793.0, 1371.0, 3182.0, 11432.0, 65076.0, 592767.0, 323502.0, 36128.0, 7426.0, 2363.0, 1106.0, 644.0, 428.0, 294.0, 193.0, 109.0, 74.0, 57.0, 40.0, 37.0, 25.0, 32.0, 8.0, 14.0, 9.0, 9.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.7265625, -5.557373046875, -5.38818359375, -5.218994140625, -5.0498046875, -4.880615234375, -4.71142578125, -4.542236328125, -4.373046875, -4.203857421875, -4.03466796875, -3.865478515625, -3.6962890625, -3.527099609375, -3.35791015625, -3.188720703125, -3.01953125, -2.850341796875, -2.68115234375, -2.511962890625, -2.3427734375, -2.173583984375, -2.00439453125, -1.835205078125, -1.666015625, -1.496826171875, -1.32763671875, -1.158447265625, -0.9892578125, -0.820068359375, -0.65087890625, -0.481689453125, -0.3125, -0.143310546875, 0.02587890625, 0.195068359375, 0.3642578125, 0.533447265625, 0.70263671875, 0.871826171875, 1.041015625, 1.210205078125, 1.37939453125, 1.548583984375, 1.7177734375, 1.886962890625, 2.05615234375, 2.225341796875, 2.39453125, 2.563720703125, 2.73291015625, 2.902099609375, 3.0712890625, 3.240478515625, 3.40966796875, 3.578857421875, 3.748046875, 3.917236328125, 4.08642578125, 4.255615234375, 4.4248046875, 4.593994140625, 4.76318359375, 4.932373046875, 5.1015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 11.0, 28.0, 40.0, 64.0, 99.0, 144.0, 148.0, 145.0, 108.0, 78.0, 63.0, 30.0, 15.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.279296875, -2.2292938232421875, -2.179290771484375, -2.1292877197265625, -2.07928466796875, -2.0292816162109375, -1.979278564453125, -1.9292755126953125, -1.8792724609375, -1.8292694091796875, -1.779266357421875, -1.7292633056640625, -1.67926025390625, -1.6292572021484375, -1.579254150390625, -1.5292510986328125, -1.479248046875, -1.4292449951171875, -1.379241943359375, -1.3292388916015625, -1.27923583984375, -1.2292327880859375, -1.179229736328125, -1.1292266845703125, -1.0792236328125, -1.0292205810546875, -0.979217529296875, -0.9292144775390625, -0.87921142578125, -0.8292083740234375, -0.779205322265625, -0.7292022705078125, -0.67919921875, -0.6291961669921875, -0.579193115234375, -0.5291900634765625, -0.47918701171875, -0.4291839599609375, -0.379180908203125, -0.3291778564453125, -0.2791748046875, -0.2291717529296875, -0.179168701171875, -0.1291656494140625, -0.07916259765625, -0.0291595458984375, 0.020843505859375, 0.0708465576171875, 0.120849609375, 0.1708526611328125, 0.220855712890625, 0.2708587646484375, 0.32086181640625, 0.3708648681640625, 0.420867919921875, 0.4708709716796875, 0.5208740234375, 0.5708770751953125, 0.620880126953125, 0.6708831787109375, 0.72088623046875, 0.7708892822265625, 0.820892333984375, 0.8708953857421875, 0.9208984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 12.0, 16.0, 17.0, 21.0, 32.0, 37.0, 69.0, 76.0, 110.0, 197.0, 333.0, 560.0, 1136.0, 2669.0, 7762.0, 29026.0, 178786.0, 679566.0, 115427.0, 21965.0, 6173.0, 2304.0, 972.0, 463.0, 275.0, 165.0, 108.0, 75.0, 56.0, 34.0, 24.0, 21.0, 18.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.5252685546875, -5.343505859375, -5.1617431640625, -4.97998046875, -4.7982177734375, -4.616455078125, -4.4346923828125, -4.2529296875, -4.0711669921875, -3.889404296875, -3.7076416015625, -3.52587890625, -3.3441162109375, -3.162353515625, -2.9805908203125, -2.798828125, -2.6170654296875, -2.435302734375, -2.2535400390625, -2.07177734375, -1.8900146484375, -1.708251953125, -1.5264892578125, -1.3447265625, -1.1629638671875, -0.981201171875, -0.7994384765625, -0.61767578125, -0.4359130859375, -0.254150390625, -0.0723876953125, 0.109375, 0.2911376953125, 0.472900390625, 0.6546630859375, 0.83642578125, 1.0181884765625, 1.199951171875, 1.3817138671875, 1.5634765625, 1.7452392578125, 1.927001953125, 2.1087646484375, 2.29052734375, 2.4722900390625, 2.654052734375, 2.8358154296875, 3.017578125, 3.1993408203125, 3.381103515625, 3.5628662109375, 3.74462890625, 3.9263916015625, 4.108154296875, 4.2899169921875, 4.4716796875, 4.6534423828125, 4.835205078125, 5.0169677734375, 5.19873046875, 5.3804931640625, 5.562255859375, 5.7440185546875, 5.92578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 2.0, 5.0, 6.0, 6.0, 10.0, 16.0, 17.0, 19.0, 30.0, 27.0, 27.0, 26.0, 49.0, 42.0, 50.0, 50.0, 59.0, 46.0, 45.0, 47.0, 57.0, 39.0, 43.0, 49.0, 40.0, 36.0, 33.0, 21.0, 13.0, 11.0, 16.0, 11.0, 11.0, 9.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.8125, -4.67315673828125, -4.5338134765625, -4.39447021484375, -4.255126953125, -4.11578369140625, -3.9764404296875, -3.83709716796875, -3.69775390625, -3.55841064453125, -3.4190673828125, -3.27972412109375, -3.140380859375, -3.00103759765625, -2.8616943359375, -2.72235107421875, -2.5830078125, -2.44366455078125, -2.3043212890625, -2.16497802734375, -2.025634765625, -1.88629150390625, -1.7469482421875, -1.60760498046875, -1.46826171875, -1.32891845703125, -1.1895751953125, -1.05023193359375, -0.910888671875, -0.77154541015625, -0.6322021484375, -0.49285888671875, -0.353515625, -0.21417236328125, -0.0748291015625, 0.06451416015625, 0.203857421875, 0.34320068359375, 0.4825439453125, 0.62188720703125, 0.76123046875, 0.90057373046875, 1.0399169921875, 1.17926025390625, 1.318603515625, 1.45794677734375, 1.5972900390625, 1.73663330078125, 1.8759765625, 2.01531982421875, 2.1546630859375, 2.29400634765625, 2.433349609375, 2.57269287109375, 2.7120361328125, 2.85137939453125, 2.99072265625, 3.13006591796875, 3.2694091796875, 3.40875244140625, 3.548095703125, 3.68743896484375, 3.8267822265625, 3.96612548828125, 4.10546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 15.0, 20.0, 28.0, 41.0, 79.0, 100.0, 163.0, 331.0, 677.0, 1458.0, 3581.0, 11665.0, 72371.0, 768172.0, 163102.0, 18095.0, 5050.0, 1827.0, 800.0, 391.0, 212.0, 121.0, 73.0, 43.0, 29.0, 22.0, 20.0, 13.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.802215576171875, -1.74700927734375, -1.691802978515625, -1.6365966796875, -1.581390380859375, -1.52618408203125, -1.470977783203125, -1.415771484375, -1.360565185546875, -1.30535888671875, -1.250152587890625, -1.1949462890625, -1.139739990234375, -1.08453369140625, -1.029327392578125, -0.97412109375, -0.918914794921875, -0.86370849609375, -0.808502197265625, -0.7532958984375, -0.698089599609375, -0.64288330078125, -0.587677001953125, -0.532470703125, -0.477264404296875, -0.42205810546875, -0.366851806640625, -0.3116455078125, -0.256439208984375, -0.20123291015625, -0.146026611328125, -0.0908203125, -0.035614013671875, 0.01959228515625, 0.074798583984375, 0.1300048828125, 0.185211181640625, 0.24041748046875, 0.295623779296875, 0.350830078125, 0.406036376953125, 0.46124267578125, 0.516448974609375, 0.5716552734375, 0.626861572265625, 0.68206787109375, 0.737274169921875, 0.79248046875, 0.847686767578125, 0.90289306640625, 0.958099365234375, 1.0133056640625, 1.068511962890625, 1.12371826171875, 1.178924560546875, 1.234130859375, 1.289337158203125, 1.34454345703125, 1.399749755859375, 1.4549560546875, 1.510162353515625, 1.56536865234375, 1.620574951171875, 1.67578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 7.0, 4.0, 2.0, 11.0, 12.0, 7.0, 10.0, 18.0, 32.0, 37.0, 60.0, 65.0, 80.0, 108.0, 104.0, 119.0, 87.0, 75.0, 44.0, 32.0, 23.0, 18.0, 17.0, 9.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016954168677330017, -0.00016432255506515503, -0.0001591034233570099, -0.00015388429164886475, -0.0001486651599407196, -0.00014344602823257446, -0.00013822689652442932, -0.00013300776481628418, -0.00012778863310813904, -0.0001225695013999939, -0.00011735036969184875, -0.00011213123798370361, -0.00010691210627555847, -0.00010169297456741333, -9.647384285926819e-05, -9.125471115112305e-05, -8.60355794429779e-05, -8.081644773483276e-05, -7.559731602668762e-05, -7.037818431854248e-05, -6.515905261039734e-05, -5.99399209022522e-05, -5.4720789194107056e-05, -4.9501657485961914e-05, -4.428252577781677e-05, -3.906339406967163e-05, -3.384426236152649e-05, -2.8625130653381348e-05, -2.3405998945236206e-05, -1.8186867237091064e-05, -1.2967735528945923e-05, -7.748603820800781e-06, -2.5294721126556396e-06, 2.689659595489502e-06, 7.908791303634644e-06, 1.3127923011779785e-05, 1.8347054719924927e-05, 2.356618642807007e-05, 2.878531813621521e-05, 3.400444984436035e-05, 3.922358155250549e-05, 4.4442713260650635e-05, 4.9661844968795776e-05, 5.488097667694092e-05, 6.010010838508606e-05, 6.53192400932312e-05, 7.053837180137634e-05, 7.575750350952148e-05, 8.097663521766663e-05, 8.619576692581177e-05, 9.141489863395691e-05, 9.663403034210205e-05, 0.00010185316205024719, 0.00010707229375839233, 0.00011229142546653748, 0.00011751055717468262, 0.00012272968888282776, 0.0001279488205909729, 0.00013316795229911804, 0.00013838708400726318, 0.00014360621571540833, 0.00014882534742355347, 0.0001540444791316986, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 13.0, 24.0, 18.0, 22.0, 37.0, 66.0, 121.0, 191.0, 420.0, 918.0, 2602.0, 9819.0, 71547.0, 806281.0, 136755.0, 13926.0, 3500.0, 1214.0, 476.0, 225.0, 131.0, 83.0, 54.0, 37.0, 17.0, 9.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.900390625, -1.836212158203125, -1.77203369140625, -1.707855224609375, -1.6436767578125, -1.579498291015625, -1.51531982421875, -1.451141357421875, -1.386962890625, -1.322784423828125, -1.25860595703125, -1.194427490234375, -1.1302490234375, -1.066070556640625, -1.00189208984375, -0.937713623046875, -0.87353515625, -0.809356689453125, -0.74517822265625, -0.680999755859375, -0.6168212890625, -0.552642822265625, -0.48846435546875, -0.424285888671875, -0.360107421875, -0.295928955078125, -0.23175048828125, -0.167572021484375, -0.1033935546875, -0.039215087890625, 0.02496337890625, 0.089141845703125, 0.1533203125, 0.217498779296875, 0.28167724609375, 0.345855712890625, 0.4100341796875, 0.474212646484375, 0.53839111328125, 0.602569580078125, 0.666748046875, 0.730926513671875, 0.79510498046875, 0.859283447265625, 0.9234619140625, 0.987640380859375, 1.05181884765625, 1.115997314453125, 1.18017578125, 1.244354248046875, 1.30853271484375, 1.372711181640625, 1.4368896484375, 1.501068115234375, 1.56524658203125, 1.629425048828125, 1.693603515625, 1.757781982421875, 1.82196044921875, 1.886138916015625, 1.9503173828125, 2.014495849609375, 2.07867431640625, 2.142852783203125, 2.20703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 9.0, 8.0, 15.0, 16.0, 28.0, 51.0, 69.0, 65.0, 121.0, 123.0, 109.0, 104.0, 69.0, 57.0, 52.0, 29.0, 18.0, 9.0, 12.0, 9.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.237762451171875, -1.19329833984375, -1.148834228515625, -1.1043701171875, -1.059906005859375, -1.01544189453125, -0.970977783203125, -0.926513671875, -0.882049560546875, -0.83758544921875, -0.793121337890625, -0.7486572265625, -0.704193115234375, -0.65972900390625, -0.615264892578125, -0.57080078125, -0.526336669921875, -0.48187255859375, -0.437408447265625, -0.3929443359375, -0.348480224609375, -0.30401611328125, -0.259552001953125, -0.215087890625, -0.170623779296875, -0.12615966796875, -0.081695556640625, -0.0372314453125, 0.007232666015625, 0.05169677734375, 0.096160888671875, 0.140625, 0.185089111328125, 0.22955322265625, 0.274017333984375, 0.3184814453125, 0.362945556640625, 0.40740966796875, 0.451873779296875, 0.496337890625, 0.540802001953125, 0.58526611328125, 0.629730224609375, 0.6741943359375, 0.718658447265625, 0.76312255859375, 0.807586669921875, 0.85205078125, 0.896514892578125, 0.94097900390625, 0.985443115234375, 1.0299072265625, 1.074371337890625, 1.11883544921875, 1.163299560546875, 1.207763671875, 1.252227783203125, 1.29669189453125, 1.341156005859375, 1.3856201171875, 1.430084228515625, 1.47454833984375, 1.519012451171875, 1.5634765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 10.0, 10.0, 39.0, 71.0, 123.0, 256.0, 214.0, 128.0, 65.0, 33.0, 24.0, 16.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-56.603397369384766, -55.40073013305664, -54.19806671142578, -52.995399475097656, -51.79273223876953, -50.590065002441406, -49.38739776611328, -48.18473434448242, -46.9820671081543, -45.77939987182617, -44.57673645019531, -43.37406921386719, -42.17140197753906, -40.96873474121094, -39.76606750488281, -38.56340408325195, -37.36073684692383, -36.1580696105957, -34.955406188964844, -33.75273895263672, -32.550071716308594, -31.34740447998047, -30.144739151000977, -28.942073822021484, -27.73940658569336, -26.536739349365234, -25.334074020385742, -24.13140869140625, -22.928741455078125, -21.72607421875, -20.523408889770508, -19.320743560791016, -18.118072509765625, -16.9154052734375, -15.712739944458008, -14.5100736618042, -13.30740737915039, -12.104741096496582, -10.902074813842773, -9.699408531188965, -8.496742248535156, -7.294075965881348, -6.091409683227539, -4.8887434005737305, -3.686077117919922, -2.4834108352661133, -1.2807445526123047, -0.0780782699584961, 1.1245880126953125, 2.327254295349121, 3.5299205780029297, 4.732586860656738, 5.935253143310547, 7.1379194259643555, 8.340585708618164, 9.543251991271973, 10.745918273925781, 11.94858455657959, 13.151250839233398, 14.353917121887207, 15.556583404541016, 16.75925064086914, 17.961915969848633, 19.164581298828125, 20.36724853515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 16.0, 15.0, 17.0, 28.0, 37.0, 40.0, 47.0, 42.0, 38.0, 66.0, 60.0, 56.0, 62.0, 61.0, 59.0, 46.0, 47.0, 27.0, 45.0, 33.0, 20.0, 16.0, 22.0, 14.0, 13.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.730220794677734, -26.736408233642578, -25.742595672607422, -24.748783111572266, -23.75497055053711, -22.761157989501953, -21.767345428466797, -20.773530960083008, -19.77971839904785, -18.785905838012695, -17.79209327697754, -16.798280715942383, -15.80446720123291, -14.810654640197754, -13.816842079162598, -12.823028564453125, -11.829216957092285, -10.835404396057129, -9.841591835021973, -8.8477783203125, -7.853965759277344, -6.8601531982421875, -5.866340637207031, -4.872527599334717, -3.8787150382995605, -2.884902238845825, -1.8910895586013794, -0.8972768783569336, 0.09653592109680176, 1.090348720550537, 2.0841612815856934, 3.077974319458008, 4.071786880493164, 5.06559944152832, 6.059412479400635, 7.053225040435791, 8.047038078308105, 9.040850639343262, 10.034663200378418, 11.02847671508789, 12.022289276123047, 13.016101837158203, 14.00991439819336, 15.003726959228516, 15.997540473937988, 16.991352081298828, 17.985164642333984, 18.978979110717773, 19.972789764404297, 20.966602325439453, 21.96041488647461, 22.954227447509766, 23.948040008544922, 24.941852569580078, 25.935665130615234, 26.929479598999023, 27.92329216003418, 28.917104721069336, 29.910917282104492, 30.90472984313965, 31.898542404174805, 32.892356872558594, 33.88616943359375, 34.879981994628906, 35.87379455566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 12.0, 8.0, 11.0, 9.0, 16.0, 18.0, 21.0, 39.0, 45.0, 64.0, 70.0, 117.0, 207.0, 359.0, 622.0, 1449.0, 3878.0, 16860.0, 883026.0, 3262336.0, 18818.0, 3960.0, 1302.0, 517.0, 245.0, 134.0, 49.0, 29.0, 14.0, 13.0, 13.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.8125, -9.589599609375, -9.36669921875, -9.143798828125, -8.9208984375, -8.697998046875, -8.47509765625, -8.252197265625, -8.029296875, -7.806396484375, -7.58349609375, -7.360595703125, -7.1376953125, -6.914794921875, -6.69189453125, -6.468994140625, -6.24609375, -6.023193359375, -5.80029296875, -5.577392578125, -5.3544921875, -5.131591796875, -4.90869140625, -4.685791015625, -4.462890625, -4.239990234375, -4.01708984375, -3.794189453125, -3.5712890625, -3.348388671875, -3.12548828125, -2.902587890625, -2.6796875, -2.456787109375, -2.23388671875, -2.010986328125, -1.7880859375, -1.565185546875, -1.34228515625, -1.119384765625, -0.896484375, -0.673583984375, -0.45068359375, -0.227783203125, -0.0048828125, 0.218017578125, 0.44091796875, 0.663818359375, 0.88671875, 1.109619140625, 1.33251953125, 1.555419921875, 1.7783203125, 2.001220703125, 2.22412109375, 2.447021484375, 2.669921875, 2.892822265625, 3.11572265625, 3.338623046875, 3.5615234375, 3.784423828125, 4.00732421875, 4.230224609375, 4.453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 10.0, 18.0, 27.0, 49.0, 67.0, 95.0, 118.0, 119.0, 110.0, 93.0, 94.0, 64.0, 49.0, 31.0, 22.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.212890625, -2.163421630859375, -2.11395263671875, -2.064483642578125, -2.0150146484375, -1.965545654296875, -1.91607666015625, -1.866607666015625, -1.817138671875, -1.767669677734375, -1.71820068359375, -1.668731689453125, -1.6192626953125, -1.569793701171875, -1.52032470703125, -1.470855712890625, -1.42138671875, -1.371917724609375, -1.32244873046875, -1.272979736328125, -1.2235107421875, -1.174041748046875, -1.12457275390625, -1.075103759765625, -1.025634765625, -0.976165771484375, -0.92669677734375, -0.877227783203125, -0.8277587890625, -0.778289794921875, -0.72882080078125, -0.679351806640625, -0.6298828125, -0.580413818359375, -0.53094482421875, -0.481475830078125, -0.4320068359375, -0.382537841796875, -0.33306884765625, -0.283599853515625, -0.234130859375, -0.184661865234375, -0.13519287109375, -0.085723876953125, -0.0362548828125, 0.013214111328125, 0.06268310546875, 0.112152099609375, 0.16162109375, 0.211090087890625, 0.26055908203125, 0.310028076171875, 0.3594970703125, 0.408966064453125, 0.45843505859375, 0.507904052734375, 0.557373046875, 0.606842041015625, 0.65631103515625, 0.705780029296875, 0.7552490234375, 0.804718017578125, 0.85418701171875, 0.903656005859375, 0.953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 26.0, 37.0, 63.0, 181.0, 402.0, 1301.0, 5229.0, 43490.0, 4082617.0, 53471.0, 5503.0, 1238.0, 400.0, 142.0, 69.0, 41.0, 16.0, 13.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.81591796875, -11.4833984375, -11.15087890625, -10.818359375, -10.48583984375, -10.1533203125, -9.82080078125, -9.48828125, -9.15576171875, -8.8232421875, -8.49072265625, -8.158203125, -7.82568359375, -7.4931640625, -7.16064453125, -6.828125, -6.49560546875, -6.1630859375, -5.83056640625, -5.498046875, -5.16552734375, -4.8330078125, -4.50048828125, -4.16796875, -3.83544921875, -3.5029296875, -3.17041015625, -2.837890625, -2.50537109375, -2.1728515625, -1.84033203125, -1.5078125, -1.17529296875, -0.8427734375, -0.51025390625, -0.177734375, 0.15478515625, 0.4873046875, 0.81982421875, 1.15234375, 1.48486328125, 1.8173828125, 2.14990234375, 2.482421875, 2.81494140625, 3.1474609375, 3.47998046875, 3.8125, 4.14501953125, 4.4775390625, 4.81005859375, 5.142578125, 5.47509765625, 5.8076171875, 6.14013671875, 6.47265625, 6.80517578125, 7.1376953125, 7.47021484375, 7.802734375, 8.13525390625, 8.4677734375, 8.80029296875, 9.1328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 5.0, 9.0, 16.0, 13.0, 33.0, 55.0, 116.0, 401.0, 2759.0, 405.0, 116.0, 46.0, 24.0, 20.0, 12.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.48828125, -2.42193603515625, -2.3555908203125, -2.28924560546875, -2.222900390625, -2.15655517578125, -2.0902099609375, -2.02386474609375, -1.95751953125, -1.89117431640625, -1.8248291015625, -1.75848388671875, -1.692138671875, -1.62579345703125, -1.5594482421875, -1.49310302734375, -1.4267578125, -1.36041259765625, -1.2940673828125, -1.22772216796875, -1.161376953125, -1.09503173828125, -1.0286865234375, -0.96234130859375, -0.89599609375, -0.82965087890625, -0.7633056640625, -0.69696044921875, -0.630615234375, -0.56427001953125, -0.4979248046875, -0.43157958984375, -0.365234375, -0.29888916015625, -0.2325439453125, -0.16619873046875, -0.099853515625, -0.03350830078125, 0.0328369140625, 0.09918212890625, 0.16552734375, 0.23187255859375, 0.2982177734375, 0.36456298828125, 0.430908203125, 0.49725341796875, 0.5635986328125, 0.62994384765625, 0.6962890625, 0.76263427734375, 0.8289794921875, 0.89532470703125, 0.961669921875, 1.02801513671875, 1.0943603515625, 1.16070556640625, 1.22705078125, 1.29339599609375, 1.3597412109375, 1.42608642578125, 1.492431640625, 1.55877685546875, 1.6251220703125, 1.69146728515625, 1.7578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 26.0, 80.0, 282.0, 397.0, 153.0, 37.0, 10.0, 5.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171379566192627, -6.702581882476807, -6.233784198760986, -5.764986991882324, -5.296189308166504, -4.827391624450684, -4.358593940734863, -3.889796257019043, -3.4209985733032227, -2.9522008895874023, -2.483403205871582, -2.014605760574341, -1.5458080768585205, -1.0770103931427002, -0.608212947845459, -0.13941526412963867, 0.32938241958618164, 0.7981800436973572, 1.2669776678085327, 1.7357752323150635, 2.204572916030884, 2.673370599746704, 3.1421680450439453, 3.6109657287597656, 4.079763412475586, 4.548561096191406, 5.017358779907227, 5.486156463623047, 5.954954147338867, 6.4237518310546875, 6.89254903793335, 7.36134672164917, 7.830144882202148, 8.298942565917969, 8.767740249633789, 9.23653793334961, 9.70533561706543, 10.17413330078125, 10.64293098449707, 11.11172866821289, 11.580526351928711, 12.049324035644531, 12.518121719360352, 12.986919403076172, 13.455717086791992, 13.924514770507812, 14.393312454223633, 14.862110137939453, 15.330906867980957, 15.799704551696777, 16.26850128173828, 16.7372989654541, 17.206096649169922, 17.674894332885742, 18.143692016601562, 18.612489700317383, 19.081287384033203, 19.550085067749023, 20.018882751464844, 20.487680435180664, 20.956478118896484, 21.425275802612305, 21.894073486328125, 22.362871170043945, 22.831668853759766]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 19.0, 10.0, 16.0, 10.0, 17.0, 21.0, 26.0, 34.0, 36.0, 32.0, 41.0, 55.0, 54.0, 41.0, 35.0, 43.0, 45.0, 54.0, 46.0, 35.0, 46.0, 38.0, 33.0, 45.0, 25.0, 26.0, 15.0, 16.0, 13.0, 15.0, 12.0, 8.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1745686531066895, -4.03913688659668, -3.9037046432495117, -3.768272638320923, -3.632840633392334, -3.497408628463745, -3.3619766235351562, -3.2265448570251465, -3.0911126136779785, -2.9556806087493896, -2.820248603820801, -2.684816598892212, -2.549384593963623, -2.413952589035034, -2.2785205841064453, -2.1430888175964355, -2.0076568126678467, -1.8722248077392578, -1.736792802810669, -1.60136079788208, -1.4659287929534912, -1.3304967880249023, -1.195064902305603, -1.0596328973770142, -0.9242008924484253, -0.7887688875198364, -0.6533368825912476, -0.5179049372673035, -0.3824729323387146, -0.24704092741012573, -0.11160898208618164, 0.023823022842407227, 0.1592550277709961, 0.29468703269958496, 0.43011900782585144, 0.5655509829521179, 0.7009829878807068, 0.8364149928092957, 0.9718469381332397, 1.1072789430618286, 1.2427109479904175, 1.3781429529190063, 1.5135749578475952, 1.6490068435668945, 1.7844388484954834, 1.9198708534240723, 2.055302858352661, 2.19073486328125, 2.326166868209839, 2.4615988731384277, 2.5970308780670166, 2.7324628829956055, 2.8678948879241943, 3.003326892852783, 3.138758659362793, 3.274190902709961, 3.4096226692199707, 3.5450546741485596, 3.6804866790771484, 3.8159186840057373, 3.951350688934326, 4.086782455444336, 4.222214698791504, 4.357646465301514, 4.493078708648682]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 7.0, 14.0, 15.0, 20.0, 28.0, 60.0, 57.0, 95.0, 156.0, 207.0, 392.0, 744.0, 1658.0, 4591.0, 19668.0, 166799.0, 729114.0, 104044.0, 14325.0, 3618.0, 1362.0, 650.0, 319.0, 195.0, 125.0, 85.0, 65.0, 33.0, 28.0, 19.0, 16.0, 12.0, 9.0, 0.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.0078125, -6.8153076171875, -6.622802734375, -6.4302978515625, -6.23779296875, -6.0452880859375, -5.852783203125, -5.6602783203125, -5.4677734375, -5.2752685546875, -5.082763671875, -4.8902587890625, -4.69775390625, -4.5052490234375, -4.312744140625, -4.1202392578125, -3.927734375, -3.7352294921875, -3.542724609375, -3.3502197265625, -3.15771484375, -2.9652099609375, -2.772705078125, -2.5802001953125, -2.3876953125, -2.1951904296875, -2.002685546875, -1.8101806640625, -1.61767578125, -1.4251708984375, -1.232666015625, -1.0401611328125, -0.84765625, -0.6551513671875, -0.462646484375, -0.2701416015625, -0.07763671875, 0.1148681640625, 0.307373046875, 0.4998779296875, 0.6923828125, 0.8848876953125, 1.077392578125, 1.2698974609375, 1.46240234375, 1.6549072265625, 1.847412109375, 2.0399169921875, 2.232421875, 2.4249267578125, 2.617431640625, 2.8099365234375, 3.00244140625, 3.1949462890625, 3.387451171875, 3.5799560546875, 3.7724609375, 3.9649658203125, 4.157470703125, 4.3499755859375, 4.54248046875, 4.7349853515625, 4.927490234375, 5.1199951171875, 5.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 12.0, 18.0, 30.0, 52.0, 78.0, 89.0, 118.0, 101.0, 108.0, 119.0, 87.0, 68.0, 49.0, 26.0, 14.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.208984375, -2.159576416015625, -2.11016845703125, -2.060760498046875, -2.0113525390625, -1.961944580078125, -1.91253662109375, -1.863128662109375, -1.813720703125, -1.764312744140625, -1.71490478515625, -1.665496826171875, -1.6160888671875, -1.566680908203125, -1.51727294921875, -1.467864990234375, -1.41845703125, -1.369049072265625, -1.31964111328125, -1.270233154296875, -1.2208251953125, -1.171417236328125, -1.12200927734375, -1.072601318359375, -1.023193359375, -0.973785400390625, -0.92437744140625, -0.874969482421875, -0.8255615234375, -0.776153564453125, -0.72674560546875, -0.677337646484375, -0.6279296875, -0.578521728515625, -0.52911376953125, -0.479705810546875, -0.4302978515625, -0.380889892578125, -0.33148193359375, -0.282073974609375, -0.232666015625, -0.183258056640625, -0.13385009765625, -0.084442138671875, -0.0350341796875, 0.014373779296875, 0.06378173828125, 0.113189697265625, 0.16259765625, 0.212005615234375, 0.26141357421875, 0.310821533203125, 0.3602294921875, 0.409637451171875, 0.45904541015625, 0.508453369140625, 0.557861328125, 0.607269287109375, 0.65667724609375, 0.706085205078125, 0.7554931640625, 0.804901123046875, 0.85430908203125, 0.903717041015625, 0.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 11.0, 12.0, 17.0, 17.0, 20.0, 28.0, 40.0, 76.0, 115.0, 207.0, 492.0, 1081.0, 3011.0, 12714.0, 81161.0, 693694.0, 221158.0, 26266.0, 5384.0, 1645.0, 621.0, 286.0, 158.0, 91.0, 54.0, 38.0, 26.0, 30.0, 19.0, 10.0, 16.0, 12.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -5.95294189453125, -5.7301025390625, -5.50726318359375, -5.284423828125, -5.06158447265625, -4.8387451171875, -4.61590576171875, -4.39306640625, -4.17022705078125, -3.9473876953125, -3.72454833984375, -3.501708984375, -3.27886962890625, -3.0560302734375, -2.83319091796875, -2.6103515625, -2.38751220703125, -2.1646728515625, -1.94183349609375, -1.718994140625, -1.49615478515625, -1.2733154296875, -1.05047607421875, -0.82763671875, -0.60479736328125, -0.3819580078125, -0.15911865234375, 0.063720703125, 0.28656005859375, 0.5093994140625, 0.73223876953125, 0.955078125, 1.17791748046875, 1.4007568359375, 1.62359619140625, 1.846435546875, 2.06927490234375, 2.2921142578125, 2.51495361328125, 2.73779296875, 2.96063232421875, 3.1834716796875, 3.40631103515625, 3.629150390625, 3.85198974609375, 4.0748291015625, 4.29766845703125, 4.5205078125, 4.74334716796875, 4.9661865234375, 5.18902587890625, 5.411865234375, 5.63470458984375, 5.8575439453125, 6.08038330078125, 6.30322265625, 6.52606201171875, 6.7489013671875, 6.97174072265625, 7.194580078125, 7.41741943359375, 7.6402587890625, 7.86309814453125, 8.0859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 15.0, 17.0, 17.0, 23.0, 23.0, 29.0, 32.0, 37.0, 37.0, 31.0, 52.0, 48.0, 52.0, 47.0, 38.0, 45.0, 41.0, 50.0, 48.0, 25.0, 41.0, 37.0, 14.0, 30.0, 29.0, 13.0, 26.0, 15.0, 9.0, 10.0, 4.0, 9.0, 10.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.27191162109375, -4.1375732421875, -4.00323486328125, -3.868896484375, -3.73455810546875, -3.6002197265625, -3.46588134765625, -3.33154296875, -3.19720458984375, -3.0628662109375, -2.92852783203125, -2.794189453125, -2.65985107421875, -2.5255126953125, -2.39117431640625, -2.2568359375, -2.12249755859375, -1.9881591796875, -1.85382080078125, -1.719482421875, -1.58514404296875, -1.4508056640625, -1.31646728515625, -1.18212890625, -1.04779052734375, -0.9134521484375, -0.77911376953125, -0.644775390625, -0.51043701171875, -0.3760986328125, -0.24176025390625, -0.107421875, 0.02691650390625, 0.1612548828125, 0.29559326171875, 0.429931640625, 0.56427001953125, 0.6986083984375, 0.83294677734375, 0.96728515625, 1.10162353515625, 1.2359619140625, 1.37030029296875, 1.504638671875, 1.63897705078125, 1.7733154296875, 1.90765380859375, 2.0419921875, 2.17633056640625, 2.3106689453125, 2.44500732421875, 2.579345703125, 2.71368408203125, 2.8480224609375, 2.98236083984375, 3.11669921875, 3.25103759765625, 3.3853759765625, 3.51971435546875, 3.654052734375, 3.78839111328125, 3.9227294921875, 4.05706787109375, 4.19140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 18.0, 23.0, 49.0, 45.0, 87.0, 120.0, 220.0, 390.0, 823.0, 1847.0, 5409.0, 23428.0, 213738.0, 697873.0, 85221.0, 12781.0, 3639.0, 1375.0, 614.0, 308.0, 182.0, 111.0, 66.0, 48.0, 36.0, 19.0, 14.0, 13.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6103515625, -1.558929443359375, -1.50750732421875, -1.456085205078125, -1.4046630859375, -1.353240966796875, -1.30181884765625, -1.250396728515625, -1.198974609375, -1.147552490234375, -1.09613037109375, -1.044708251953125, -0.9932861328125, -0.941864013671875, -0.89044189453125, -0.839019775390625, -0.78759765625, -0.736175537109375, -0.68475341796875, -0.633331298828125, -0.5819091796875, -0.530487060546875, -0.47906494140625, -0.427642822265625, -0.376220703125, -0.324798583984375, -0.27337646484375, -0.221954345703125, -0.1705322265625, -0.119110107421875, -0.06768798828125, -0.016265869140625, 0.03515625, 0.086578369140625, 0.13800048828125, 0.189422607421875, 0.2408447265625, 0.292266845703125, 0.34368896484375, 0.395111083984375, 0.446533203125, 0.497955322265625, 0.54937744140625, 0.600799560546875, 0.6522216796875, 0.703643798828125, 0.75506591796875, 0.806488037109375, 0.85791015625, 0.909332275390625, 0.96075439453125, 1.012176513671875, 1.0635986328125, 1.115020751953125, 1.16644287109375, 1.217864990234375, 1.269287109375, 1.320709228515625, 1.37213134765625, 1.423553466796875, 1.4749755859375, 1.526397705078125, 1.57781982421875, 1.629241943359375, 1.6806640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 5.0, 6.0, 4.0, 8.0, 19.0, 17.0, 37.0, 35.0, 42.0, 66.0, 84.0, 103.0, 111.0, 115.0, 93.0, 66.0, 56.0, 37.0, 31.0, 15.0, 14.0, 9.0, 5.0, 5.0, 4.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00023698806762695312, -0.0002310425043106079, -0.0002250969409942627, -0.00021915137767791748, -0.00021320581436157227, -0.00020726025104522705, -0.00020131468772888184, -0.00019536912441253662, -0.0001894235610961914, -0.0001834779977798462, -0.00017753243446350098, -0.00017158687114715576, -0.00016564130783081055, -0.00015969574451446533, -0.00015375018119812012, -0.0001478046178817749, -0.0001418590545654297, -0.00013591349124908447, -0.00012996792793273926, -0.00012402236461639404, -0.00011807680130004883, -0.00011213123798370361, -0.0001061856746673584, -0.00010024011135101318, -9.429454803466797e-05, -8.834898471832275e-05, -8.240342140197754e-05, -7.645785808563232e-05, -7.051229476928711e-05, -6.45667314529419e-05, -5.862116813659668e-05, -5.2675604820251465e-05, -4.673004150390625e-05, -4.0784478187561035e-05, -3.483891487121582e-05, -2.8893351554870605e-05, -2.294778823852539e-05, -1.7002224922180176e-05, -1.1056661605834961e-05, -5.111098289489746e-06, 8.344650268554688e-07, 6.780028343200684e-06, 1.2725591659545898e-05, 1.8671154975891113e-05, 2.4616718292236328e-05, 3.056228160858154e-05, 3.650784492492676e-05, 4.245340824127197e-05, 4.839897155761719e-05, 5.43445348739624e-05, 6.029009819030762e-05, 6.623566150665283e-05, 7.218122482299805e-05, 7.812678813934326e-05, 8.407235145568848e-05, 9.001791477203369e-05, 9.59634780883789e-05, 0.00010190904140472412, 0.00010785460472106934, 0.00011380016803741455, 0.00011974573135375977, 0.00012569129467010498, 0.0001316368579864502, 0.0001375824213027954, 0.00014352798461914062]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 12.0, 12.0, 16.0, 21.0, 39.0, 45.0, 99.0, 206.0, 475.0, 1467.0, 6483.0, 67782.0, 868546.0, 93096.0, 7572.0, 1600.0, 574.0, 236.0, 111.0, 54.0, 32.0, 28.0, 13.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.857421875, -2.772247314453125, -2.68707275390625, -2.601898193359375, -2.5167236328125, -2.431549072265625, -2.34637451171875, -2.261199951171875, -2.176025390625, -2.090850830078125, -2.00567626953125, -1.920501708984375, -1.8353271484375, -1.750152587890625, -1.66497802734375, -1.579803466796875, -1.49462890625, -1.409454345703125, -1.32427978515625, -1.239105224609375, -1.1539306640625, -1.068756103515625, -0.98358154296875, -0.898406982421875, -0.813232421875, -0.728057861328125, -0.64288330078125, -0.557708740234375, -0.4725341796875, -0.387359619140625, -0.30218505859375, -0.217010498046875, -0.1318359375, -0.046661376953125, 0.03851318359375, 0.123687744140625, 0.2088623046875, 0.294036865234375, 0.37921142578125, 0.464385986328125, 0.549560546875, 0.634735107421875, 0.71990966796875, 0.805084228515625, 0.8902587890625, 0.975433349609375, 1.06060791015625, 1.145782470703125, 1.23095703125, 1.316131591796875, 1.40130615234375, 1.486480712890625, 1.5716552734375, 1.656829833984375, 1.74200439453125, 1.827178955078125, 1.912353515625, 1.997528076171875, 2.08270263671875, 2.167877197265625, 2.2530517578125, 2.338226318359375, 2.42340087890625, 2.508575439453125, 2.59375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 15.0, 14.0, 18.0, 13.0, 20.0, 33.0, 33.0, 47.0, 80.0, 90.0, 81.0, 103.0, 100.0, 88.0, 80.0, 46.0, 41.0, 24.0, 16.0, 15.0, 9.0, 6.0, 2.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4716644287109375, -1.428680419921875, -1.3856964111328125, -1.34271240234375, -1.2997283935546875, -1.256744384765625, -1.2137603759765625, -1.1707763671875, -1.1277923583984375, -1.084808349609375, -1.0418243408203125, -0.99884033203125, -0.9558563232421875, -0.912872314453125, -0.8698883056640625, -0.826904296875, -0.7839202880859375, -0.740936279296875, -0.6979522705078125, -0.65496826171875, -0.6119842529296875, -0.569000244140625, -0.5260162353515625, -0.4830322265625, -0.4400482177734375, -0.397064208984375, -0.3540802001953125, -0.31109619140625, -0.2681121826171875, -0.225128173828125, -0.1821441650390625, -0.13916015625, -0.0961761474609375, -0.053192138671875, -0.0102081298828125, 0.03277587890625, 0.0757598876953125, 0.118743896484375, 0.1617279052734375, 0.2047119140625, 0.2476959228515625, 0.290679931640625, 0.3336639404296875, 0.37664794921875, 0.4196319580078125, 0.462615966796875, 0.5055999755859375, 0.548583984375, 0.5915679931640625, 0.634552001953125, 0.6775360107421875, 0.72052001953125, 0.7635040283203125, 0.806488037109375, 0.8494720458984375, 0.8924560546875, 0.9354400634765625, 0.978424072265625, 1.0214080810546875, 1.06439208984375, 1.1073760986328125, 1.150360107421875, 1.1933441162109375, 1.236328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 12.0, 13.0, 48.0, 128.0, 336.0, 294.0, 90.0, 37.0, 28.0, 11.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.10966491699219, -57.464717864990234, -55.819766998291016, -54.17481994628906, -52.529869079589844, -50.88492202758789, -49.23997497558594, -47.59502410888672, -45.950077056884766, -44.30513000488281, -42.660179138183594, -41.01523208618164, -39.37028503417969, -37.72533416748047, -36.080387115478516, -34.43544006347656, -32.790489196777344, -31.145540237426758, -29.500591278076172, -27.85564422607422, -26.210695266723633, -24.565746307373047, -22.920799255371094, -21.275850296020508, -19.630901336669922, -17.985952377319336, -16.34100341796875, -14.696056365966797, -13.051107406616211, -11.406158447265625, -9.761210441589355, -8.116262435913086, -6.471317291259766, -4.826368808746338, -3.18142032623291, -1.5364718437194824, 0.10847663879394531, 1.7534255981445312, 3.398373603820801, 5.04332160949707, 6.688270568847656, 8.333219528198242, 9.978167533874512, 11.623115539550781, 13.268064498901367, 14.913013458251953, 16.557960510253906, 18.202909469604492, 19.847858428955078, 21.492807388305664, 23.13775634765625, 24.782703399658203, 26.42765235900879, 28.072601318359375, 29.717548370361328, 31.362497329711914, 33.0074462890625, 34.65239334106445, 36.29734420776367, 37.942291259765625, 39.587242126464844, 41.2321891784668, 42.87713623046875, 44.52208709716797, 46.16703414916992]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 12.0, 8.0, 14.0, 20.0, 17.0, 22.0, 32.0, 42.0, 56.0, 57.0, 70.0, 71.0, 70.0, 70.0, 66.0, 55.0, 56.0, 44.0, 50.0, 47.0, 32.0, 23.0, 19.0, 18.0, 9.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40410614013672, -23.30684471130371, -22.209583282470703, -21.112323760986328, -20.01506233215332, -18.917800903320312, -17.820541381835938, -16.72327995300293, -15.626018524169922, -14.528757095336914, -13.431496620178223, -12.334236145019531, -11.236974716186523, -10.139713287353516, -9.042452812194824, -7.945191860198975, -6.847930908203125, -5.750669956207275, -4.653409004211426, -3.556148052215576, -2.4588871002197266, -1.361626148223877, -0.26436519622802734, 0.8328957557678223, 1.9301567077636719, 3.0274176597595215, 4.124678611755371, 5.221939563751221, 6.31920051574707, 7.41646146774292, 8.51372241973877, 9.610982894897461, 10.708248138427734, 11.805509567260742, 12.902770042419434, 14.000030517578125, 15.097291946411133, 16.19455337524414, 17.291812896728516, 18.389074325561523, 19.48633575439453, 20.58359718322754, 21.680858612060547, 22.778118133544922, 23.87537956237793, 24.972640991210938, 26.069900512695312, 27.16716194152832, 28.264423370361328, 29.361684799194336, 30.458946228027344, 31.55620574951172, 32.653465270996094, 33.750728607177734, 34.84798812866211, 35.94525146484375, 37.042510986328125, 38.1397705078125, 39.23703384399414, 40.334293365478516, 41.431556701660156, 42.52881622314453, 43.626075744628906, 44.72333908081055, 45.82059860229492]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 1.0, 5.0, 6.0, 9.0, 8.0, 7.0, 10.0, 12.0, 23.0, 31.0, 43.0, 45.0, 58.0, 87.0, 138.0, 201.0, 349.0, 615.0, 1305.0, 3436.0, 11807.0, 95584.0, 3964518.0, 98936.0, 11909.0, 3109.0, 1103.0, 477.0, 205.0, 93.0, 51.0, 41.0, 25.0, 12.0, 4.0, 4.0, 9.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.140625, -8.93048095703125, -8.7203369140625, -8.51019287109375, -8.300048828125, -8.08990478515625, -7.8797607421875, -7.66961669921875, -7.45947265625, -7.24932861328125, -7.0391845703125, -6.82904052734375, -6.618896484375, -6.40875244140625, -6.1986083984375, -5.98846435546875, -5.7783203125, -5.56817626953125, -5.3580322265625, -5.14788818359375, -4.937744140625, -4.72760009765625, -4.5174560546875, -4.30731201171875, -4.09716796875, -3.88702392578125, -3.6768798828125, -3.46673583984375, -3.256591796875, -3.04644775390625, -2.8363037109375, -2.62615966796875, -2.416015625, -2.20587158203125, -1.9957275390625, -1.78558349609375, -1.575439453125, -1.36529541015625, -1.1551513671875, -0.94500732421875, -0.73486328125, -0.52471923828125, -0.3145751953125, -0.10443115234375, 0.105712890625, 0.31585693359375, 0.5260009765625, 0.73614501953125, 0.9462890625, 1.15643310546875, 1.3665771484375, 1.57672119140625, 1.786865234375, 1.99700927734375, 2.2071533203125, 2.41729736328125, 2.62744140625, 2.83758544921875, 3.0477294921875, 3.25787353515625, 3.468017578125, 3.67816162109375, 3.8883056640625, 4.09844970703125, 4.30859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 16.0, 29.0, 38.0, 56.0, 77.0, 114.0, 106.0, 128.0, 115.0, 96.0, 73.0, 62.0, 34.0, 22.0, 12.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.1389007568359375, -2.084442138671875, -2.0299835205078125, -1.97552490234375, -1.9210662841796875, -1.866607666015625, -1.8121490478515625, -1.7576904296875, -1.7032318115234375, -1.648773193359375, -1.5943145751953125, -1.53985595703125, -1.4853973388671875, -1.430938720703125, -1.3764801025390625, -1.322021484375, -1.2675628662109375, -1.213104248046875, -1.1586456298828125, -1.10418701171875, -1.0497283935546875, -0.995269775390625, -0.9408111572265625, -0.8863525390625, -0.8318939208984375, -0.777435302734375, -0.7229766845703125, -0.66851806640625, -0.6140594482421875, -0.559600830078125, -0.5051422119140625, -0.45068359375, -0.3962249755859375, -0.341766357421875, -0.2873077392578125, -0.23284912109375, -0.1783905029296875, -0.123931884765625, -0.0694732666015625, -0.0150146484375, 0.0394439697265625, 0.093902587890625, 0.1483612060546875, 0.20281982421875, 0.2572784423828125, 0.311737060546875, 0.3661956787109375, 0.420654296875, 0.4751129150390625, 0.529571533203125, 0.5840301513671875, 0.63848876953125, 0.6929473876953125, 0.747406005859375, 0.8018646240234375, 0.8563232421875, 0.9107818603515625, 0.965240478515625, 1.0196990966796875, 1.07415771484375, 1.1286163330078125, 1.183074951171875, 1.2375335693359375, 1.2919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 10.0, 5.0, 14.0, 15.0, 20.0, 32.0, 49.0, 134.0, 290.0, 567.0, 1480.0, 5356.0, 32799.0, 3665627.0, 464369.0, 17880.0, 3469.0, 1159.0, 489.0, 249.0, 112.0, 66.0, 25.0, 14.0, 15.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.11712646484375, -6.8787841796875, -6.64044189453125, -6.402099609375, -6.16375732421875, -5.9254150390625, -5.68707275390625, -5.44873046875, -5.21038818359375, -4.9720458984375, -4.73370361328125, -4.495361328125, -4.25701904296875, -4.0186767578125, -3.78033447265625, -3.5419921875, -3.30364990234375, -3.0653076171875, -2.82696533203125, -2.588623046875, -2.35028076171875, -2.1119384765625, -1.87359619140625, -1.63525390625, -1.39691162109375, -1.1585693359375, -0.92022705078125, -0.681884765625, -0.44354248046875, -0.2052001953125, 0.03314208984375, 0.271484375, 0.50982666015625, 0.7481689453125, 0.98651123046875, 1.224853515625, 1.46319580078125, 1.7015380859375, 1.93988037109375, 2.17822265625, 2.41656494140625, 2.6549072265625, 2.89324951171875, 3.131591796875, 3.36993408203125, 3.6082763671875, 3.84661865234375, 4.0849609375, 4.32330322265625, 4.5616455078125, 4.79998779296875, 5.038330078125, 5.27667236328125, 5.5150146484375, 5.75335693359375, 5.99169921875, 6.23004150390625, 6.4683837890625, 6.70672607421875, 6.945068359375, 7.18341064453125, 7.4217529296875, 7.66009521484375, 7.8984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 11.0, 19.0, 36.0, 44.0, 95.0, 166.0, 493.0, 2179.0, 539.0, 211.0, 89.0, 49.0, 33.0, 21.0, 16.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.341796875, -2.269775390625, -2.19775390625, -2.125732421875, -2.0537109375, -1.981689453125, -1.90966796875, -1.837646484375, -1.765625, -1.693603515625, -1.62158203125, -1.549560546875, -1.4775390625, -1.405517578125, -1.33349609375, -1.261474609375, -1.189453125, -1.117431640625, -1.04541015625, -0.973388671875, -0.9013671875, -0.829345703125, -0.75732421875, -0.685302734375, -0.61328125, -0.541259765625, -0.46923828125, -0.397216796875, -0.3251953125, -0.253173828125, -0.18115234375, -0.109130859375, -0.037109375, 0.034912109375, 0.10693359375, 0.178955078125, 0.2509765625, 0.322998046875, 0.39501953125, 0.467041015625, 0.5390625, 0.611083984375, 0.68310546875, 0.755126953125, 0.8271484375, 0.899169921875, 0.97119140625, 1.043212890625, 1.115234375, 1.187255859375, 1.25927734375, 1.331298828125, 1.4033203125, 1.475341796875, 1.54736328125, 1.619384765625, 1.69140625, 1.763427734375, 1.83544921875, 1.907470703125, 1.9794921875, 2.051513671875, 2.12353515625, 2.195556640625, 2.267578125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 33.0, 115.0, 292.0, 350.0, 144.0, 42.0, 11.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84033203125, -18.169384002685547, -17.498435974121094, -16.82748794555664, -16.15654182434082, -15.485593795776367, -14.814645767211914, -14.143697738647461, -13.472749710083008, -12.801801681518555, -12.130854606628418, -11.459906578063965, -10.788958549499512, -10.118011474609375, -9.447063446044922, -8.776115417480469, -8.105168342590332, -7.434220790863037, -6.763272762298584, -6.092325210571289, -5.421377182006836, -4.750429630279541, -4.079482078552246, -3.408534049987793, -2.737586498260498, -2.066638708114624, -1.3956910371780396, -0.7247433662414551, -0.053795576095581055, 0.617152214050293, 1.288099765777588, 1.959047794342041, 2.629995346069336, 3.30094313621521, 3.971890926361084, 4.642838478088379, 5.313786506652832, 5.984734058380127, 6.655681610107422, 7.326629638671875, 7.99757719039917, 8.668524742126465, 9.339472770690918, 10.010419845581055, 10.681367874145508, 11.352315902709961, 12.023263931274414, 12.694211959838867, 13.365159034729004, 14.036107063293457, 14.707054138183594, 15.378002166748047, 16.0489501953125, 16.719898223876953, 17.390846252441406, 18.06179428100586, 18.73274040222168, 19.403688430786133, 20.074636459350586, 20.745582580566406, 21.41653060913086, 22.087478637695312, 22.758426666259766, 23.42937469482422, 24.100322723388672]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 11.0, 12.0, 15.0, 15.0, 19.0, 22.0, 19.0, 27.0, 27.0, 26.0, 32.0, 37.0, 50.0, 37.0, 34.0, 46.0, 35.0, 33.0, 50.0, 50.0, 47.0, 49.0, 28.0, 42.0, 37.0, 27.0, 27.0, 20.0, 17.0, 20.0, 11.0, 15.0, 10.0, 6.0, 10.0, 6.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.818304061889648, -5.642192363739014, -5.466080665588379, -5.289968490600586, -5.113856792449951, -4.937745094299316, -4.761633396148682, -4.585521697998047, -4.409409999847412, -4.233298301696777, -4.057186603546143, -3.8810746669769287, -3.704962968826294, -3.52885103225708, -3.3527393341064453, -3.1766276359558105, -3.0005156993865967, -2.824404001235962, -2.648292064666748, -2.4721803665161133, -2.2960686683654785, -2.1199569702148438, -1.9438450336456299, -1.7677333354949951, -1.5916215181350708, -1.4155097007751465, -1.2393980026245117, -1.0632861852645874, -0.8871744275093079, -0.7110626697540283, -0.534950852394104, -0.35883915424346924, -0.18272733688354492, -0.006615564227104187, 0.16949620842933655, 0.3456079959869385, 0.521719753742218, 0.6978315114974976, 0.8739433288574219, 1.0500550270080566, 1.226166844367981, 1.4022786617279053, 1.57839035987854, 1.7545021772384644, 1.9306139945983887, 2.1067256927490234, 2.282837390899658, 2.458949089050293, 2.635061025619507, 2.8111727237701416, 2.9872846603393555, 3.1633963584899902, 3.339508056640625, 3.5156197547912598, 3.6917316913604736, 3.8678433895111084, 4.043955326080322, 4.220067024230957, 4.396178722381592, 4.572290420532227, 4.7484025955200195, 4.924514293670654, 5.100625991821289, 5.276737689971924, 5.452849388122559]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 14.0, 8.0, 13.0, 23.0, 30.0, 40.0, 62.0, 90.0, 157.0, 241.0, 459.0, 825.0, 1736.0, 5273.0, 26074.0, 229131.0, 698101.0, 69653.0, 11191.0, 2882.0, 1121.0, 587.0, 297.0, 191.0, 107.0, 81.0, 39.0, 26.0, 19.0, 29.0, 19.0, 11.0, 5.0, 9.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5084228515625, -5.290283203125, -5.0721435546875, -4.85400390625, -4.6358642578125, -4.417724609375, -4.1995849609375, -3.9814453125, -3.7633056640625, -3.545166015625, -3.3270263671875, -3.10888671875, -2.8907470703125, -2.672607421875, -2.4544677734375, -2.236328125, -2.0181884765625, -1.800048828125, -1.5819091796875, -1.36376953125, -1.1456298828125, -0.927490234375, -0.7093505859375, -0.4912109375, -0.2730712890625, -0.054931640625, 0.1632080078125, 0.38134765625, 0.5994873046875, 0.817626953125, 1.0357666015625, 1.25390625, 1.4720458984375, 1.690185546875, 1.9083251953125, 2.12646484375, 2.3446044921875, 2.562744140625, 2.7808837890625, 2.9990234375, 3.2171630859375, 3.435302734375, 3.6534423828125, 3.87158203125, 4.0897216796875, 4.307861328125, 4.5260009765625, 4.744140625, 4.9622802734375, 5.180419921875, 5.3985595703125, 5.61669921875, 5.8348388671875, 6.052978515625, 6.2711181640625, 6.4892578125, 6.7073974609375, 6.925537109375, 7.1436767578125, 7.36181640625, 7.5799560546875, 7.798095703125, 8.0162353515625, 8.234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 9.0, 13.0, 34.0, 40.0, 52.0, 84.0, 97.0, 132.0, 122.0, 103.0, 97.0, 68.0, 57.0, 38.0, 22.0, 18.0, 6.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.296875, -2.243682861328125, -2.19049072265625, -2.137298583984375, -2.0841064453125, -2.030914306640625, -1.97772216796875, -1.924530029296875, -1.871337890625, -1.818145751953125, -1.76495361328125, -1.711761474609375, -1.6585693359375, -1.605377197265625, -1.55218505859375, -1.498992919921875, -1.44580078125, -1.392608642578125, -1.33941650390625, -1.286224365234375, -1.2330322265625, -1.179840087890625, -1.12664794921875, -1.073455810546875, -1.020263671875, -0.967071533203125, -0.91387939453125, -0.860687255859375, -0.8074951171875, -0.754302978515625, -0.70111083984375, -0.647918701171875, -0.5947265625, -0.541534423828125, -0.48834228515625, -0.435150146484375, -0.3819580078125, -0.328765869140625, -0.27557373046875, -0.222381591796875, -0.169189453125, -0.115997314453125, -0.06280517578125, -0.009613037109375, 0.0435791015625, 0.096771240234375, 0.14996337890625, 0.203155517578125, 0.25634765625, 0.309539794921875, 0.36273193359375, 0.415924072265625, 0.4691162109375, 0.522308349609375, 0.57550048828125, 0.628692626953125, 0.681884765625, 0.735076904296875, 0.78826904296875, 0.841461181640625, 0.8946533203125, 0.947845458984375, 1.00103759765625, 1.054229736328125, 1.107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 7.0, 5.0, 12.0, 20.0, 28.0, 38.0, 57.0, 85.0, 178.0, 340.0, 750.0, 1863.0, 6613.0, 30869.0, 260508.0, 659036.0, 70118.0, 12319.0, 3510.0, 1125.0, 494.0, 254.0, 120.0, 80.0, 35.0, 34.0, 17.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84765625, -7.6182861328125, -7.388916015625, -7.1595458984375, -6.93017578125, -6.7008056640625, -6.471435546875, -6.2420654296875, -6.0126953125, -5.7833251953125, -5.553955078125, -5.3245849609375, -5.09521484375, -4.8658447265625, -4.636474609375, -4.4071044921875, -4.177734375, -3.9483642578125, -3.718994140625, -3.4896240234375, -3.26025390625, -3.0308837890625, -2.801513671875, -2.5721435546875, -2.3427734375, -2.1134033203125, -1.884033203125, -1.6546630859375, -1.42529296875, -1.1959228515625, -0.966552734375, -0.7371826171875, -0.5078125, -0.2784423828125, -0.049072265625, 0.1802978515625, 0.40966796875, 0.6390380859375, 0.868408203125, 1.0977783203125, 1.3271484375, 1.5565185546875, 1.785888671875, 2.0152587890625, 2.24462890625, 2.4739990234375, 2.703369140625, 2.9327392578125, 3.162109375, 3.3914794921875, 3.620849609375, 3.8502197265625, 4.07958984375, 4.3089599609375, 4.538330078125, 4.7677001953125, 4.9970703125, 5.2264404296875, 5.455810546875, 5.6851806640625, 5.91455078125, 6.1439208984375, 6.373291015625, 6.6026611328125, 6.83203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 10.0, 12.0, 16.0, 13.0, 16.0, 25.0, 28.0, 36.0, 33.0, 44.0, 40.0, 49.0, 67.0, 43.0, 62.0, 56.0, 70.0, 57.0, 52.0, 37.0, 45.0, 34.0, 38.0, 25.0, 27.0, 18.0, 6.0, 11.0, 11.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.47845458984375, -5.3123779296875, -5.14630126953125, -4.980224609375, -4.81414794921875, -4.6480712890625, -4.48199462890625, -4.31591796875, -4.14984130859375, -3.9837646484375, -3.81768798828125, -3.651611328125, -3.48553466796875, -3.3194580078125, -3.15338134765625, -2.9873046875, -2.82122802734375, -2.6551513671875, -2.48907470703125, -2.322998046875, -2.15692138671875, -1.9908447265625, -1.82476806640625, -1.65869140625, -1.49261474609375, -1.3265380859375, -1.16046142578125, -0.994384765625, -0.82830810546875, -0.6622314453125, -0.49615478515625, -0.330078125, -0.16400146484375, 0.0020751953125, 0.16815185546875, 0.334228515625, 0.50030517578125, 0.6663818359375, 0.83245849609375, 0.99853515625, 1.16461181640625, 1.3306884765625, 1.49676513671875, 1.662841796875, 1.82891845703125, 1.9949951171875, 2.16107177734375, 2.3271484375, 2.49322509765625, 2.6593017578125, 2.82537841796875, 2.991455078125, 3.15753173828125, 3.3236083984375, 3.48968505859375, 3.65576171875, 3.82183837890625, 3.9879150390625, 4.15399169921875, 4.320068359375, 4.48614501953125, 4.6522216796875, 4.81829833984375, 4.984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 9.0, 5.0, 12.0, 13.0, 17.0, 31.0, 48.0, 71.0, 134.0, 219.0, 493.0, 898.0, 2059.0, 5669.0, 37052.0, 963520.0, 29456.0, 5098.0, 1859.0, 840.0, 428.0, 239.0, 140.0, 82.0, 59.0, 27.0, 22.0, 14.0, 13.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.43218994140625, -4.2432861328125, -4.05438232421875, -3.865478515625, -3.67657470703125, -3.4876708984375, -3.29876708984375, -3.10986328125, -2.92095947265625, -2.7320556640625, -2.54315185546875, -2.354248046875, -2.16534423828125, -1.9764404296875, -1.78753662109375, -1.5986328125, -1.40972900390625, -1.2208251953125, -1.03192138671875, -0.843017578125, -0.65411376953125, -0.4652099609375, -0.27630615234375, -0.08740234375, 0.10150146484375, 0.2904052734375, 0.47930908203125, 0.668212890625, 0.85711669921875, 1.0460205078125, 1.23492431640625, 1.423828125, 1.61273193359375, 1.8016357421875, 1.99053955078125, 2.179443359375, 2.36834716796875, 2.5572509765625, 2.74615478515625, 2.93505859375, 3.12396240234375, 3.3128662109375, 3.50177001953125, 3.690673828125, 3.87957763671875, 4.0684814453125, 4.25738525390625, 4.4462890625, 4.63519287109375, 4.8240966796875, 5.01300048828125, 5.201904296875, 5.39080810546875, 5.5797119140625, 5.76861572265625, 5.95751953125, 6.14642333984375, 6.3353271484375, 6.52423095703125, 6.713134765625, 6.90203857421875, 7.0909423828125, 7.27984619140625, 7.46875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 42.0, 85.0, 169.0, 306.0, 208.0, 81.0, 33.0, 16.0, 5.0, 11.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007257461547851562, -0.00070943683385849, -0.0006931275129318237, -0.0006768181920051575, -0.0006605088710784912, -0.000644199550151825, -0.0006278902292251587, -0.0006115809082984924, -0.0005952715873718262, -0.0005789622664451599, -0.0005626529455184937, -0.0005463436245918274, -0.0005300343036651611, -0.0005137249827384949, -0.0004974156618118286, -0.00048110634088516235, -0.0004647970199584961, -0.00044848769903182983, -0.0004321783781051636, -0.0004158690571784973, -0.00039955973625183105, -0.0003832504153251648, -0.00036694109439849854, -0.0003506317734718323, -0.000334322452545166, -0.00031801313161849976, -0.0003017038106918335, -0.00028539448976516724, -0.000269085168838501, -0.0002527758479118347, -0.00023646652698516846, -0.0002201572060585022, -0.00020384788513183594, -0.00018753856420516968, -0.00017122924327850342, -0.00015491992235183716, -0.0001386106014251709, -0.00012230128049850464, -0.00010599195957183838, -8.968263864517212e-05, -7.337331771850586e-05, -5.70639967918396e-05, -4.075467586517334e-05, -2.444535493850708e-05, -8.13603401184082e-06, 8.17328691482544e-06, 2.44826078414917e-05, 4.079192876815796e-05, 5.710124969482422e-05, 7.341057062149048e-05, 8.971989154815674e-05, 0.000106029212474823, 0.00012233853340148926, 0.00013864785432815552, 0.00015495717525482178, 0.00017126649618148804, 0.0001875758171081543, 0.00020388513803482056, 0.00022019445896148682, 0.00023650377988815308, 0.00025281310081481934, 0.0002691224217414856, 0.00028543174266815186, 0.0003017410635948181, 0.0003180503845214844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 14.0, 13.0, 36.0, 64.0, 140.0, 263.0, 530.0, 1314.0, 4138.0, 23714.0, 837813.0, 166161.0, 10310.0, 2419.0, 795.0, 399.0, 170.0, 100.0, 47.0, 32.0, 15.0, 17.0, 12.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.59429931640625, -4.4542236328125, -4.31414794921875, -4.174072265625, -4.03399658203125, -3.8939208984375, -3.75384521484375, -3.61376953125, -3.47369384765625, -3.3336181640625, -3.19354248046875, -3.053466796875, -2.91339111328125, -2.7733154296875, -2.63323974609375, -2.4931640625, -2.35308837890625, -2.2130126953125, -2.07293701171875, -1.932861328125, -1.79278564453125, -1.6527099609375, -1.51263427734375, -1.37255859375, -1.23248291015625, -1.0924072265625, -0.95233154296875, -0.812255859375, -0.67218017578125, -0.5321044921875, -0.39202880859375, -0.251953125, -0.11187744140625, 0.0281982421875, 0.16827392578125, 0.308349609375, 0.44842529296875, 0.5885009765625, 0.72857666015625, 0.86865234375, 1.00872802734375, 1.1488037109375, 1.28887939453125, 1.428955078125, 1.56903076171875, 1.7091064453125, 1.84918212890625, 1.9892578125, 2.12933349609375, 2.2694091796875, 2.40948486328125, 2.549560546875, 2.68963623046875, 2.8297119140625, 2.96978759765625, 3.10986328125, 3.24993896484375, 3.3900146484375, 3.53009033203125, 3.670166015625, 3.81024169921875, 3.9503173828125, 4.09039306640625, 4.23046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 7.0, 8.0, 8.0, 25.0, 31.0, 73.0, 162.0, 223.0, 199.0, 111.0, 48.0, 31.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.439453125, -3.3404541015625, -3.241455078125, -3.1424560546875, -3.04345703125, -2.9444580078125, -2.845458984375, -2.7464599609375, -2.6474609375, -2.5484619140625, -2.449462890625, -2.3504638671875, -2.25146484375, -2.1524658203125, -2.053466796875, -1.9544677734375, -1.85546875, -1.7564697265625, -1.657470703125, -1.5584716796875, -1.45947265625, -1.3604736328125, -1.261474609375, -1.1624755859375, -1.0634765625, -0.9644775390625, -0.865478515625, -0.7664794921875, -0.66748046875, -0.5684814453125, -0.469482421875, -0.3704833984375, -0.271484375, -0.1724853515625, -0.073486328125, 0.0255126953125, 0.12451171875, 0.2235107421875, 0.322509765625, 0.4215087890625, 0.5205078125, 0.6195068359375, 0.718505859375, 0.8175048828125, 0.91650390625, 1.0155029296875, 1.114501953125, 1.2135009765625, 1.3125, 1.4114990234375, 1.510498046875, 1.6094970703125, 1.70849609375, 1.8074951171875, 1.906494140625, 2.0054931640625, 2.1044921875, 2.2034912109375, 2.302490234375, 2.4014892578125, 2.50048828125, 2.5994873046875, 2.698486328125, 2.7974853515625, 2.896484375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 24.0, 52.0, 143.0, 330.0, 279.0, 111.0, 38.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.33234405517578, -37.259361267089844, -35.186378479003906, -33.11339569091797, -31.040416717529297, -28.96743392944336, -26.894451141357422, -24.821468353271484, -22.74848747253418, -20.675504684448242, -18.602523803710938, -16.529541015625, -14.456559181213379, -12.383577346801758, -10.31059455871582, -8.2376127243042, -6.164630889892578, -4.091649055480957, -2.0186667442321777, 0.05431556701660156, 2.1272974014282227, 4.200279235839844, 6.273262023925781, 8.346243858337402, 10.419225692749023, 12.492207527160645, 14.565189361572266, 16.638172149658203, 18.71115493774414, 20.784135818481445, 22.857118606567383, 24.930099487304688, 27.003082275390625, 29.076065063476562, 31.149045944213867, 33.22203063964844, 35.29500961303711, 37.36799240112305, 39.440975189208984, 41.51395797729492, 43.586936950683594, 45.65991973876953, 47.73290252685547, 49.805885314941406, 51.87886428833008, 53.951847076416016, 56.02482986450195, 58.09781265258789, 60.17079544067383, 62.243778228759766, 64.31675720214844, 66.38973999023438, 68.46272277832031, 70.53570556640625, 72.60868835449219, 74.68167114257812, 76.75465393066406, 78.82763671875, 80.90061950683594, 82.97360229492188, 85.04658508300781, 87.11956787109375, 89.19255065917969, 91.2655258178711, 93.33850860595703]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 3.0, 6.0, 13.0, 7.0, 10.0, 13.0, 15.0, 24.0, 33.0, 38.0, 25.0, 54.0, 44.0, 55.0, 65.0, 74.0, 48.0, 49.0, 51.0, 53.0, 53.0, 47.0, 52.0, 34.0, 33.0, 22.0, 20.0, 18.0, 8.0, 8.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.87354278564453, -24.869884490966797, -23.866228103637695, -22.86256980895996, -21.85891342163086, -20.855255126953125, -19.85159683227539, -18.84794044494629, -17.844284057617188, -16.840625762939453, -15.836969375610352, -14.833311080932617, -13.829654693603516, -12.825996398925781, -11.822339057922363, -10.818681716918945, -9.815023422241211, -8.811366081237793, -7.807708740234375, -6.804050922393799, -5.800393581390381, -4.796736240386963, -3.7930784225463867, -2.7894210815429688, -1.7857637405395508, -0.7821062803268433, 0.22155117988586426, 1.2252087593078613, 2.2288661003112793, 3.2325234413146973, 4.236181259155273, 5.239838600158691, 6.243495941162109, 7.247153282165527, 8.250810623168945, 9.25446891784668, 10.258125305175781, 11.261783599853516, 12.265440940856934, 13.269098281860352, 14.27275562286377, 15.276412963867188, 16.280071258544922, 17.283727645874023, 18.287385940551758, 19.29104232788086, 20.294700622558594, 21.298358917236328, 22.30201530456543, 23.305673599243164, 24.309329986572266, 25.31298828125, 26.3166446685791, 27.320302963256836, 28.323959350585938, 29.327617645263672, 30.331275939941406, 31.33493423461914, 32.338592529296875, 33.342247009277344, 34.34590530395508, 35.34956359863281, 36.35322189331055, 37.35688018798828, 38.36053466796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 5.0, 10.0, 6.0, 10.0, 15.0, 23.0, 30.0, 40.0, 61.0, 116.0, 168.0, 363.0, 707.0, 1641.0, 5440.0, 37384.0, 4027779.0, 106448.0, 9997.0, 2395.0, 838.0, 352.0, 205.0, 99.0, 59.0, 21.0, 25.0, 17.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.8203125, -9.578857421875, -9.33740234375, -9.095947265625, -8.8544921875, -8.613037109375, -8.37158203125, -8.130126953125, -7.888671875, -7.647216796875, -7.40576171875, -7.164306640625, -6.9228515625, -6.681396484375, -6.43994140625, -6.198486328125, -5.95703125, -5.715576171875, -5.47412109375, -5.232666015625, -4.9912109375, -4.749755859375, -4.50830078125, -4.266845703125, -4.025390625, -3.783935546875, -3.54248046875, -3.301025390625, -3.0595703125, -2.818115234375, -2.57666015625, -2.335205078125, -2.09375, -1.852294921875, -1.61083984375, -1.369384765625, -1.1279296875, -0.886474609375, -0.64501953125, -0.403564453125, -0.162109375, 0.079345703125, 0.32080078125, 0.562255859375, 0.8037109375, 1.045166015625, 1.28662109375, 1.528076171875, 1.76953125, 2.010986328125, 2.25244140625, 2.493896484375, 2.7353515625, 2.976806640625, 3.21826171875, 3.459716796875, 3.701171875, 3.942626953125, 4.18408203125, 4.425537109375, 4.6669921875, 4.908447265625, 5.14990234375, 5.391357421875, 5.6328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 9.0, 15.0, 33.0, 47.0, 62.0, 105.0, 111.0, 116.0, 117.0, 124.0, 83.0, 65.0, 49.0, 21.0, 21.0, 15.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.3409576416015625, -2.275665283203125, -2.2103729248046875, -2.14508056640625, -2.0797882080078125, -2.014495849609375, -1.9492034912109375, -1.8839111328125, -1.8186187744140625, -1.753326416015625, -1.6880340576171875, -1.62274169921875, -1.5574493408203125, -1.492156982421875, -1.4268646240234375, -1.361572265625, -1.2962799072265625, -1.230987548828125, -1.1656951904296875, -1.10040283203125, -1.0351104736328125, -0.969818115234375, -0.9045257568359375, -0.8392333984375, -0.7739410400390625, -0.708648681640625, -0.6433563232421875, -0.57806396484375, -0.5127716064453125, -0.447479248046875, -0.3821868896484375, -0.31689453125, -0.2516021728515625, -0.186309814453125, -0.1210174560546875, -0.05572509765625, 0.0095672607421875, 0.074859619140625, 0.1401519775390625, 0.2054443359375, 0.2707366943359375, 0.336029052734375, 0.4013214111328125, 0.46661376953125, 0.5319061279296875, 0.597198486328125, 0.6624908447265625, 0.727783203125, 0.7930755615234375, 0.858367919921875, 0.9236602783203125, 0.98895263671875, 1.0542449951171875, 1.119537353515625, 1.1848297119140625, 1.2501220703125, 1.3154144287109375, 1.380706787109375, 1.4459991455078125, 1.51129150390625, 1.5765838623046875, 1.641876220703125, 1.7071685791015625, 1.7724609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 11.0, 11.0, 19.0, 25.0, 44.0, 80.0, 131.0, 239.0, 609.0, 1385.0, 4407.0, 21766.0, 3003017.0, 1135343.0, 20454.0, 4328.0, 1252.0, 514.0, 291.0, 136.0, 80.0, 45.0, 39.0, 17.0, 17.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.086669921875, -5.82177734375, -5.556884765625, -5.2919921875, -5.027099609375, -4.76220703125, -4.497314453125, -4.232421875, -3.967529296875, -3.70263671875, -3.437744140625, -3.1728515625, -2.907958984375, -2.64306640625, -2.378173828125, -2.11328125, -1.848388671875, -1.58349609375, -1.318603515625, -1.0537109375, -0.788818359375, -0.52392578125, -0.259033203125, 0.005859375, 0.270751953125, 0.53564453125, 0.800537109375, 1.0654296875, 1.330322265625, 1.59521484375, 1.860107421875, 2.125, 2.389892578125, 2.65478515625, 2.919677734375, 3.1845703125, 3.449462890625, 3.71435546875, 3.979248046875, 4.244140625, 4.509033203125, 4.77392578125, 5.038818359375, 5.3037109375, 5.568603515625, 5.83349609375, 6.098388671875, 6.36328125, 6.628173828125, 6.89306640625, 7.157958984375, 7.4228515625, 7.687744140625, 7.95263671875, 8.217529296875, 8.482421875, 8.747314453125, 9.01220703125, 9.277099609375, 9.5419921875, 9.806884765625, 10.07177734375, 10.336669921875, 10.6015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 9.0, 12.0, 26.0, 58.0, 115.0, 567.0, 2839.0, 242.0, 87.0, 46.0, 18.0, 12.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4630126953125, -2.361572265625, -2.2601318359375, -2.15869140625, -2.0572509765625, -1.955810546875, -1.8543701171875, -1.7529296875, -1.6514892578125, -1.550048828125, -1.4486083984375, -1.34716796875, -1.2457275390625, -1.144287109375, -1.0428466796875, -0.94140625, -0.8399658203125, -0.738525390625, -0.6370849609375, -0.53564453125, -0.4342041015625, -0.332763671875, -0.2313232421875, -0.1298828125, -0.0284423828125, 0.072998046875, 0.1744384765625, 0.27587890625, 0.3773193359375, 0.478759765625, 0.5802001953125, 0.681640625, 0.7830810546875, 0.884521484375, 0.9859619140625, 1.08740234375, 1.1888427734375, 1.290283203125, 1.3917236328125, 1.4931640625, 1.5946044921875, 1.696044921875, 1.7974853515625, 1.89892578125, 2.0003662109375, 2.101806640625, 2.2032470703125, 2.3046875, 2.4061279296875, 2.507568359375, 2.6090087890625, 2.71044921875, 2.8118896484375, 2.913330078125, 3.0147705078125, 3.1162109375, 3.2176513671875, 3.319091796875, 3.4205322265625, 3.52197265625, 3.6234130859375, 3.724853515625, 3.8262939453125, 3.927734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 11.0, 104.0, 598.0, 253.0, 40.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.666475296020508, -16.371662139892578, -15.076849937438965, -13.782037734985352, -12.487224578857422, -11.192411422729492, -9.897599220275879, -8.602787017822266, -7.307973861694336, -6.0131611824035645, -4.718348503112793, -3.4235358238220215, -2.12872314453125, -0.8339104652404785, 0.46090221405029297, 1.7557144165039062, 3.050527572631836, 4.345340251922607, 5.640152931213379, 6.93496561050415, 8.229778289794922, 9.524591445922852, 10.819403648376465, 12.114215850830078, 13.409029006958008, 14.703842163085938, 15.99865436553955, 17.293466567993164, 18.588279724121094, 19.883092880249023, 21.177906036376953, 22.47271728515625, 23.767532348632812, 25.062345504760742, 26.357158660888672, 27.65196990966797, 28.9467830657959, 30.241596221923828, 31.536407470703125, 32.83122253417969, 34.126033782958984, 35.42084503173828, 36.715660095214844, 38.01047134399414, 39.30528259277344, 40.60009765625, 41.8949089050293, 43.189720153808594, 44.484535217285156, 45.77934646606445, 47.074161529541016, 48.36897277832031, 49.663787841796875, 50.95859909057617, 52.25341033935547, 53.54822540283203, 54.84303665161133, 56.137847900390625, 57.43266296386719, 58.727474212646484, 60.02228546142578, 61.317100524902344, 62.61191177368164, 63.90672302246094, 65.2015380859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 14.0, 19.0, 7.0, 16.0, 17.0, 21.0, 17.0, 25.0, 23.0, 26.0, 30.0, 21.0, 41.0, 31.0, 31.0, 46.0, 36.0, 35.0, 40.0, 36.0, 35.0, 37.0, 30.0, 39.0, 42.0, 29.0, 34.0, 28.0, 23.0, 17.0, 21.0, 26.0, 16.0, 11.0, 8.0, 8.0, 8.0, 4.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.686957359313965, -5.52431058883667, -5.361663341522217, -5.199016571044922, -5.036369800567627, -4.873723030090332, -4.711075782775879, -4.548429012298584, -4.385782241821289, -4.223135471343994, -4.060488224029541, -3.897841453552246, -3.735194683074951, -3.572547674179077, -3.409900665283203, -3.247253894805908, -3.084606647491455, -2.921959638595581, -2.759312868118286, -2.596665859222412, -2.434019088745117, -2.271372079849243, -2.108725070953369, -1.9460781812667847, -1.7834312915802002, -1.6207844018936157, -1.4581375122070312, -1.2954905033111572, -1.1328436136245728, -0.9701967239379883, -0.807549774646759, -0.6449028253555298, -0.4822559356689453, -0.31960901618003845, -0.1569620966911316, 0.0056848227977752686, 0.16833174228668213, 0.3309786319732666, 0.49362558126449585, 0.6562725305557251, 0.8189194202423096, 0.981566309928894, 1.1442131996154785, 1.3068602085113525, 1.469507098197937, 1.6321539878845215, 1.7948009967803955, 1.95744788646698, 2.1200947761535645, 2.2827417850494385, 2.4453885555267334, 2.6080355644226074, 2.7706823348999023, 2.9333293437957764, 3.0959763526916504, 3.2586231231689453, 3.4212701320648193, 3.5839171409606934, 3.7465639114379883, 3.9092109203338623, 4.071857929229736, 4.234504699707031, 4.397151470184326, 4.559798717498779, 4.722445487976074]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 8.0, 18.0, 20.0, 27.0, 33.0, 52.0, 68.0, 90.0, 144.0, 197.0, 347.0, 601.0, 1070.0, 2316.0, 5606.0, 17574.0, 74816.0, 445608.0, 405618.0, 67875.0, 16481.0, 5296.0, 2198.0, 983.0, 525.0, 277.0, 208.0, 136.0, 84.0, 85.0, 43.0, 32.0, 19.0, 16.0, 18.0, 10.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.44921875, -5.26739501953125, -5.0855712890625, -4.90374755859375, -4.721923828125, -4.54010009765625, -4.3582763671875, -4.17645263671875, -3.99462890625, -3.81280517578125, -3.6309814453125, -3.44915771484375, -3.267333984375, -3.08551025390625, -2.9036865234375, -2.72186279296875, -2.5400390625, -2.35821533203125, -2.1763916015625, -1.99456787109375, -1.812744140625, -1.63092041015625, -1.4490966796875, -1.26727294921875, -1.08544921875, -0.90362548828125, -0.7218017578125, -0.53997802734375, -0.358154296875, -0.17633056640625, 0.0054931640625, 0.18731689453125, 0.369140625, 0.55096435546875, 0.7327880859375, 0.91461181640625, 1.096435546875, 1.27825927734375, 1.4600830078125, 1.64190673828125, 1.82373046875, 2.00555419921875, 2.1873779296875, 2.36920166015625, 2.551025390625, 2.73284912109375, 2.9146728515625, 3.09649658203125, 3.2783203125, 3.46014404296875, 3.6419677734375, 3.82379150390625, 4.005615234375, 4.18743896484375, 4.3692626953125, 4.55108642578125, 4.73291015625, 4.91473388671875, 5.0965576171875, 5.27838134765625, 5.460205078125, 5.64202880859375, 5.8238525390625, 6.00567626953125, 6.1875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 7.0, 7.0, 19.0, 34.0, 44.0, 71.0, 104.0, 93.0, 133.0, 112.0, 100.0, 88.0, 78.0, 36.0, 34.0, 16.0, 18.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.34649658203125, -2.2828369140625, -2.21917724609375, -2.155517578125, -2.09185791015625, -2.0281982421875, -1.96453857421875, -1.90087890625, -1.83721923828125, -1.7735595703125, -1.70989990234375, -1.646240234375, -1.58258056640625, -1.5189208984375, -1.45526123046875, -1.3916015625, -1.32794189453125, -1.2642822265625, -1.20062255859375, -1.136962890625, -1.07330322265625, -1.0096435546875, -0.94598388671875, -0.88232421875, -0.81866455078125, -0.7550048828125, -0.69134521484375, -0.627685546875, -0.56402587890625, -0.5003662109375, -0.43670654296875, -0.373046875, -0.30938720703125, -0.2457275390625, -0.18206787109375, -0.118408203125, -0.05474853515625, 0.0089111328125, 0.07257080078125, 0.13623046875, 0.19989013671875, 0.2635498046875, 0.32720947265625, 0.390869140625, 0.45452880859375, 0.5181884765625, 0.58184814453125, 0.6455078125, 0.70916748046875, 0.7728271484375, 0.83648681640625, 0.900146484375, 0.96380615234375, 1.0274658203125, 1.09112548828125, 1.15478515625, 1.21844482421875, 1.2821044921875, 1.34576416015625, 1.409423828125, 1.47308349609375, 1.5367431640625, 1.60040283203125, 1.6640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 8.0, 14.0, 11.0, 16.0, 17.0, 29.0, 29.0, 38.0, 54.0, 68.0, 100.0, 126.0, 188.0, 315.0, 546.0, 1033.0, 2043.0, 4481.0, 11827.0, 34421.0, 126937.0, 502262.0, 269437.0, 61784.0, 19431.0, 7065.0, 2997.0, 1331.0, 665.0, 353.0, 258.0, 179.0, 131.0, 82.0, 66.0, 49.0, 43.0, 27.0, 20.0, 17.0, 12.0, 11.0, 8.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.5546875, -4.41119384765625, -4.2677001953125, -4.12420654296875, -3.980712890625, -3.83721923828125, -3.6937255859375, -3.55023193359375, -3.40673828125, -3.26324462890625, -3.1197509765625, -2.97625732421875, -2.832763671875, -2.68927001953125, -2.5457763671875, -2.40228271484375, -2.2587890625, -2.11529541015625, -1.9718017578125, -1.82830810546875, -1.684814453125, -1.54132080078125, -1.3978271484375, -1.25433349609375, -1.11083984375, -0.96734619140625, -0.8238525390625, -0.68035888671875, -0.536865234375, -0.39337158203125, -0.2498779296875, -0.10638427734375, 0.037109375, 0.18060302734375, 0.3240966796875, 0.46759033203125, 0.611083984375, 0.75457763671875, 0.8980712890625, 1.04156494140625, 1.18505859375, 1.32855224609375, 1.4720458984375, 1.61553955078125, 1.759033203125, 1.90252685546875, 2.0460205078125, 2.18951416015625, 2.3330078125, 2.47650146484375, 2.6199951171875, 2.76348876953125, 2.906982421875, 3.05047607421875, 3.1939697265625, 3.33746337890625, 3.48095703125, 3.62445068359375, 3.7679443359375, 3.91143798828125, 4.054931640625, 4.19842529296875, 4.3419189453125, 4.48541259765625, 4.62890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 7.0, 11.0, 17.0, 15.0, 23.0, 36.0, 32.0, 42.0, 37.0, 49.0, 35.0, 48.0, 48.0, 49.0, 39.0, 49.0, 45.0, 50.0, 24.0, 47.0, 37.0, 35.0, 26.0, 17.0, 24.0, 21.0, 13.0, 25.0, 8.0, 9.0, 10.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.68359375, -4.5411376953125, -4.398681640625, -4.2562255859375, -4.11376953125, -3.9713134765625, -3.828857421875, -3.6864013671875, -3.5439453125, -3.4014892578125, -3.259033203125, -3.1165771484375, -2.97412109375, -2.8316650390625, -2.689208984375, -2.5467529296875, -2.404296875, -2.2618408203125, -2.119384765625, -1.9769287109375, -1.83447265625, -1.6920166015625, -1.549560546875, -1.4071044921875, -1.2646484375, -1.1221923828125, -0.979736328125, -0.8372802734375, -0.69482421875, -0.5523681640625, -0.409912109375, -0.2674560546875, -0.125, 0.0174560546875, 0.159912109375, 0.3023681640625, 0.44482421875, 0.5872802734375, 0.729736328125, 0.8721923828125, 1.0146484375, 1.1571044921875, 1.299560546875, 1.4420166015625, 1.58447265625, 1.7269287109375, 1.869384765625, 2.0118408203125, 2.154296875, 2.2967529296875, 2.439208984375, 2.5816650390625, 2.72412109375, 2.8665771484375, 3.009033203125, 3.1514892578125, 3.2939453125, 3.4364013671875, 3.578857421875, 3.7213134765625, 3.86376953125, 4.0062255859375, 4.148681640625, 4.2911376953125, 4.43359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 16.0, 18.0, 20.0, 28.0, 44.0, 75.0, 115.0, 167.0, 288.0, 563.0, 1154.0, 2595.0, 6450.0, 21239.0, 232126.0, 723258.0, 43509.0, 9929.0, 3602.0, 1579.0, 748.0, 374.0, 222.0, 129.0, 110.0, 58.0, 42.0, 26.0, 15.0, 9.0, 4.0, 11.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.30078125, -3.20428466796875, -3.1077880859375, -3.01129150390625, -2.914794921875, -2.81829833984375, -2.7218017578125, -2.62530517578125, -2.52880859375, -2.43231201171875, -2.3358154296875, -2.23931884765625, -2.142822265625, -2.04632568359375, -1.9498291015625, -1.85333251953125, -1.7568359375, -1.66033935546875, -1.5638427734375, -1.46734619140625, -1.370849609375, -1.27435302734375, -1.1778564453125, -1.08135986328125, -0.98486328125, -0.88836669921875, -0.7918701171875, -0.69537353515625, -0.598876953125, -0.50238037109375, -0.4058837890625, -0.30938720703125, -0.212890625, -0.11639404296875, -0.0198974609375, 0.07659912109375, 0.173095703125, 0.26959228515625, 0.3660888671875, 0.46258544921875, 0.55908203125, 0.65557861328125, 0.7520751953125, 0.84857177734375, 0.945068359375, 1.04156494140625, 1.1380615234375, 1.23455810546875, 1.3310546875, 1.42755126953125, 1.5240478515625, 1.62054443359375, 1.717041015625, 1.81353759765625, 1.9100341796875, 2.00653076171875, 2.10302734375, 2.19952392578125, 2.2960205078125, 2.39251708984375, 2.489013671875, 2.58551025390625, 2.6820068359375, 2.77850341796875, 2.875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 7.0, 7.0, 16.0, 28.0, 60.0, 114.0, 177.0, 202.0, 163.0, 108.0, 67.0, 22.0, 16.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003464221954345703, -0.00033332034945487976, -0.0003202185034751892, -0.00030711665749549866, -0.0002940148115158081, -0.00028091296553611755, -0.000267811119556427, -0.00025470927357673645, -0.0002416074275970459, -0.00022850558161735535, -0.0002154037356376648, -0.00020230188965797424, -0.0001892000436782837, -0.00017609819769859314, -0.0001629963517189026, -0.00014989450573921204, -0.00013679265975952148, -0.00012369081377983093, -0.00011058896780014038, -9.748712182044983e-05, -8.438527584075928e-05, -7.128342986106873e-05, -5.8181583881378174e-05, -4.507973790168762e-05, -3.197789192199707e-05, -1.887604594230652e-05, -5.774199962615967e-06, 7.327646017074585e-06, 2.0429491996765137e-05, 3.353133797645569e-05, 4.663318395614624e-05, 5.973502993583679e-05, 7.283687591552734e-05, 8.59387218952179e-05, 9.904056787490845e-05, 0.000112142413854599, 0.00012524425983428955, 0.0001383461058139801, 0.00015144795179367065, 0.0001645497977733612, 0.00017765164375305176, 0.0001907534897327423, 0.00020385533571243286, 0.0002169571816921234, 0.00023005902767181396, 0.00024316087365150452, 0.00025626271963119507, 0.0002693645656108856, 0.00028246641159057617, 0.0002955682575702667, 0.0003086701035499573, 0.00032177194952964783, 0.0003348737955093384, 0.00034797564148902893, 0.0003610774874687195, 0.00037417933344841003, 0.0003872811794281006, 0.00040038302540779114, 0.0004134848713874817, 0.00042658671736717224, 0.0004396885633468628, 0.00045279040932655334, 0.0004658922553062439, 0.00047899410128593445, 0.000492095947265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 16.0, 16.0, 20.0, 31.0, 25.0, 46.0, 72.0, 133.0, 237.0, 524.0, 1205.0, 2924.0, 8318.0, 36486.0, 444259.0, 499798.0, 40095.0, 8729.0, 3121.0, 1191.0, 583.0, 274.0, 139.0, 74.0, 64.0, 41.0, 37.0, 13.0, 10.0, 12.0, 10.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.431396484375, -2.35302734375, -2.274658203125, -2.1962890625, -2.117919921875, -2.03955078125, -1.961181640625, -1.8828125, -1.804443359375, -1.72607421875, -1.647705078125, -1.5693359375, -1.490966796875, -1.41259765625, -1.334228515625, -1.255859375, -1.177490234375, -1.09912109375, -1.020751953125, -0.9423828125, -0.864013671875, -0.78564453125, -0.707275390625, -0.62890625, -0.550537109375, -0.47216796875, -0.393798828125, -0.3154296875, -0.237060546875, -0.15869140625, -0.080322265625, -0.001953125, 0.076416015625, 0.15478515625, 0.233154296875, 0.3115234375, 0.389892578125, 0.46826171875, 0.546630859375, 0.625, 0.703369140625, 0.78173828125, 0.860107421875, 0.9384765625, 1.016845703125, 1.09521484375, 1.173583984375, 1.251953125, 1.330322265625, 1.40869140625, 1.487060546875, 1.5654296875, 1.643798828125, 1.72216796875, 1.800537109375, 1.87890625, 1.957275390625, 2.03564453125, 2.114013671875, 2.1923828125, 2.270751953125, 2.34912109375, 2.427490234375, 2.505859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 10.0, 11.0, 16.0, 20.0, 35.0, 51.0, 66.0, 88.0, 98.0, 108.0, 110.0, 92.0, 60.0, 42.0, 45.0, 25.0, 27.0, 16.0, 9.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6962890625, -1.638824462890625, -1.58135986328125, -1.523895263671875, -1.4664306640625, -1.408966064453125, -1.35150146484375, -1.294036865234375, -1.236572265625, -1.179107666015625, -1.12164306640625, -1.064178466796875, -1.0067138671875, -0.949249267578125, -0.89178466796875, -0.834320068359375, -0.77685546875, -0.719390869140625, -0.66192626953125, -0.604461669921875, -0.5469970703125, -0.489532470703125, -0.43206787109375, -0.374603271484375, -0.317138671875, -0.259674072265625, -0.20220947265625, -0.144744873046875, -0.0872802734375, -0.029815673828125, 0.02764892578125, 0.085113525390625, 0.142578125, 0.200042724609375, 0.25750732421875, 0.314971923828125, 0.3724365234375, 0.429901123046875, 0.48736572265625, 0.544830322265625, 0.602294921875, 0.659759521484375, 0.71722412109375, 0.774688720703125, 0.8321533203125, 0.889617919921875, 0.94708251953125, 1.004547119140625, 1.06201171875, 1.119476318359375, 1.17694091796875, 1.234405517578125, 1.2918701171875, 1.349334716796875, 1.40679931640625, 1.464263916015625, 1.521728515625, 1.579193115234375, 1.63665771484375, 1.694122314453125, 1.7515869140625, 1.809051513671875, 1.86651611328125, 1.923980712890625, 1.9814453125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 20.0, 31.0, 40.0, 62.0, 113.0, 145.0, 196.0, 167.0, 83.0, 54.0, 29.0, 23.0, 16.0, 3.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.765317916870117, -24.51405906677246, -23.262798309326172, -22.011539459228516, -20.760278701782227, -19.50901985168457, -18.25775909423828, -17.006500244140625, -15.755240440368652, -14.50398063659668, -13.252720832824707, -12.001461029052734, -10.750202178955078, -9.498941421508789, -8.247682571411133, -6.99642276763916, -5.7451629638671875, -4.493903160095215, -3.2426435947418213, -1.9913840293884277, -0.7401242256164551, 0.5111355781555176, 1.762394905090332, 3.0136547088623047, 4.264914512634277, 5.51617431640625, 6.767434120178223, 8.018693923950195, 9.269952774047852, 10.52121353149414, 11.772472381591797, 13.02373218536377, 14.27499008178711, 15.526249885559082, 16.777509689331055, 18.02876853942871, 19.280029296875, 20.531288146972656, 21.782546997070312, 23.0338077545166, 24.28506851196289, 25.536327362060547, 26.787588119506836, 28.038846969604492, 29.29010772705078, 30.541366577148438, 31.792625427246094, 33.04388427734375, 34.295143127441406, 35.54640197753906, 36.79766082763672, 38.04892349243164, 39.3001823425293, 40.55144119262695, 41.80270004272461, 43.05396270751953, 44.30522155761719, 45.556480407714844, 46.8077392578125, 48.05900192260742, 49.31026077270508, 50.561519622802734, 51.81277847290039, 53.06404113769531, 54.31529998779297]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 8.0, 8.0, 10.0, 14.0, 17.0, 18.0, 14.0, 27.0, 26.0, 27.0, 25.0, 39.0, 33.0, 45.0, 51.0, 54.0, 57.0, 55.0, 49.0, 53.0, 57.0, 42.0, 37.0, 29.0, 38.0, 27.0, 24.0, 15.0, 23.0, 20.0, 12.0, 15.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.067604064941406, -26.041175842285156, -25.014747619628906, -23.988319396972656, -22.961891174316406, -21.935462951660156, -20.909034729003906, -19.882606506347656, -18.856178283691406, -17.829750061035156, -16.803321838378906, -15.776893615722656, -14.750465393066406, -13.724037170410156, -12.697608947753906, -11.671180725097656, -10.644752502441406, -9.618324279785156, -8.591896057128906, -7.565467834472656, -6.539039611816406, -5.512611389160156, -4.486183166503906, -3.4597549438476562, -2.4333267211914062, -1.4068984985351562, -0.38047027587890625, 0.6459579467773438, 1.6723861694335938, 2.6988143920898438, 3.7252426147460938, 4.751670837402344, 5.778102874755859, 6.804531097412109, 7.830959320068359, 8.85738754272461, 9.88381576538086, 10.91024398803711, 11.93667221069336, 12.96310043334961, 13.98952865600586, 15.01595687866211, 16.04238510131836, 17.06881332397461, 18.09524154663086, 19.12166976928711, 20.14809799194336, 21.17452621459961, 22.20095443725586, 23.22738265991211, 24.25381088256836, 25.28023910522461, 26.30666732788086, 27.33309555053711, 28.35952377319336, 29.38595199584961, 30.41238021850586, 31.43880844116211, 32.46523666381836, 33.49166488647461, 34.51809310913086, 35.54452133178711, 36.57094955444336, 37.59737777709961, 38.62380599975586]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 4.0, 8.0, 3.0, 10.0, 16.0, 23.0, 26.0, 24.0, 35.0, 77.0, 140.0, 222.0, 410.0, 878.0, 1981.0, 5985.0, 34261.0, 3962197.0, 168029.0, 13859.0, 3402.0, 1333.0, 631.0, 342.0, 159.0, 92.0, 46.0, 19.0, 18.0, 7.0, 9.0, 6.0, 6.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.46795654296875, -8.2171630859375, -7.96636962890625, -7.715576171875, -7.46478271484375, -7.2139892578125, -6.96319580078125, -6.71240234375, -6.46160888671875, -6.2108154296875, -5.96002197265625, -5.709228515625, -5.45843505859375, -5.2076416015625, -4.95684814453125, -4.7060546875, -4.45526123046875, -4.2044677734375, -3.95367431640625, -3.702880859375, -3.45208740234375, -3.2012939453125, -2.95050048828125, -2.69970703125, -2.44891357421875, -2.1981201171875, -1.94732666015625, -1.696533203125, -1.44573974609375, -1.1949462890625, -0.94415283203125, -0.693359375, -0.44256591796875, -0.1917724609375, 0.05902099609375, 0.309814453125, 0.56060791015625, 0.8114013671875, 1.06219482421875, 1.31298828125, 1.56378173828125, 1.8145751953125, 2.06536865234375, 2.316162109375, 2.56695556640625, 2.8177490234375, 3.06854248046875, 3.3193359375, 3.57012939453125, 3.8209228515625, 4.07171630859375, 4.322509765625, 4.57330322265625, 4.8240966796875, 5.07489013671875, 5.32568359375, 5.57647705078125, 5.8272705078125, 6.07806396484375, 6.328857421875, 6.57965087890625, 6.8304443359375, 7.08123779296875, 7.33203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 13.0, 18.0, 31.0, 52.0, 76.0, 88.0, 95.0, 102.0, 128.0, 110.0, 91.0, 64.0, 46.0, 32.0, 26.0, 13.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.54229736328125, -2.4674072265625, -2.39251708984375, -2.317626953125, -2.24273681640625, -2.1678466796875, -2.09295654296875, -2.01806640625, -1.94317626953125, -1.8682861328125, -1.79339599609375, -1.718505859375, -1.64361572265625, -1.5687255859375, -1.49383544921875, -1.4189453125, -1.34405517578125, -1.2691650390625, -1.19427490234375, -1.119384765625, -1.04449462890625, -0.9696044921875, -0.89471435546875, -0.81982421875, -0.74493408203125, -0.6700439453125, -0.59515380859375, -0.520263671875, -0.44537353515625, -0.3704833984375, -0.29559326171875, -0.220703125, -0.14581298828125, -0.0709228515625, 0.00396728515625, 0.078857421875, 0.15374755859375, 0.2286376953125, 0.30352783203125, 0.37841796875, 0.45330810546875, 0.5281982421875, 0.60308837890625, 0.677978515625, 0.75286865234375, 0.8277587890625, 0.90264892578125, 0.9775390625, 1.05242919921875, 1.1273193359375, 1.20220947265625, 1.277099609375, 1.35198974609375, 1.4268798828125, 1.50177001953125, 1.57666015625, 1.65155029296875, 1.7264404296875, 1.80133056640625, 1.876220703125, 1.95111083984375, 2.0260009765625, 2.10089111328125, 2.17578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 12.0, 19.0, 25.0, 36.0, 64.0, 94.0, 150.0, 259.0, 348.0, 594.0, 1019.0, 1886.0, 3569.0, 8299.0, 24831.0, 140795.0, 3789540.0, 176475.0, 28283.0, 9179.0, 3959.0, 1999.0, 1079.0, 599.0, 424.0, 261.0, 154.0, 110.0, 60.0, 51.0, 31.0, 29.0, 18.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.00537109375, -3.8544921875, -3.70361328125, -3.552734375, -3.40185546875, -3.2509765625, -3.10009765625, -2.94921875, -2.79833984375, -2.6474609375, -2.49658203125, -2.345703125, -2.19482421875, -2.0439453125, -1.89306640625, -1.7421875, -1.59130859375, -1.4404296875, -1.28955078125, -1.138671875, -0.98779296875, -0.8369140625, -0.68603515625, -0.53515625, -0.38427734375, -0.2333984375, -0.08251953125, 0.068359375, 0.21923828125, 0.3701171875, 0.52099609375, 0.671875, 0.82275390625, 0.9736328125, 1.12451171875, 1.275390625, 1.42626953125, 1.5771484375, 1.72802734375, 1.87890625, 2.02978515625, 2.1806640625, 2.33154296875, 2.482421875, 2.63330078125, 2.7841796875, 2.93505859375, 3.0859375, 3.23681640625, 3.3876953125, 3.53857421875, 3.689453125, 3.84033203125, 3.9912109375, 4.14208984375, 4.29296875, 4.44384765625, 4.5947265625, 4.74560546875, 4.896484375, 5.04736328125, 5.1982421875, 5.34912109375, 5.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 0.0, 7.0, 11.0, 15.0, 22.0, 39.0, 49.0, 127.0, 279.0, 2379.0, 759.0, 163.0, 70.0, 48.0, 23.0, 20.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.658203125, -2.56903076171875, -2.4798583984375, -2.39068603515625, -2.301513671875, -2.21234130859375, -2.1231689453125, -2.03399658203125, -1.94482421875, -1.85565185546875, -1.7664794921875, -1.67730712890625, -1.588134765625, -1.49896240234375, -1.4097900390625, -1.32061767578125, -1.2314453125, -1.14227294921875, -1.0531005859375, -0.96392822265625, -0.874755859375, -0.78558349609375, -0.6964111328125, -0.60723876953125, -0.51806640625, -0.42889404296875, -0.3397216796875, -0.25054931640625, -0.161376953125, -0.07220458984375, 0.0169677734375, 0.10614013671875, 0.1953125, 0.28448486328125, 0.3736572265625, 0.46282958984375, 0.552001953125, 0.64117431640625, 0.7303466796875, 0.81951904296875, 0.90869140625, 0.99786376953125, 1.0870361328125, 1.17620849609375, 1.265380859375, 1.35455322265625, 1.4437255859375, 1.53289794921875, 1.6220703125, 1.71124267578125, 1.8004150390625, 1.88958740234375, 1.978759765625, 2.06793212890625, 2.1571044921875, 2.24627685546875, 2.33544921875, 2.42462158203125, 2.5137939453125, 2.60296630859375, 2.692138671875, 2.78131103515625, 2.8704833984375, 2.95965576171875, 3.048828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 19.0, 92.0, 414.0, 391.0, 67.0, 19.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.033733367919922, -20.808725357055664, -19.58371925354004, -18.35871124267578, -17.133705139160156, -15.908697128295898, -14.68368911743164, -13.4586820602417, -12.233675003051758, -11.008667945861816, -9.783660888671875, -8.558652877807617, -7.333645820617676, -6.108638763427734, -4.883631229400635, -3.658623695373535, -2.4336166381835938, -1.2086093425750732, 0.016397953033447266, 1.2414052486419678, 2.4664125442504883, 3.6914196014404297, 4.916427135467529, 6.141434669494629, 7.36644172668457, 8.591448783874512, 9.816455841064453, 11.041463851928711, 12.266470909118652, 13.491477966308594, 14.716485977172852, 15.941493034362793, 17.16650390625, 18.391511917114258, 19.616518020629883, 20.84152603149414, 22.066532135009766, 23.291540145874023, 24.51654815673828, 25.741554260253906, 26.966562271118164, 28.191570281982422, 29.416576385498047, 30.641584396362305, 31.866592407226562, 33.09159851074219, 34.31660461425781, 35.5416145324707, 36.76662063598633, 37.99162673950195, 39.216636657714844, 40.44164276123047, 41.666648864746094, 42.89165496826172, 44.11666488647461, 45.341670989990234, 46.566680908203125, 47.79168701171875, 49.01669692993164, 50.241703033447266, 51.46670913696289, 52.69171905517578, 53.916725158691406, 55.14173126220703, 56.366737365722656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 7.0, 9.0, 5.0, 14.0, 10.0, 15.0, 32.0, 36.0, 29.0, 33.0, 45.0, 43.0, 54.0, 59.0, 65.0, 69.0, 55.0, 65.0, 51.0, 45.0, 45.0, 44.0, 33.0, 40.0, 35.0, 16.0, 17.0, 6.0, 7.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296586990356445, -8.014235496520996, -7.731884002685547, -7.449532985687256, -7.167181491851807, -6.884829998016357, -6.602478981018066, -6.320127487182617, -6.037775993347168, -5.755424499511719, -5.4730730056762695, -5.1907219886779785, -4.908370494842529, -4.62601900100708, -4.343667984008789, -4.06131649017334, -3.7789649963378906, -3.4966135025024414, -3.2142622470855713, -2.931910991668701, -2.649559497833252, -2.3672080039978027, -2.0848567485809326, -1.802505373954773, -1.5201539993286133, -1.2378026247024536, -0.955451250076294, -0.6730998754501343, -0.3907485008239746, -0.10839712619781494, 0.17395424842834473, 0.4563056230545044, 0.7386579513549805, 1.0210093259811401, 1.3033607006072998, 1.5857120752334595, 1.8680634498596191, 2.1504149436950684, 2.4327661991119385, 2.7151174545288086, 2.997468948364258, 3.279820442199707, 3.562171697616577, 3.8445229530334473, 4.1268744468688965, 4.409225940704346, 4.691576957702637, 4.973928451538086, 5.256279945373535, 5.538631439208984, 5.820982933044434, 6.103333950042725, 6.385685443878174, 6.668036937713623, 6.950387954711914, 7.232739448547363, 7.5150909423828125, 7.797442436218262, 8.079793930053711, 8.36214542388916, 8.64449691772461, 8.926847457885742, 9.209198951721191, 9.49155044555664, 9.77390193939209]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 10.0, 17.0, 24.0, 30.0, 46.0, 54.0, 66.0, 128.0, 204.0, 291.0, 567.0, 1123.0, 2620.0, 7264.0, 24773.0, 128883.0, 739217.0, 109442.0, 22064.0, 6711.0, 2491.0, 1092.0, 528.0, 296.0, 182.0, 111.0, 75.0, 50.0, 43.0, 35.0, 14.0, 22.0, 13.0, 6.0, 4.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.37890625, -6.16949462890625, -5.9600830078125, -5.75067138671875, -5.541259765625, -5.33184814453125, -5.1224365234375, -4.91302490234375, -4.70361328125, -4.49420166015625, -4.2847900390625, -4.07537841796875, -3.865966796875, -3.65655517578125, -3.4471435546875, -3.23773193359375, -3.0283203125, -2.81890869140625, -2.6094970703125, -2.40008544921875, -2.190673828125, -1.98126220703125, -1.7718505859375, -1.56243896484375, -1.35302734375, -1.14361572265625, -0.9342041015625, -0.72479248046875, -0.515380859375, -0.30596923828125, -0.0965576171875, 0.11285400390625, 0.322265625, 0.53167724609375, 0.7410888671875, 0.95050048828125, 1.159912109375, 1.36932373046875, 1.5787353515625, 1.78814697265625, 1.99755859375, 2.20697021484375, 2.4163818359375, 2.62579345703125, 2.835205078125, 3.04461669921875, 3.2540283203125, 3.46343994140625, 3.6728515625, 3.88226318359375, 4.0916748046875, 4.30108642578125, 4.510498046875, 4.71990966796875, 4.9293212890625, 5.13873291015625, 5.34814453125, 5.55755615234375, 5.7669677734375, 5.97637939453125, 6.185791015625, 6.39520263671875, 6.6046142578125, 6.81402587890625, 7.0234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 20.0, 47.0, 64.0, 73.0, 93.0, 130.0, 123.0, 126.0, 85.0, 80.0, 55.0, 26.0, 33.0, 10.0, 9.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.592041015625, -2.51416015625, -2.436279296875, -2.3583984375, -2.280517578125, -2.20263671875, -2.124755859375, -2.046875, -1.968994140625, -1.89111328125, -1.813232421875, -1.7353515625, -1.657470703125, -1.57958984375, -1.501708984375, -1.423828125, -1.345947265625, -1.26806640625, -1.190185546875, -1.1123046875, -1.034423828125, -0.95654296875, -0.878662109375, -0.80078125, -0.722900390625, -0.64501953125, -0.567138671875, -0.4892578125, -0.411376953125, -0.33349609375, -0.255615234375, -0.177734375, -0.099853515625, -0.02197265625, 0.055908203125, 0.1337890625, 0.211669921875, 0.28955078125, 0.367431640625, 0.4453125, 0.523193359375, 0.60107421875, 0.678955078125, 0.7568359375, 0.834716796875, 0.91259765625, 0.990478515625, 1.068359375, 1.146240234375, 1.22412109375, 1.302001953125, 1.3798828125, 1.457763671875, 1.53564453125, 1.613525390625, 1.69140625, 1.769287109375, 1.84716796875, 1.925048828125, 2.0029296875, 2.080810546875, 2.15869140625, 2.236572265625, 2.314453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 17.0, 17.0, 18.0, 32.0, 43.0, 71.0, 120.0, 211.0, 354.0, 672.0, 1541.0, 4295.0, 15582.0, 88291.0, 786975.0, 122230.0, 19498.0, 5057.0, 1711.0, 808.0, 400.0, 221.0, 117.0, 77.0, 44.0, 41.0, 25.0, 22.0, 10.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -5.98846435546875, -5.7542724609375, -5.52008056640625, -5.285888671875, -5.05169677734375, -4.8175048828125, -4.58331298828125, -4.34912109375, -4.11492919921875, -3.8807373046875, -3.64654541015625, -3.412353515625, -3.17816162109375, -2.9439697265625, -2.70977783203125, -2.4755859375, -2.24139404296875, -2.0072021484375, -1.77301025390625, -1.538818359375, -1.30462646484375, -1.0704345703125, -0.83624267578125, -0.60205078125, -0.36785888671875, -0.1336669921875, 0.10052490234375, 0.334716796875, 0.56890869140625, 0.8031005859375, 1.03729248046875, 1.271484375, 1.50567626953125, 1.7398681640625, 1.97406005859375, 2.208251953125, 2.44244384765625, 2.6766357421875, 2.91082763671875, 3.14501953125, 3.37921142578125, 3.6134033203125, 3.84759521484375, 4.081787109375, 4.31597900390625, 4.5501708984375, 4.78436279296875, 5.0185546875, 5.25274658203125, 5.4869384765625, 5.72113037109375, 5.955322265625, 6.18951416015625, 6.4237060546875, 6.65789794921875, 6.89208984375, 7.12628173828125, 7.3604736328125, 7.59466552734375, 7.828857421875, 8.06304931640625, 8.2972412109375, 8.53143310546875, 8.765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 11.0, 14.0, 19.0, 17.0, 28.0, 33.0, 36.0, 36.0, 46.0, 56.0, 60.0, 78.0, 82.0, 68.0, 81.0, 61.0, 44.0, 44.0, 45.0, 33.0, 27.0, 18.0, 17.0, 13.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.49835205078125, -5.2818603515625, -5.06536865234375, -4.848876953125, -4.63238525390625, -4.4158935546875, -4.19940185546875, -3.98291015625, -3.76641845703125, -3.5499267578125, -3.33343505859375, -3.116943359375, -2.90045166015625, -2.6839599609375, -2.46746826171875, -2.2509765625, -2.03448486328125, -1.8179931640625, -1.60150146484375, -1.385009765625, -1.16851806640625, -0.9520263671875, -0.73553466796875, -0.51904296875, -0.30255126953125, -0.0860595703125, 0.13043212890625, 0.346923828125, 0.56341552734375, 0.7799072265625, 0.99639892578125, 1.212890625, 1.42938232421875, 1.6458740234375, 1.86236572265625, 2.078857421875, 2.29534912109375, 2.5118408203125, 2.72833251953125, 2.94482421875, 3.16131591796875, 3.3778076171875, 3.59429931640625, 3.810791015625, 4.02728271484375, 4.2437744140625, 4.46026611328125, 4.6767578125, 4.89324951171875, 5.1097412109375, 5.32623291015625, 5.542724609375, 5.75921630859375, 5.9757080078125, 6.19219970703125, 6.40869140625, 6.62518310546875, 6.8416748046875, 7.05816650390625, 7.274658203125, 7.49114990234375, 7.7076416015625, 7.92413330078125, 8.140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 16.0, 32.0, 77.0, 170.0, 461.0, 2336.0, 41966.0, 989578.0, 12017.0, 1289.0, 339.0, 139.0, 55.0, 24.0, 17.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.04998779296875, -7.8343505859375, -7.61871337890625, -7.403076171875, -7.18743896484375, -6.9718017578125, -6.75616455078125, -6.54052734375, -6.32489013671875, -6.1092529296875, -5.89361572265625, -5.677978515625, -5.46234130859375, -5.2467041015625, -5.03106689453125, -4.8154296875, -4.59979248046875, -4.3841552734375, -4.16851806640625, -3.952880859375, -3.73724365234375, -3.5216064453125, -3.30596923828125, -3.09033203125, -2.87469482421875, -2.6590576171875, -2.44342041015625, -2.227783203125, -2.01214599609375, -1.7965087890625, -1.58087158203125, -1.365234375, -1.14959716796875, -0.9339599609375, -0.71832275390625, -0.502685546875, -0.28704833984375, -0.0714111328125, 0.14422607421875, 0.35986328125, 0.57550048828125, 0.7911376953125, 1.00677490234375, 1.222412109375, 1.43804931640625, 1.6536865234375, 1.86932373046875, 2.0849609375, 2.30059814453125, 2.5162353515625, 2.73187255859375, 2.947509765625, 3.16314697265625, 3.3787841796875, 3.59442138671875, 3.81005859375, 4.02569580078125, 4.2413330078125, 4.45697021484375, 4.672607421875, 4.88824462890625, 5.1038818359375, 5.31951904296875, 5.53515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 7.0, 20.0, 28.0, 33.0, 42.0, 103.0, 201.0, 238.0, 118.0, 61.0, 40.0, 22.0, 27.0, 8.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027370452880859375, -0.00026428326964378357, -0.0002548620104789734, -0.0002454407513141632, -0.00023601949214935303, -0.00022659823298454285, -0.00021717697381973267, -0.00020775571465492249, -0.0001983344554901123, -0.00018891319632530212, -0.00017949193716049194, -0.00017007067799568176, -0.00016064941883087158, -0.0001512281596660614, -0.00014180690050125122, -0.00013238564133644104, -0.00012296438217163086, -0.00011354312300682068, -0.0001041218638420105, -9.470060467720032e-05, -8.527934551239014e-05, -7.585808634757996e-05, -6.643682718276978e-05, -5.7015568017959595e-05, -4.7594308853149414e-05, -3.8173049688339233e-05, -2.8751790523529053e-05, -1.9330531358718872e-05, -9.909272193908691e-06, -4.880130290985107e-07, 8.93324613571167e-06, 1.835450530052185e-05, 2.777576446533203e-05, 3.719702363014221e-05, 4.661828279495239e-05, 5.603954195976257e-05, 6.546080112457275e-05, 7.488206028938293e-05, 8.430331945419312e-05, 9.37245786190033e-05, 0.00010314583778381348, 0.00011256709694862366, 0.00012198835611343384, 0.00013140961527824402, 0.0001408308744430542, 0.00015025213360786438, 0.00015967339277267456, 0.00016909465193748474, 0.00017851591110229492, 0.0001879371702671051, 0.00019735842943191528, 0.00020677968859672546, 0.00021620094776153564, 0.00022562220692634583, 0.000235043466091156, 0.0002444647252559662, 0.00025388598442077637, 0.00026330724358558655, 0.00027272850275039673, 0.0002821497619152069, 0.0002915710210800171, 0.00030099228024482727, 0.00031041353940963745, 0.00031983479857444763, 0.0003292560577392578]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 20.0, 31.0, 66.0, 136.0, 234.0, 574.0, 5153.0, 906893.0, 131955.0, 2583.0, 477.0, 189.0, 94.0, 64.0, 40.0, 18.0, 7.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -6.98388671875, -6.7333984375, -6.48291015625, -6.232421875, -5.98193359375, -5.7314453125, -5.48095703125, -5.23046875, -4.97998046875, -4.7294921875, -4.47900390625, -4.228515625, -3.97802734375, -3.7275390625, -3.47705078125, -3.2265625, -2.97607421875, -2.7255859375, -2.47509765625, -2.224609375, -1.97412109375, -1.7236328125, -1.47314453125, -1.22265625, -0.97216796875, -0.7216796875, -0.47119140625, -0.220703125, 0.02978515625, 0.2802734375, 0.53076171875, 0.78125, 1.03173828125, 1.2822265625, 1.53271484375, 1.783203125, 2.03369140625, 2.2841796875, 2.53466796875, 2.78515625, 3.03564453125, 3.2861328125, 3.53662109375, 3.787109375, 4.03759765625, 4.2880859375, 4.53857421875, 4.7890625, 5.03955078125, 5.2900390625, 5.54052734375, 5.791015625, 6.04150390625, 6.2919921875, 6.54248046875, 6.79296875, 7.04345703125, 7.2939453125, 7.54443359375, 7.794921875, 8.04541015625, 8.2958984375, 8.54638671875, 8.796875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 12.0, 34.0, 51.0, 142.0, 564.0, 102.0, 48.0, 21.0, 14.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.22113037109375, -5.0438232421875, -4.86651611328125, -4.689208984375, -4.51190185546875, -4.3345947265625, -4.15728759765625, -3.97998046875, -3.80267333984375, -3.6253662109375, -3.44805908203125, -3.270751953125, -3.09344482421875, -2.9161376953125, -2.73883056640625, -2.5615234375, -2.38421630859375, -2.2069091796875, -2.02960205078125, -1.852294921875, -1.67498779296875, -1.4976806640625, -1.32037353515625, -1.14306640625, -0.96575927734375, -0.7884521484375, -0.61114501953125, -0.433837890625, -0.25653076171875, -0.0792236328125, 0.09808349609375, 0.275390625, 0.45269775390625, 0.6300048828125, 0.80731201171875, 0.984619140625, 1.16192626953125, 1.3392333984375, 1.51654052734375, 1.69384765625, 1.87115478515625, 2.0484619140625, 2.22576904296875, 2.403076171875, 2.58038330078125, 2.7576904296875, 2.93499755859375, 3.1123046875, 3.28961181640625, 3.4669189453125, 3.64422607421875, 3.821533203125, 3.99884033203125, 4.1761474609375, 4.35345458984375, 4.53076171875, 4.70806884765625, 4.8853759765625, 5.06268310546875, 5.239990234375, 5.41729736328125, 5.5946044921875, 5.77191162109375, 5.94921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 23.0, 26.0, 70.0, 196.0, 315.0, 229.0, 83.0, 33.0, 14.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.58467864990234, -64.49268341064453, -62.40068435668945, -60.308685302734375, -58.21669006347656, -56.124691009521484, -54.032691955566406, -51.940696716308594, -49.848697662353516, -47.75669860839844, -45.664703369140625, -43.57270431518555, -41.48070526123047, -39.388710021972656, -37.29671096801758, -35.2047119140625, -33.11271667480469, -31.020719528198242, -28.928722381591797, -26.83672332763672, -24.744726181030273, -22.652729034423828, -20.56072998046875, -18.468732833862305, -16.37673568725586, -14.284738540649414, -12.192740440368652, -10.10074234008789, -8.008745193481445, -5.916748046875, -3.8247499465942383, -1.7327518463134766, 0.3592529296875, 2.4512505531311035, 4.543248176574707, 6.6352458000183105, 8.727243423461914, 10.81924057006836, 12.911238670349121, 15.003236770629883, 17.095233917236328, 19.187231063842773, 21.27922821044922, 23.371227264404297, 25.463224411010742, 27.555221557617188, 29.647220611572266, 31.73921775817871, 33.831214904785156, 35.923213958740234, 38.01520919799805, 40.107208251953125, 42.19920349121094, 44.291202545166016, 46.383201599121094, 48.475196838378906, 50.567195892333984, 52.65919494628906, 54.751190185546875, 56.84318923950195, 58.93518829345703, 61.027183532714844, 63.11918258666992, 65.211181640625, 67.30317687988281]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 14.0, 22.0, 20.0, 23.0, 24.0, 35.0, 38.0, 42.0, 40.0, 47.0, 50.0, 53.0, 65.0, 58.0, 55.0, 49.0, 48.0, 49.0, 37.0, 39.0, 31.0, 28.0, 24.0, 23.0, 18.0, 11.0, 13.0, 3.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.08418846130371, -30.067859649658203, -29.051528930664062, -28.035200119018555, -27.018869400024414, -26.002540588378906, -24.986209869384766, -23.969881057739258, -22.95355224609375, -21.937223434448242, -20.9208927154541, -19.904563903808594, -18.888233184814453, -17.871904373168945, -16.855575561523438, -15.839244842529297, -14.822914123535156, -13.806584358215332, -12.790254592895508, -11.77392578125, -10.75759506225586, -9.741266250610352, -8.724936485290527, -7.708606719970703, -6.692276954650879, -5.675947189331055, -4.6596174240112305, -3.6432881355285645, -2.6269583702087402, -1.610628604888916, -0.59429931640625, 0.4220304489135742, 1.4383583068847656, 2.45468807220459, 3.471017599105835, 4.48734712600708, 5.503676891326904, 6.5200066566467285, 7.5363359451293945, 8.552665710449219, 9.568995475769043, 10.585325241088867, 11.601655006408691, 12.617984771728516, 13.634313583374023, 14.650644302368164, 15.666973114013672, 16.683303833007812, 17.69963264465332, 18.715961456298828, 19.73229217529297, 20.748620986938477, 21.764951705932617, 22.781280517578125, 23.797611236572266, 24.813940048217773, 25.83026885986328, 26.84659767150879, 27.86292839050293, 28.879257202148438, 29.895587921142578, 30.911916732788086, 31.928245544433594, 32.944576263427734, 33.960906982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 18.0, 21.0, 26.0, 51.0, 87.0, 128.0, 302.0, 616.0, 1646.0, 5346.0, 31541.0, 4074078.0, 68912.0, 7878.0, 2130.0, 780.0, 341.0, 139.0, 90.0, 48.0, 30.0, 13.0, 7.0, 10.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2286376953125, -9.894775390625, -9.5609130859375, -9.22705078125, -8.8931884765625, -8.559326171875, -8.2254638671875, -7.8916015625, -7.5577392578125, -7.223876953125, -6.8900146484375, -6.55615234375, -6.2222900390625, -5.888427734375, -5.5545654296875, -5.220703125, -4.8868408203125, -4.552978515625, -4.2191162109375, -3.88525390625, -3.5513916015625, -3.217529296875, -2.8836669921875, -2.5498046875, -2.2159423828125, -1.882080078125, -1.5482177734375, -1.21435546875, -0.8804931640625, -0.546630859375, -0.2127685546875, 0.12109375, 0.4549560546875, 0.788818359375, 1.1226806640625, 1.45654296875, 1.7904052734375, 2.124267578125, 2.4581298828125, 2.7919921875, 3.1258544921875, 3.459716796875, 3.7935791015625, 4.12744140625, 4.4613037109375, 4.795166015625, 5.1290283203125, 5.462890625, 5.7967529296875, 6.130615234375, 6.4644775390625, 6.79833984375, 7.1322021484375, 7.466064453125, 7.7999267578125, 8.1337890625, 8.4676513671875, 8.801513671875, 9.1353759765625, 9.46923828125, 9.8031005859375, 10.136962890625, 10.4708251953125, 10.8046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 11.0, 11.0, 24.0, 35.0, 50.0, 85.0, 97.0, 126.0, 138.0, 124.0, 107.0, 77.0, 58.0, 22.0, 14.0, 9.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.86822509765625, -2.7794189453125, -2.69061279296875, -2.601806640625, -2.51300048828125, -2.4241943359375, -2.33538818359375, -2.24658203125, -2.15777587890625, -2.0689697265625, -1.98016357421875, -1.891357421875, -1.80255126953125, -1.7137451171875, -1.62493896484375, -1.5361328125, -1.44732666015625, -1.3585205078125, -1.26971435546875, -1.180908203125, -1.09210205078125, -1.0032958984375, -0.91448974609375, -0.82568359375, -0.73687744140625, -0.6480712890625, -0.55926513671875, -0.470458984375, -0.38165283203125, -0.2928466796875, -0.20404052734375, -0.115234375, -0.02642822265625, 0.0623779296875, 0.15118408203125, 0.239990234375, 0.32879638671875, 0.4176025390625, 0.50640869140625, 0.59521484375, 0.68402099609375, 0.7728271484375, 0.86163330078125, 0.950439453125, 1.03924560546875, 1.1280517578125, 1.21685791015625, 1.3056640625, 1.39447021484375, 1.4832763671875, 1.57208251953125, 1.660888671875, 1.74969482421875, 1.8385009765625, 1.92730712890625, 2.01611328125, 2.10491943359375, 2.1937255859375, 2.28253173828125, 2.371337890625, 2.46014404296875, 2.5489501953125, 2.63775634765625, 2.7265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 10.0, 9.0, 11.0, 20.0, 24.0, 41.0, 52.0, 84.0, 112.0, 139.0, 183.0, 271.0, 377.0, 592.0, 944.0, 1708.0, 3527.0, 9149.0, 34443.0, 916496.0, 3168556.0, 38833.0, 9802.0, 3897.0, 1849.0, 1017.0, 642.0, 412.0, 291.0, 209.0, 164.0, 124.0, 72.0, 73.0, 47.0, 33.0, 29.0, 15.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.23828125, -6.0494384765625, -5.860595703125, -5.6717529296875, -5.48291015625, -5.2940673828125, -5.105224609375, -4.9163818359375, -4.7275390625, -4.5386962890625, -4.349853515625, -4.1610107421875, -3.97216796875, -3.7833251953125, -3.594482421875, -3.4056396484375, -3.216796875, -3.0279541015625, -2.839111328125, -2.6502685546875, -2.46142578125, -2.2725830078125, -2.083740234375, -1.8948974609375, -1.7060546875, -1.5172119140625, -1.328369140625, -1.1395263671875, -0.95068359375, -0.7618408203125, -0.572998046875, -0.3841552734375, -0.1953125, -0.0064697265625, 0.182373046875, 0.3712158203125, 0.56005859375, 0.7489013671875, 0.937744140625, 1.1265869140625, 1.3154296875, 1.5042724609375, 1.693115234375, 1.8819580078125, 2.07080078125, 2.2596435546875, 2.448486328125, 2.6373291015625, 2.826171875, 3.0150146484375, 3.203857421875, 3.3927001953125, 3.58154296875, 3.7703857421875, 3.959228515625, 4.1480712890625, 4.3369140625, 4.5257568359375, 4.714599609375, 4.9034423828125, 5.09228515625, 5.2811279296875, 5.469970703125, 5.6588134765625, 5.84765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 13.0, 12.0, 30.0, 46.0, 131.0, 859.0, 2675.0, 152.0, 57.0, 28.0, 22.0, 12.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.751953125, -3.638641357421875, -3.52532958984375, -3.412017822265625, -3.2987060546875, -3.185394287109375, -3.07208251953125, -2.958770751953125, -2.845458984375, -2.732147216796875, -2.61883544921875, -2.505523681640625, -2.3922119140625, -2.278900146484375, -2.16558837890625, -2.052276611328125, -1.93896484375, -1.825653076171875, -1.71234130859375, -1.599029541015625, -1.4857177734375, -1.372406005859375, -1.25909423828125, -1.145782470703125, -1.032470703125, -0.919158935546875, -0.80584716796875, -0.692535400390625, -0.5792236328125, -0.465911865234375, -0.35260009765625, -0.239288330078125, -0.1259765625, -0.012664794921875, 0.10064697265625, 0.213958740234375, 0.3272705078125, 0.440582275390625, 0.55389404296875, 0.667205810546875, 0.780517578125, 0.893829345703125, 1.00714111328125, 1.120452880859375, 1.2337646484375, 1.347076416015625, 1.46038818359375, 1.573699951171875, 1.68701171875, 1.800323486328125, 1.91363525390625, 2.026947021484375, 2.1402587890625, 2.253570556640625, 2.36688232421875, 2.480194091796875, 2.593505859375, 2.706817626953125, 2.82012939453125, 2.933441162109375, 3.0467529296875, 3.160064697265625, 3.27337646484375, 3.386688232421875, 3.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 17.0, 112.0, 602.0, 228.0, 45.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.793275833129883, -10.251688003540039, -8.710100173950195, -7.168511390686035, -5.626923561096191, -4.085335731506348, -2.5437469482421875, -1.0021591186523438, 0.5394287109375, 2.081016778945923, 3.6226048469543457, 5.164193153381348, 6.705780982971191, 8.247368812561035, 9.788957595825195, 11.330545425415039, 12.872133255004883, 14.413721084594727, 15.95530891418457, 17.496898651123047, 19.03848648071289, 20.580074310302734, 22.121662139892578, 23.663249969482422, 25.204837799072266, 26.74642562866211, 28.288013458251953, 29.829601287841797, 31.37118911743164, 32.912776947021484, 34.454368591308594, 35.99595642089844, 37.53754425048828, 39.079132080078125, 40.62071990966797, 42.16230773925781, 43.703895568847656, 45.2454833984375, 46.787071228027344, 48.32865905761719, 49.87024688720703, 51.411834716796875, 52.95342254638672, 54.49501037597656, 56.036598205566406, 57.57818603515625, 59.119773864746094, 60.66136169433594, 62.20295333862305, 63.74454116821289, 65.2861328125, 66.82772064208984, 68.36930847167969, 69.91089630126953, 71.45248413085938, 72.99407196044922, 74.53565979003906, 76.0772476196289, 77.61883544921875, 79.1604232788086, 80.70201110839844, 82.24359893798828, 83.78518676757812, 85.32677459716797, 86.86836242675781]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 2.0, 8.0, 10.0, 9.0, 24.0, 18.0, 28.0, 29.0, 35.0, 44.0, 43.0, 52.0, 61.0, 62.0, 45.0, 61.0, 36.0, 62.0, 49.0, 58.0, 43.0, 32.0, 37.0, 34.0, 27.0, 15.0, 12.0, 14.0, 16.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.504338264465332, -7.247499465942383, -6.990660190582275, -6.733821392059326, -6.476982116699219, -6.2201433181762695, -5.96330451965332, -5.706465244293213, -5.4496259689331055, -5.192787170410156, -4.935947895050049, -4.6791090965271, -4.422269821166992, -4.165431022644043, -3.9085919857025146, -3.6517529487609863, -3.394914150238037, -3.138075113296509, -2.8812360763549805, -2.6243972778320312, -2.367558002471924, -2.1107192039489746, -1.8538801670074463, -1.597041130065918, -1.3402020931243896, -1.0833630561828613, -0.8265240788459778, -0.5696851015090942, -0.3128460645675659, -0.0560070276260376, 0.20083189010620117, 0.4576709270477295, 0.7145099639892578, 0.9713490009307861, 1.2281880378723145, 1.4850269556045532, 1.7418659925460815, 1.9987050294876099, 2.2555439472198486, 2.512382984161377, 2.7692220211029053, 3.0260610580444336, 3.282900094985962, 3.5397391319274902, 3.7965779304504395, 4.053417205810547, 4.310256004333496, 4.567094802856445, 4.823934078216553, 5.080772876739502, 5.337612152099609, 5.594450950622559, 5.851290225982666, 6.108129024505615, 6.364968299865723, 6.621807098388672, 6.878645896911621, 7.13548469543457, 7.392323970794678, 7.649162769317627, 7.906002044677734, 8.162840843200684, 8.419679641723633, 8.676519393920898, 8.933358192443848]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 32.0, 50.0, 80.0, 162.0, 289.0, 864.0, 2897.0, 20344.0, 600293.0, 402599.0, 16870.0, 2606.0, 796.0, 296.0, 149.0, 68.0, 55.0, 24.0, 22.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.296875, -11.912109375, -11.52734375, -11.142578125, -10.7578125, -10.373046875, -9.98828125, -9.603515625, -9.21875, -8.833984375, -8.44921875, -8.064453125, -7.6796875, -7.294921875, -6.91015625, -6.525390625, -6.140625, -5.755859375, -5.37109375, -4.986328125, -4.6015625, -4.216796875, -3.83203125, -3.447265625, -3.0625, -2.677734375, -2.29296875, -1.908203125, -1.5234375, -1.138671875, -0.75390625, -0.369140625, 0.015625, 0.400390625, 0.78515625, 1.169921875, 1.5546875, 1.939453125, 2.32421875, 2.708984375, 3.09375, 3.478515625, 3.86328125, 4.248046875, 4.6328125, 5.017578125, 5.40234375, 5.787109375, 6.171875, 6.556640625, 6.94140625, 7.326171875, 7.7109375, 8.095703125, 8.48046875, 8.865234375, 9.25, 9.634765625, 10.01953125, 10.404296875, 10.7890625, 11.173828125, 11.55859375, 11.943359375, 12.328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 22.0, 26.0, 55.0, 70.0, 104.0, 141.0, 138.0, 125.0, 103.0, 81.0, 60.0, 27.0, 12.0, 9.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.969879150390625, -2.87530517578125, -2.780731201171875, -2.6861572265625, -2.591583251953125, -2.49700927734375, -2.402435302734375, -2.307861328125, -2.213287353515625, -2.11871337890625, -2.024139404296875, -1.9295654296875, -1.834991455078125, -1.74041748046875, -1.645843505859375, -1.55126953125, -1.456695556640625, -1.36212158203125, -1.267547607421875, -1.1729736328125, -1.078399658203125, -0.98382568359375, -0.889251708984375, -0.794677734375, -0.700103759765625, -0.60552978515625, -0.510955810546875, -0.4163818359375, -0.321807861328125, -0.22723388671875, -0.132659912109375, -0.0380859375, 0.056488037109375, 0.15106201171875, 0.245635986328125, 0.3402099609375, 0.434783935546875, 0.52935791015625, 0.623931884765625, 0.718505859375, 0.813079833984375, 0.90765380859375, 1.002227783203125, 1.0968017578125, 1.191375732421875, 1.28594970703125, 1.380523681640625, 1.47509765625, 1.569671630859375, 1.66424560546875, 1.758819580078125, 1.8533935546875, 1.947967529296875, 2.04254150390625, 2.137115478515625, 2.231689453125, 2.326263427734375, 2.42083740234375, 2.515411376953125, 2.6099853515625, 2.704559326171875, 2.79913330078125, 2.893707275390625, 2.98828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 11.0, 11.0, 18.0, 36.0, 20.0, 51.0, 77.0, 143.0, 260.0, 553.0, 1248.0, 2932.0, 7553.0, 22534.0, 91966.0, 689675.0, 179202.0, 34522.0, 10585.0, 3952.0, 1641.0, 738.0, 359.0, 154.0, 102.0, 56.0, 42.0, 19.0, 15.0, 13.0, 10.0, 13.0, 8.0, 1.0, 2.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.36920166015625, -6.1680908203125, -5.96697998046875, -5.765869140625, -5.56475830078125, -5.3636474609375, -5.16253662109375, -4.96142578125, -4.76031494140625, -4.5592041015625, -4.35809326171875, -4.156982421875, -3.95587158203125, -3.7547607421875, -3.55364990234375, -3.3525390625, -3.15142822265625, -2.9503173828125, -2.74920654296875, -2.548095703125, -2.34698486328125, -2.1458740234375, -1.94476318359375, -1.74365234375, -1.54254150390625, -1.3414306640625, -1.14031982421875, -0.939208984375, -0.73809814453125, -0.5369873046875, -0.33587646484375, -0.134765625, 0.06634521484375, 0.2674560546875, 0.46856689453125, 0.669677734375, 0.87078857421875, 1.0718994140625, 1.27301025390625, 1.47412109375, 1.67523193359375, 1.8763427734375, 2.07745361328125, 2.278564453125, 2.47967529296875, 2.6807861328125, 2.88189697265625, 3.0830078125, 3.28411865234375, 3.4852294921875, 3.68634033203125, 3.887451171875, 4.08856201171875, 4.2896728515625, 4.49078369140625, 4.69189453125, 4.89300537109375, 5.0941162109375, 5.29522705078125, 5.496337890625, 5.69744873046875, 5.8985595703125, 6.09967041015625, 6.30078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 5.0, 8.0, 17.0, 14.0, 20.0, 17.0, 22.0, 24.0, 41.0, 51.0, 49.0, 54.0, 49.0, 64.0, 60.0, 53.0, 57.0, 60.0, 48.0, 38.0, 38.0, 37.0, 30.0, 21.0, 18.0, 12.0, 19.0, 15.0, 7.0, 11.0, 13.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5511474609375, -5.360107421875, -5.1690673828125, -4.97802734375, -4.7869873046875, -4.595947265625, -4.4049072265625, -4.2138671875, -4.0228271484375, -3.831787109375, -3.6407470703125, -3.44970703125, -3.2586669921875, -3.067626953125, -2.8765869140625, -2.685546875, -2.4945068359375, -2.303466796875, -2.1124267578125, -1.92138671875, -1.7303466796875, -1.539306640625, -1.3482666015625, -1.1572265625, -0.9661865234375, -0.775146484375, -0.5841064453125, -0.39306640625, -0.2020263671875, -0.010986328125, 0.1800537109375, 0.37109375, 0.5621337890625, 0.753173828125, 0.9442138671875, 1.13525390625, 1.3262939453125, 1.517333984375, 1.7083740234375, 1.8994140625, 2.0904541015625, 2.281494140625, 2.4725341796875, 2.66357421875, 2.8546142578125, 3.045654296875, 3.2366943359375, 3.427734375, 3.6187744140625, 3.809814453125, 4.0008544921875, 4.19189453125, 4.3829345703125, 4.573974609375, 4.7650146484375, 4.9560546875, 5.1470947265625, 5.338134765625, 5.5291748046875, 5.72021484375, 5.9112548828125, 6.102294921875, 6.2933349609375, 6.484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 4.0, 9.0, 10.0, 17.0, 16.0, 26.0, 42.0, 46.0, 79.0, 130.0, 210.0, 378.0, 658.0, 1144.0, 2340.0, 5094.0, 12779.0, 43396.0, 304202.0, 584018.0, 64215.0, 17135.0, 6466.0, 2925.0, 1400.0, 730.0, 412.0, 252.0, 135.0, 89.0, 60.0, 34.0, 30.0, 19.0, 11.0, 13.0, 5.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7568359375, -1.7038116455078125, -1.650787353515625, -1.5977630615234375, -1.54473876953125, -1.4917144775390625, -1.438690185546875, -1.3856658935546875, -1.3326416015625, -1.2796173095703125, -1.226593017578125, -1.1735687255859375, -1.12054443359375, -1.0675201416015625, -1.014495849609375, -0.9614715576171875, -0.908447265625, -0.8554229736328125, -0.802398681640625, -0.7493743896484375, -0.69635009765625, -0.6433258056640625, -0.590301513671875, -0.5372772216796875, -0.4842529296875, -0.4312286376953125, -0.378204345703125, -0.3251800537109375, -0.27215576171875, -0.2191314697265625, -0.166107177734375, -0.1130828857421875, -0.06005859375, -0.0070343017578125, 0.045989990234375, 0.0990142822265625, 0.15203857421875, 0.2050628662109375, 0.258087158203125, 0.3111114501953125, 0.3641357421875, 0.4171600341796875, 0.470184326171875, 0.5232086181640625, 0.57623291015625, 0.6292572021484375, 0.682281494140625, 0.7353057861328125, 0.788330078125, 0.8413543701171875, 0.894378662109375, 0.9474029541015625, 1.00042724609375, 1.0534515380859375, 1.106475830078125, 1.1595001220703125, 1.2125244140625, 1.2655487060546875, 1.318572998046875, 1.3715972900390625, 1.42462158203125, 1.4776458740234375, 1.530670166015625, 1.5836944580078125, 1.63671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 16.0, 18.0, 19.0, 36.0, 40.0, 62.0, 104.0, 166.0, 151.0, 124.0, 74.0, 45.0, 26.0, 31.0, 14.0, 16.0, 9.0, 5.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021779164671897888, -0.0002102777361869812, -0.00020276382565498352, -0.00019524991512298584, -0.00018773600459098816, -0.00018022209405899048, -0.0001727081835269928, -0.00016519427299499512, -0.00015768036246299744, -0.00015016645193099976, -0.00014265254139900208, -0.0001351386308670044, -0.00012762472033500671, -0.00012011080980300903, -0.00011259689927101135, -0.00010508298873901367, -9.756907820701599e-05, -9.005516767501831e-05, -8.254125714302063e-05, -7.502734661102295e-05, -6.751343607902527e-05, -5.999952554702759e-05, -5.248561501502991e-05, -4.4971704483032227e-05, -3.7457793951034546e-05, -2.9943883419036865e-05, -2.2429972887039185e-05, -1.4916062355041504e-05, -7.402151823043823e-06, 1.1175870895385742e-07, 7.625669240951538e-06, 1.5139579772949219e-05, 2.26534903049469e-05, 3.016740083694458e-05, 3.768131136894226e-05, 4.519522190093994e-05, 5.270913243293762e-05, 6.02230429649353e-05, 6.773695349693298e-05, 7.525086402893066e-05, 8.276477456092834e-05, 9.027868509292603e-05, 9.77925956249237e-05, 0.00010530650615692139, 0.00011282041668891907, 0.00012033432722091675, 0.00012784823775291443, 0.0001353621482849121, 0.0001428760588169098, 0.00015038996934890747, 0.00015790387988090515, 0.00016541779041290283, 0.0001729317009449005, 0.0001804456114768982, 0.00018795952200889587, 0.00019547343254089355, 0.00020298734307289124, 0.00021050125360488892, 0.0002180151641368866, 0.00022552907466888428, 0.00023304298520088196, 0.00024055689573287964, 0.0002480708062648773, 0.000255584716796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 12.0, 28.0, 61.0, 85.0, 150.0, 412.0, 827.0, 2265.0, 7807.0, 59569.0, 880936.0, 82492.0, 9450.0, 2613.0, 989.0, 427.0, 173.0, 108.0, 64.0, 20.0, 10.0, 11.0, 12.0, 7.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.259765625, -3.162628173828125, -3.06549072265625, -2.968353271484375, -2.8712158203125, -2.774078369140625, -2.67694091796875, -2.579803466796875, -2.482666015625, -2.385528564453125, -2.28839111328125, -2.191253662109375, -2.0941162109375, -1.996978759765625, -1.89984130859375, -1.802703857421875, -1.70556640625, -1.608428955078125, -1.51129150390625, -1.414154052734375, -1.3170166015625, -1.219879150390625, -1.12274169921875, -1.025604248046875, -0.928466796875, -0.831329345703125, -0.73419189453125, -0.637054443359375, -0.5399169921875, -0.442779541015625, -0.34564208984375, -0.248504638671875, -0.1513671875, -0.054229736328125, 0.04290771484375, 0.140045166015625, 0.2371826171875, 0.334320068359375, 0.43145751953125, 0.528594970703125, 0.625732421875, 0.722869873046875, 0.82000732421875, 0.917144775390625, 1.0142822265625, 1.111419677734375, 1.20855712890625, 1.305694580078125, 1.40283203125, 1.499969482421875, 1.59710693359375, 1.694244384765625, 1.7913818359375, 1.888519287109375, 1.98565673828125, 2.082794189453125, 2.179931640625, 2.277069091796875, 2.37420654296875, 2.471343994140625, 2.5684814453125, 2.665618896484375, 2.76275634765625, 2.859893798828125, 2.95703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 9.0, 18.0, 23.0, 41.0, 44.0, 70.0, 98.0, 205.0, 175.0, 122.0, 53.0, 39.0, 24.0, 22.0, 15.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.029296875, -1.954254150390625, -1.87921142578125, -1.804168701171875, -1.7291259765625, -1.654083251953125, -1.57904052734375, -1.503997802734375, -1.428955078125, -1.353912353515625, -1.27886962890625, -1.203826904296875, -1.1287841796875, -1.053741455078125, -0.97869873046875, -0.903656005859375, -0.82861328125, -0.753570556640625, -0.67852783203125, -0.603485107421875, -0.5284423828125, -0.453399658203125, -0.37835693359375, -0.303314208984375, -0.228271484375, -0.153228759765625, -0.07818603515625, -0.003143310546875, 0.0718994140625, 0.146942138671875, 0.22198486328125, 0.297027587890625, 0.3720703125, 0.447113037109375, 0.52215576171875, 0.597198486328125, 0.6722412109375, 0.747283935546875, 0.82232666015625, 0.897369384765625, 0.972412109375, 1.047454833984375, 1.12249755859375, 1.197540283203125, 1.2725830078125, 1.347625732421875, 1.42266845703125, 1.497711181640625, 1.57275390625, 1.647796630859375, 1.72283935546875, 1.797882080078125, 1.8729248046875, 1.947967529296875, 2.02301025390625, 2.098052978515625, 2.173095703125, 2.248138427734375, 2.32318115234375, 2.398223876953125, 2.4732666015625, 2.548309326171875, 2.62335205078125, 2.698394775390625, 2.7734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 20.0, 82.0, 369.0, 385.0, 110.0, 26.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.17121124267578, -44.05184555053711, -40.93247985839844, -37.813114166259766, -34.693748474121094, -31.574382781982422, -28.45501708984375, -25.335651397705078, -22.216285705566406, -19.096920013427734, -15.977554321289062, -12.85818862915039, -9.738822937011719, -6.619457244873047, -3.500091552734375, -0.3807258605957031, 2.7386398315429688, 5.858005523681641, 8.977371215820312, 12.096736907958984, 15.216102600097656, 18.335468292236328, 21.454833984375, 24.574199676513672, 27.693565368652344, 30.812931060791016, 33.93229675292969, 37.05166244506836, 40.17102813720703, 43.2903938293457, 46.409759521484375, 49.52912521362305, 52.64849853515625, 55.76786422729492, 58.887229919433594, 62.006595611572266, 65.12596130371094, 68.24533081054688, 71.36469268798828, 74.48405456542969, 77.60342407226562, 80.72279357910156, 83.84215545654297, 86.96151733398438, 90.08088684082031, 93.20025634765625, 96.31961822509766, 99.43898010253906, 102.558349609375, 105.67771911621094, 108.79708099365234, 111.91644287109375, 115.03581237792969, 118.15518188476562, 121.27454376220703, 124.39390563964844, 127.51327514648438, 130.6326446533203, 133.75201416015625, 136.87136840820312, 139.99073791503906, 143.110107421875, 146.22946166992188, 149.3488311767578, 152.46820068359375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 13.0, 6.0, 18.0, 6.0, 10.0, 19.0, 22.0, 17.0, 28.0, 21.0, 25.0, 44.0, 28.0, 23.0, 36.0, 41.0, 43.0, 47.0, 47.0, 41.0, 35.0, 39.0, 39.0, 38.0, 39.0, 27.0, 32.0, 32.0, 22.0, 20.0, 19.0, 13.0, 17.0, 14.0, 9.0, 14.0, 8.0, 15.0, 5.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.87316131591797, -21.203048706054688, -20.532936096191406, -19.862823486328125, -19.19270896911621, -18.52259635925293, -17.85248374938965, -17.182371139526367, -16.512256622314453, -15.842144012451172, -15.172030448913574, -14.501917839050293, -13.831804275512695, -13.161691665649414, -12.491579055786133, -11.821466445922852, -11.15135383605957, -10.481241226196289, -9.811127662658691, -9.14101505279541, -8.470901489257812, -7.800788879394531, -7.13067626953125, -6.4605631828308105, -5.790450096130371, -5.120337009429932, -4.450223922729492, -3.780111312866211, -3.1099982261657715, -2.439885139465332, -1.7697725296020508, -1.0996594429016113, -0.4295482635498047, 0.24056470394134521, 0.9106776714324951, 1.5807905197143555, 2.250903606414795, 2.9210166931152344, 3.5911293029785156, 4.261242389678955, 4.9313554763793945, 5.601468563079834, 6.271581649780273, 6.941694259643555, 7.611807346343994, 8.281920433044434, 8.952033042907715, 9.622146606445312, 10.292259216308594, 10.962371826171875, 11.632485389709473, 12.302597999572754, 12.972711563110352, 13.642824172973633, 14.312936782836914, 14.983049392700195, 15.653162956237793, 16.32327651977539, 16.993389129638672, 17.663501739501953, 18.333614349365234, 19.003726959228516, 19.673839569091797, 20.34395408630371, 21.014066696166992]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 6.0, 11.0, 13.0, 21.0, 26.0, 41.0, 82.0, 146.0, 254.0, 522.0, 1128.0, 3176.0, 12679.0, 206098.0, 3944629.0, 18815.0, 4146.0, 1329.0, 553.0, 271.0, 117.0, 78.0, 39.0, 29.0, 17.0, 14.0, 6.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.865234375, -15.37109375, -14.876953125, -14.3828125, -13.888671875, -13.39453125, -12.900390625, -12.40625, -11.912109375, -11.41796875, -10.923828125, -10.4296875, -9.935546875, -9.44140625, -8.947265625, -8.453125, -7.958984375, -7.46484375, -6.970703125, -6.4765625, -5.982421875, -5.48828125, -4.994140625, -4.5, -4.005859375, -3.51171875, -3.017578125, -2.5234375, -2.029296875, -1.53515625, -1.041015625, -0.546875, -0.052734375, 0.44140625, 0.935546875, 1.4296875, 1.923828125, 2.41796875, 2.912109375, 3.40625, 3.900390625, 4.39453125, 4.888671875, 5.3828125, 5.876953125, 6.37109375, 6.865234375, 7.359375, 7.853515625, 8.34765625, 8.841796875, 9.3359375, 9.830078125, 10.32421875, 10.818359375, 11.3125, 11.806640625, 12.30078125, 12.794921875, 13.2890625, 13.783203125, 14.27734375, 14.771484375, 15.265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 6.0, 9.0, 20.0, 23.0, 46.0, 61.0, 77.0, 108.0, 134.0, 134.0, 117.0, 93.0, 66.0, 45.0, 30.0, 11.0, 15.0, 10.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -3.00103759765625, -2.9044189453125, -2.80780029296875, -2.711181640625, -2.61456298828125, -2.5179443359375, -2.42132568359375, -2.32470703125, -2.22808837890625, -2.1314697265625, -2.03485107421875, -1.938232421875, -1.84161376953125, -1.7449951171875, -1.64837646484375, -1.5517578125, -1.45513916015625, -1.3585205078125, -1.26190185546875, -1.165283203125, -1.06866455078125, -0.9720458984375, -0.87542724609375, -0.77880859375, -0.68218994140625, -0.5855712890625, -0.48895263671875, -0.392333984375, -0.29571533203125, -0.1990966796875, -0.10247802734375, -0.005859375, 0.09075927734375, 0.1873779296875, 0.28399658203125, 0.380615234375, 0.47723388671875, 0.5738525390625, 0.67047119140625, 0.76708984375, 0.86370849609375, 0.9603271484375, 1.05694580078125, 1.153564453125, 1.25018310546875, 1.3468017578125, 1.44342041015625, 1.5400390625, 1.63665771484375, 1.7332763671875, 1.82989501953125, 1.926513671875, 2.02313232421875, 2.1197509765625, 2.21636962890625, 2.31298828125, 2.40960693359375, 2.5062255859375, 2.60284423828125, 2.699462890625, 2.79608154296875, 2.8927001953125, 2.98931884765625, 3.0859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 5.0, 16.0, 14.0, 16.0, 38.0, 34.0, 59.0, 67.0, 92.0, 127.0, 176.0, 284.0, 381.0, 544.0, 855.0, 1377.0, 2189.0, 3507.0, 6118.0, 12625.0, 31575.0, 148624.0, 3831950.0, 101584.0, 26355.0, 11158.0, 5680.0, 3170.0, 1957.0, 1174.0, 799.0, 496.0, 315.0, 243.0, 164.0, 137.0, 92.0, 69.0, 55.0, 40.0, 30.0, 25.0, 14.0, 10.0, 13.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.48046875, -6.280517578125, -6.08056640625, -5.880615234375, -5.6806640625, -5.480712890625, -5.28076171875, -5.080810546875, -4.880859375, -4.680908203125, -4.48095703125, -4.281005859375, -4.0810546875, -3.881103515625, -3.68115234375, -3.481201171875, -3.28125, -3.081298828125, -2.88134765625, -2.681396484375, -2.4814453125, -2.281494140625, -2.08154296875, -1.881591796875, -1.681640625, -1.481689453125, -1.28173828125, -1.081787109375, -0.8818359375, -0.681884765625, -0.48193359375, -0.281982421875, -0.08203125, 0.117919921875, 0.31787109375, 0.517822265625, 0.7177734375, 0.917724609375, 1.11767578125, 1.317626953125, 1.517578125, 1.717529296875, 1.91748046875, 2.117431640625, 2.3173828125, 2.517333984375, 2.71728515625, 2.917236328125, 3.1171875, 3.317138671875, 3.51708984375, 3.717041015625, 3.9169921875, 4.116943359375, 4.31689453125, 4.516845703125, 4.716796875, 4.916748046875, 5.11669921875, 5.316650390625, 5.5166015625, 5.716552734375, 5.91650390625, 6.116455078125, 6.31640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 9.0, 5.0, 14.0, 16.0, 30.0, 52.0, 145.0, 3194.0, 351.0, 93.0, 48.0, 27.0, 17.0, 16.0, 11.0, 4.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.296875, -4.15234375, -4.0078125, -3.86328125, -3.71875, -3.57421875, -3.4296875, -3.28515625, -3.140625, -2.99609375, -2.8515625, -2.70703125, -2.5625, -2.41796875, -2.2734375, -2.12890625, -1.984375, -1.83984375, -1.6953125, -1.55078125, -1.40625, -1.26171875, -1.1171875, -0.97265625, -0.828125, -0.68359375, -0.5390625, -0.39453125, -0.25, -0.10546875, 0.0390625, 0.18359375, 0.328125, 0.47265625, 0.6171875, 0.76171875, 0.90625, 1.05078125, 1.1953125, 1.33984375, 1.484375, 1.62890625, 1.7734375, 1.91796875, 2.0625, 2.20703125, 2.3515625, 2.49609375, 2.640625, 2.78515625, 2.9296875, 3.07421875, 3.21875, 3.36328125, 3.5078125, 3.65234375, 3.796875, 3.94140625, 4.0859375, 4.23046875, 4.375, 4.51953125, 4.6640625, 4.80859375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 14.0, 18.0, 42.0, 84.0, 220.0, 269.0, 186.0, 90.0, 44.0, 16.0, 12.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.05235481262207, -14.3546142578125, -13.65687370300293, -12.959134101867676, -12.261393547058105, -11.563652992248535, -10.865913391113281, -10.168172836303711, -9.47043228149414, -8.77269172668457, -8.074951171875, -7.377211570739746, -6.679471015930176, -5.9817304611206055, -5.283990383148193, -4.586250305175781, -3.888509750366211, -3.1907694339752197, -2.4930291175842285, -1.7952888011932373, -1.097548484802246, -0.3998081684112549, 0.29793214797973633, 0.9956722259521484, 1.6934127807617188, 2.39115309715271, 3.088893413543701, 3.7866337299346924, 4.484374046325684, 5.182114601135254, 5.879854679107666, 6.577594757080078, 7.275333404541016, 7.973073959350586, 8.670814514160156, 9.36855411529541, 10.06629467010498, 10.76403522491455, 11.461774826049805, 12.159515380859375, 12.857255935668945, 13.554996490478516, 14.252737045288086, 14.95047664642334, 15.64821720123291, 16.345956802368164, 17.043697357177734, 17.741437911987305, 18.439178466796875, 19.136919021606445, 19.834659576416016, 20.532400131225586, 21.230140686035156, 21.927879333496094, 22.625619888305664, 23.323360443115234, 24.021100997924805, 24.718841552734375, 25.416582107543945, 26.114322662353516, 26.812061309814453, 27.509801864624023, 28.207542419433594, 28.905282974243164, 29.603023529052734]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 25.0, 24.0, 28.0, 46.0, 44.0, 66.0, 54.0, 61.0, 89.0, 55.0, 76.0, 54.0, 69.0, 55.0, 54.0, 37.0, 33.0, 28.0, 27.0, 18.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.620869636535645, -11.232672691345215, -10.844475746154785, -10.456278800964355, -10.068081855773926, -9.679884910583496, -9.29168701171875, -8.90349006652832, -8.51529312133789, -8.127096176147461, -7.738899230957031, -7.350702285766602, -6.962505340576172, -6.574308395385742, -6.186110973358154, -5.797914028167725, -5.409717559814453, -5.021520614624023, -4.633323669433594, -4.245126724243164, -3.8569295406341553, -3.4687325954437256, -3.080535411834717, -2.692338466644287, -2.3041415214538574, -1.9159445762634277, -1.5277475118637085, -1.1395504474639893, -0.7513535022735596, -0.3631565570831299, 0.025040626525878906, 0.4132375717163086, 0.8014335632324219, 1.1896305084228516, 1.5778275728225708, 1.96602463722229, 2.3542215824127197, 2.7424185276031494, 3.130615711212158, 3.518812656402588, 3.9070096015930176, 4.295206546783447, 4.683403491973877, 5.071600914001465, 5.4597978591918945, 5.847994804382324, 6.236191749572754, 6.624388694763184, 7.012585639953613, 7.400782585144043, 7.788979530334473, 8.177176475524902, 8.565373420715332, 8.953570365905762, 9.341768264770508, 9.729965209960938, 10.118162155151367, 10.506359100341797, 10.894556045532227, 11.282752990722656, 11.670949935913086, 12.059146881103516, 12.447343826293945, 12.835540771484375, 13.223737716674805]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 14.0, 16.0, 32.0, 52.0, 88.0, 122.0, 261.0, 554.0, 1542.0, 6060.0, 42047.0, 724486.0, 248605.0, 19217.0, 3604.0, 1001.0, 391.0, 190.0, 95.0, 44.0, 38.0, 29.0, 22.0, 11.0, 5.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.2850341796875, -15.773193359375, -15.2613525390625, -14.74951171875, -14.2376708984375, -13.725830078125, -13.2139892578125, -12.7021484375, -12.1903076171875, -11.678466796875, -11.1666259765625, -10.65478515625, -10.1429443359375, -9.631103515625, -9.1192626953125, -8.607421875, -8.0955810546875, -7.583740234375, -7.0718994140625, -6.56005859375, -6.0482177734375, -5.536376953125, -5.0245361328125, -4.5126953125, -4.0008544921875, -3.489013671875, -2.9771728515625, -2.46533203125, -1.9534912109375, -1.441650390625, -0.9298095703125, -0.41796875, 0.0938720703125, 0.605712890625, 1.1175537109375, 1.62939453125, 2.1412353515625, 2.653076171875, 3.1649169921875, 3.6767578125, 4.1885986328125, 4.700439453125, 5.2122802734375, 5.72412109375, 6.2359619140625, 6.747802734375, 7.2596435546875, 7.771484375, 8.2833251953125, 8.795166015625, 9.3070068359375, 9.81884765625, 10.3306884765625, 10.842529296875, 11.3543701171875, 11.8662109375, 12.3780517578125, 12.889892578125, 13.4017333984375, 13.91357421875, 14.4254150390625, 14.937255859375, 15.4490966796875, 15.9609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 22.0, 25.0, 47.0, 70.0, 89.0, 121.0, 144.0, 120.0, 118.0, 83.0, 61.0, 44.0, 21.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.17596435546875, -3.0726318359375, -2.96929931640625, -2.865966796875, -2.76263427734375, -2.6593017578125, -2.55596923828125, -2.45263671875, -2.34930419921875, -2.2459716796875, -2.14263916015625, -2.039306640625, -1.93597412109375, -1.8326416015625, -1.72930908203125, -1.6259765625, -1.52264404296875, -1.4193115234375, -1.31597900390625, -1.212646484375, -1.10931396484375, -1.0059814453125, -0.90264892578125, -0.79931640625, -0.69598388671875, -0.5926513671875, -0.48931884765625, -0.385986328125, -0.28265380859375, -0.1793212890625, -0.07598876953125, 0.02734375, 0.13067626953125, 0.2340087890625, 0.33734130859375, 0.440673828125, 0.54400634765625, 0.6473388671875, 0.75067138671875, 0.85400390625, 0.95733642578125, 1.0606689453125, 1.16400146484375, 1.267333984375, 1.37066650390625, 1.4739990234375, 1.57733154296875, 1.6806640625, 1.78399658203125, 1.8873291015625, 1.99066162109375, 2.093994140625, 2.19732666015625, 2.3006591796875, 2.40399169921875, 2.50732421875, 2.61065673828125, 2.7139892578125, 2.81732177734375, 2.920654296875, 3.02398681640625, 3.1273193359375, 3.23065185546875, 3.333984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 9.0, 3.0, 6.0, 14.0, 4.0, 23.0, 14.0, 28.0, 37.0, 64.0, 71.0, 108.0, 186.0, 333.0, 491.0, 1057.0, 2065.0, 4681.0, 11687.0, 39187.0, 210514.0, 635449.0, 102945.0, 24263.0, 8186.0, 3478.0, 1635.0, 790.0, 460.0, 251.0, 156.0, 105.0, 85.0, 40.0, 33.0, 15.0, 20.0, 20.0, 10.0, 8.0, 5.0, 2.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.4453125, -8.1839599609375, -7.922607421875, -7.6612548828125, -7.39990234375, -7.1385498046875, -6.877197265625, -6.6158447265625, -6.3544921875, -6.0931396484375, -5.831787109375, -5.5704345703125, -5.30908203125, -5.0477294921875, -4.786376953125, -4.5250244140625, -4.263671875, -4.0023193359375, -3.740966796875, -3.4796142578125, -3.21826171875, -2.9569091796875, -2.695556640625, -2.4342041015625, -2.1728515625, -1.9114990234375, -1.650146484375, -1.3887939453125, -1.12744140625, -0.8660888671875, -0.604736328125, -0.3433837890625, -0.08203125, 0.1793212890625, 0.440673828125, 0.7020263671875, 0.96337890625, 1.2247314453125, 1.486083984375, 1.7474365234375, 2.0087890625, 2.2701416015625, 2.531494140625, 2.7928466796875, 3.05419921875, 3.3155517578125, 3.576904296875, 3.8382568359375, 4.099609375, 4.3609619140625, 4.622314453125, 4.8836669921875, 5.14501953125, 5.4063720703125, 5.667724609375, 5.9290771484375, 6.1904296875, 6.4517822265625, 6.713134765625, 6.9744873046875, 7.23583984375, 7.4971923828125, 7.758544921875, 8.0198974609375, 8.28125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 7.0, 10.0, 10.0, 15.0, 17.0, 17.0, 29.0, 29.0, 45.0, 37.0, 43.0, 43.0, 61.0, 54.0, 57.0, 46.0, 58.0, 53.0, 42.0, 53.0, 33.0, 40.0, 39.0, 28.0, 13.0, 19.0, 13.0, 17.0, 11.0, 8.0, 6.0, 6.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.62890625, -7.3880615234375, -7.147216796875, -6.9063720703125, -6.66552734375, -6.4246826171875, -6.183837890625, -5.9429931640625, -5.7021484375, -5.4613037109375, -5.220458984375, -4.9796142578125, -4.73876953125, -4.4979248046875, -4.257080078125, -4.0162353515625, -3.775390625, -3.5345458984375, -3.293701171875, -3.0528564453125, -2.81201171875, -2.5711669921875, -2.330322265625, -2.0894775390625, -1.8486328125, -1.6077880859375, -1.366943359375, -1.1260986328125, -0.88525390625, -0.6444091796875, -0.403564453125, -0.1627197265625, 0.078125, 0.3189697265625, 0.559814453125, 0.8006591796875, 1.04150390625, 1.2823486328125, 1.523193359375, 1.7640380859375, 2.0048828125, 2.2457275390625, 2.486572265625, 2.7274169921875, 2.96826171875, 3.2091064453125, 3.449951171875, 3.6907958984375, 3.931640625, 4.1724853515625, 4.413330078125, 4.6541748046875, 4.89501953125, 5.1358642578125, 5.376708984375, 5.6175537109375, 5.8583984375, 6.0992431640625, 6.340087890625, 6.5809326171875, 6.82177734375, 7.0626220703125, 7.303466796875, 7.5443115234375, 7.78515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 15.0, 10.0, 15.0, 33.0, 42.0, 63.0, 122.0, 186.0, 341.0, 744.0, 1728.0, 4847.0, 17889.0, 130555.0, 790538.0, 81319.0, 13166.0, 3906.0, 1605.0, 653.0, 344.0, 164.0, 101.0, 61.0, 35.0, 17.0, 15.0, 12.0, 6.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.9522705078125, -3.826416015625, -3.7005615234375, -3.57470703125, -3.4488525390625, -3.322998046875, -3.1971435546875, -3.0712890625, -2.9454345703125, -2.819580078125, -2.6937255859375, -2.56787109375, -2.4420166015625, -2.316162109375, -2.1903076171875, -2.064453125, -1.9385986328125, -1.812744140625, -1.6868896484375, -1.56103515625, -1.4351806640625, -1.309326171875, -1.1834716796875, -1.0576171875, -0.9317626953125, -0.805908203125, -0.6800537109375, -0.55419921875, -0.4283447265625, -0.302490234375, -0.1766357421875, -0.05078125, 0.0750732421875, 0.200927734375, 0.3267822265625, 0.45263671875, 0.5784912109375, 0.704345703125, 0.8302001953125, 0.9560546875, 1.0819091796875, 1.207763671875, 1.3336181640625, 1.45947265625, 1.5853271484375, 1.711181640625, 1.8370361328125, 1.962890625, 2.0887451171875, 2.214599609375, 2.3404541015625, 2.46630859375, 2.5921630859375, 2.718017578125, 2.8438720703125, 2.9697265625, 3.0955810546875, 3.221435546875, 3.3472900390625, 3.47314453125, 3.5989990234375, 3.724853515625, 3.8507080078125, 3.9765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 15.0, 22.0, 43.0, 71.0, 88.0, 141.0, 182.0, 136.0, 97.0, 67.0, 43.0, 25.0, 15.0, 12.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004038810729980469, -0.0003892257809638977, -0.00037457048892974854, -0.00035991519689559937, -0.0003452599048614502, -0.000330604612827301, -0.00031594932079315186, -0.0003012940287590027, -0.0002866387367248535, -0.00027198344469070435, -0.0002573281526565552, -0.000242672860622406, -0.00022801756858825684, -0.00021336227655410767, -0.0001987069845199585, -0.00018405169248580933, -0.00016939640045166016, -0.00015474110841751099, -0.00014008581638336182, -0.00012543052434921265, -0.00011077523231506348, -9.61199402809143e-05, -8.146464824676514e-05, -6.680935621261597e-05, -5.21540641784668e-05, -3.749877214431763e-05, -2.2843480110168457e-05, -8.188188076019287e-06, 6.467103958129883e-06, 2.1122395992279053e-05, 3.577768802642822e-05, 5.043298006057739e-05, 6.508827209472656e-05, 7.974356412887573e-05, 9.43988561630249e-05, 0.00010905414819717407, 0.00012370944023132324, 0.0001383647322654724, 0.00015302002429962158, 0.00016767531633377075, 0.00018233060836791992, 0.0001969859004020691, 0.00021164119243621826, 0.00022629648447036743, 0.0002409517765045166, 0.00025560706853866577, 0.00027026236057281494, 0.0002849176526069641, 0.0002995729446411133, 0.00031422823667526245, 0.0003288835287094116, 0.0003435388207435608, 0.00035819411277770996, 0.00037284940481185913, 0.0003875046968460083, 0.00040215998888015747, 0.00041681528091430664, 0.0004314705729484558, 0.000446125864982605, 0.00046078115701675415, 0.0004754364490509033, 0.0004900917410850525, 0.0005047470331192017, 0.0005194023251533508, 0.0005340576171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 12.0, 12.0, 12.0, 20.0, 28.0, 48.0, 71.0, 101.0, 171.0, 356.0, 656.0, 1443.0, 3852.0, 15527.0, 117652.0, 760472.0, 125145.0, 15946.0, 4003.0, 1435.0, 718.0, 329.0, 208.0, 111.0, 55.0, 44.0, 34.0, 24.0, 13.0, 18.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.103973388671875, -2.99114990234375, -2.878326416015625, -2.7655029296875, -2.652679443359375, -2.53985595703125, -2.427032470703125, -2.314208984375, -2.201385498046875, -2.08856201171875, -1.975738525390625, -1.8629150390625, -1.750091552734375, -1.63726806640625, -1.524444580078125, -1.41162109375, -1.298797607421875, -1.18597412109375, -1.073150634765625, -0.9603271484375, -0.847503662109375, -0.73468017578125, -0.621856689453125, -0.509033203125, -0.396209716796875, -0.28338623046875, -0.170562744140625, -0.0577392578125, 0.055084228515625, 0.16790771484375, 0.280731201171875, 0.3935546875, 0.506378173828125, 0.61920166015625, 0.732025146484375, 0.8448486328125, 0.957672119140625, 1.07049560546875, 1.183319091796875, 1.296142578125, 1.408966064453125, 1.52178955078125, 1.634613037109375, 1.7474365234375, 1.860260009765625, 1.97308349609375, 2.085906982421875, 2.19873046875, 2.311553955078125, 2.42437744140625, 2.537200927734375, 2.6500244140625, 2.762847900390625, 2.87567138671875, 2.988494873046875, 3.101318359375, 3.214141845703125, 3.32696533203125, 3.439788818359375, 3.5526123046875, 3.665435791015625, 3.77825927734375, 3.891082763671875, 4.00390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 14.0, 22.0, 19.0, 39.0, 42.0, 54.0, 77.0, 100.0, 119.0, 136.0, 96.0, 81.0, 58.0, 35.0, 35.0, 15.0, 13.0, 9.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.595977783203125, -2.48687744140625, -2.377777099609375, -2.2686767578125, -2.159576416015625, -2.05047607421875, -1.941375732421875, -1.832275390625, -1.723175048828125, -1.61407470703125, -1.504974365234375, -1.3958740234375, -1.286773681640625, -1.17767333984375, -1.068572998046875, -0.95947265625, -0.850372314453125, -0.74127197265625, -0.632171630859375, -0.5230712890625, -0.413970947265625, -0.30487060546875, -0.195770263671875, -0.086669921875, 0.022430419921875, 0.13153076171875, 0.240631103515625, 0.3497314453125, 0.458831787109375, 0.56793212890625, 0.677032470703125, 0.7861328125, 0.895233154296875, 1.00433349609375, 1.113433837890625, 1.2225341796875, 1.331634521484375, 1.44073486328125, 1.549835205078125, 1.658935546875, 1.768035888671875, 1.87713623046875, 1.986236572265625, 2.0953369140625, 2.204437255859375, 2.31353759765625, 2.422637939453125, 2.53173828125, 2.640838623046875, 2.74993896484375, 2.859039306640625, 2.9681396484375, 3.077239990234375, 3.18634033203125, 3.295440673828125, 3.404541015625, 3.513641357421875, 3.62274169921875, 3.731842041015625, 3.8409423828125, 3.950042724609375, 4.05914306640625, 4.168243408203125, 4.27734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 9.0, 13.0, 13.0, 36.0, 78.0, 140.0, 251.0, 208.0, 132.0, 60.0, 28.0, 16.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96219253540039, -60.32707595825195, -57.691959381103516, -55.05684280395508, -52.421730041503906, -49.78661346435547, -47.15149688720703, -44.516380310058594, -41.881263732910156, -39.24614715576172, -36.61103057861328, -33.975914001464844, -31.34079933166504, -28.7056827545166, -26.070568084716797, -23.43545150756836, -20.800334930419922, -18.165218353271484, -15.530102729797363, -12.894987106323242, -10.259870529174805, -7.624753952026367, -4.989638328552246, -2.354522705078125, 0.2805938720703125, 2.915709972381592, 5.550826072692871, 8.185941696166992, 10.82105827331543, 13.456174850463867, 16.091289520263672, 18.72640609741211, 21.361526489257812, 23.99664306640625, 26.631759643554688, 29.266874313354492, 31.90199089050293, 34.537109375, 37.17222213745117, 39.80733871459961, 42.44245529174805, 45.077571868896484, 47.71268844604492, 50.34780502319336, 52.98291778564453, 55.61803436279297, 58.253150939941406, 60.888267517089844, 63.52338409423828, 66.15850067138672, 68.79361724853516, 71.4287338256836, 74.06385040283203, 76.69896697998047, 79.3340835571289, 81.96919250488281, 84.60430908203125, 87.23942565917969, 89.87454223632812, 92.50965881347656, 95.144775390625, 97.77989196777344, 100.41500854492188, 103.05012512207031, 105.68524169921875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 9.0, 3.0, 7.0, 9.0, 8.0, 7.0, 19.0, 19.0, 16.0, 24.0, 26.0, 28.0, 33.0, 37.0, 35.0, 38.0, 33.0, 31.0, 33.0, 52.0, 43.0, 36.0, 48.0, 36.0, 36.0, 39.0, 40.0, 28.0, 23.0, 28.0, 27.0, 13.0, 23.0, 15.0, 13.0, 13.0, 11.0, 7.0, 12.0, 7.0, 5.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.39800262451172, -32.280540466308594, -31.16307830810547, -30.045618057250977, -28.92815589904785, -27.810693740844727, -26.693233489990234, -25.57577133178711, -24.458309173583984, -23.34084701538086, -22.223384857177734, -21.105924606323242, -19.988462448120117, -18.871000289916992, -17.7535400390625, -16.636077880859375, -15.51861572265625, -14.401153564453125, -13.283692359924316, -12.166231155395508, -11.048768997192383, -9.931306838989258, -8.81384563446045, -7.696383953094482, -6.578922271728516, -5.461460590362549, -4.343998908996582, -3.2265372276306152, -2.1090755462646484, -0.9916138648986816, 0.12584781646728516, 1.243309497833252, 2.360767364501953, 3.47822904586792, 4.595690727233887, 5.7131524085998535, 6.83061408996582, 7.948075771331787, 9.065537452697754, 10.182998657226562, 11.300460815429688, 12.417922973632812, 13.535384178161621, 14.65284538269043, 15.770307540893555, 16.88776969909668, 18.005229949951172, 19.122692108154297, 20.240154266357422, 21.357616424560547, 22.475078582763672, 23.592538833618164, 24.71000099182129, 25.827463150024414, 26.944923400878906, 28.06238555908203, 29.179847717285156, 30.29730987548828, 31.414772033691406, 32.53223419189453, 33.649696350097656, 34.767154693603516, 35.88461685180664, 37.002079010009766, 38.11954116821289]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 12.0, 21.0, 20.0, 61.0, 97.0, 148.0, 321.0, 657.0, 1434.0, 4048.0, 18658.0, 3667568.0, 479240.0, 15581.0, 3671.0, 1400.0, 608.0, 319.0, 169.0, 91.0, 53.0, 30.0, 20.0, 9.0, 7.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.73828125, -18.1328125, -17.52734375, -16.921875, -16.31640625, -15.7109375, -15.10546875, -14.5, -13.89453125, -13.2890625, -12.68359375, -12.078125, -11.47265625, -10.8671875, -10.26171875, -9.65625, -9.05078125, -8.4453125, -7.83984375, -7.234375, -6.62890625, -6.0234375, -5.41796875, -4.8125, -4.20703125, -3.6015625, -2.99609375, -2.390625, -1.78515625, -1.1796875, -0.57421875, 0.03125, 0.63671875, 1.2421875, 1.84765625, 2.453125, 3.05859375, 3.6640625, 4.26953125, 4.875, 5.48046875, 6.0859375, 6.69140625, 7.296875, 7.90234375, 8.5078125, 9.11328125, 9.71875, 10.32421875, 10.9296875, 11.53515625, 12.140625, 12.74609375, 13.3515625, 13.95703125, 14.5625, 15.16796875, 15.7734375, 16.37890625, 16.984375, 17.58984375, 18.1953125, 18.80078125, 19.40625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 19.0, 20.0, 44.0, 55.0, 63.0, 107.0, 100.0, 107.0, 104.0, 82.0, 91.0, 61.0, 42.0, 32.0, 16.0, 19.0, 13.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.14630126953125, -3.0406494140625, -2.93499755859375, -2.829345703125, -2.72369384765625, -2.6180419921875, -2.51239013671875, -2.40673828125, -2.30108642578125, -2.1954345703125, -2.08978271484375, -1.984130859375, -1.87847900390625, -1.7728271484375, -1.66717529296875, -1.5615234375, -1.45587158203125, -1.3502197265625, -1.24456787109375, -1.138916015625, -1.03326416015625, -0.9276123046875, -0.82196044921875, -0.71630859375, -0.61065673828125, -0.5050048828125, -0.39935302734375, -0.293701171875, -0.18804931640625, -0.0823974609375, 0.02325439453125, 0.12890625, 0.23455810546875, 0.3402099609375, 0.44586181640625, 0.551513671875, 0.65716552734375, 0.7628173828125, 0.86846923828125, 0.97412109375, 1.07977294921875, 1.1854248046875, 1.29107666015625, 1.396728515625, 1.50238037109375, 1.6080322265625, 1.71368408203125, 1.8193359375, 1.92498779296875, 2.0306396484375, 2.13629150390625, 2.241943359375, 2.34759521484375, 2.4532470703125, 2.55889892578125, 2.66455078125, 2.77020263671875, 2.8758544921875, 2.98150634765625, 3.087158203125, 3.19281005859375, 3.2984619140625, 3.40411376953125, 3.509765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 12.0, 18.0, 25.0, 45.0, 75.0, 94.0, 111.0, 189.0, 295.0, 384.0, 612.0, 951.0, 1737.0, 3125.0, 6849.0, 20775.0, 122413.0, 3858641.0, 140307.0, 22306.0, 7417.0, 3216.0, 1714.0, 990.0, 660.0, 421.0, 255.0, 203.0, 142.0, 87.0, 64.0, 38.0, 26.0, 19.0, 19.0, 13.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.713134765625, -11.36376953125, -11.014404296875, -10.6650390625, -10.315673828125, -9.96630859375, -9.616943359375, -9.267578125, -8.918212890625, -8.56884765625, -8.219482421875, -7.8701171875, -7.520751953125, -7.17138671875, -6.822021484375, -6.47265625, -6.123291015625, -5.77392578125, -5.424560546875, -5.0751953125, -4.725830078125, -4.37646484375, -4.027099609375, -3.677734375, -3.328369140625, -2.97900390625, -2.629638671875, -2.2802734375, -1.930908203125, -1.58154296875, -1.232177734375, -0.8828125, -0.533447265625, -0.18408203125, 0.165283203125, 0.5146484375, 0.864013671875, 1.21337890625, 1.562744140625, 1.912109375, 2.261474609375, 2.61083984375, 2.960205078125, 3.3095703125, 3.658935546875, 4.00830078125, 4.357666015625, 4.70703125, 5.056396484375, 5.40576171875, 5.755126953125, 6.1044921875, 6.453857421875, 6.80322265625, 7.152587890625, 7.501953125, 7.851318359375, 8.20068359375, 8.550048828125, 8.8994140625, 9.248779296875, 9.59814453125, 9.947509765625, 10.296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 9.0, 16.0, 26.0, 38.0, 83.0, 196.0, 2251.0, 1048.0, 186.0, 69.0, 42.0, 23.0, 17.0, 12.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.95098876953125, -5.7379150390625, -5.52484130859375, -5.311767578125, -5.09869384765625, -4.8856201171875, -4.67254638671875, -4.45947265625, -4.24639892578125, -4.0333251953125, -3.82025146484375, -3.607177734375, -3.39410400390625, -3.1810302734375, -2.96795654296875, -2.7548828125, -2.54180908203125, -2.3287353515625, -2.11566162109375, -1.902587890625, -1.68951416015625, -1.4764404296875, -1.26336669921875, -1.05029296875, -0.83721923828125, -0.6241455078125, -0.41107177734375, -0.197998046875, 0.01507568359375, 0.2281494140625, 0.44122314453125, 0.654296875, 0.86737060546875, 1.0804443359375, 1.29351806640625, 1.506591796875, 1.71966552734375, 1.9327392578125, 2.14581298828125, 2.35888671875, 2.57196044921875, 2.7850341796875, 2.99810791015625, 3.211181640625, 3.42425537109375, 3.6373291015625, 3.85040283203125, 4.0634765625, 4.27655029296875, 4.4896240234375, 4.70269775390625, 4.915771484375, 5.12884521484375, 5.3419189453125, 5.55499267578125, 5.76806640625, 5.98114013671875, 6.1942138671875, 6.40728759765625, 6.620361328125, 6.83343505859375, 7.0465087890625, 7.25958251953125, 7.47265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 15.0, 55.0, 185.0, 358.0, 240.0, 87.0, 34.0, 16.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.696670532226562, -12.765999794006348, -10.835329055786133, -8.904659271240234, -6.973988056182861, -5.043317794799805, -3.11264705657959, -1.181976318359375, 0.7486944198608398, 2.6793651580810547, 4.6100358963012695, 6.540706157684326, 8.471376419067383, 10.402047157287598, 12.332717895507812, 14.263388633728027, 16.194059371948242, 18.12472915649414, 20.055400848388672, 21.98607063293457, 23.9167423248291, 25.847412109375, 27.77808380126953, 29.70875358581543, 31.639423370361328, 33.57009506225586, 35.500762939453125, 37.431434631347656, 39.36210632324219, 41.29277801513672, 43.223445892333984, 45.154117584228516, 47.08478927612305, 49.01546096801758, 50.946128845214844, 52.876800537109375, 54.807472229003906, 56.73814392089844, 58.6688117980957, 60.599483489990234, 62.530155181884766, 64.46082305908203, 66.39149475097656, 68.3221664428711, 70.25283813476562, 72.18350982666016, 74.11418151855469, 76.04484558105469, 77.97551727294922, 79.90618896484375, 81.83686065673828, 83.76753234863281, 85.69819641113281, 87.62886810302734, 89.55953979492188, 91.4902114868164, 93.42088317871094, 95.35155487060547, 97.2822265625, 99.21289825439453, 101.14356231689453, 103.07423400878906, 105.0049057006836, 106.93557739257812, 108.86624908447266]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 8.0, 14.0, 13.0, 14.0, 19.0, 15.0, 12.0, 20.0, 32.0, 22.0, 38.0, 38.0, 39.0, 36.0, 47.0, 50.0, 41.0, 44.0, 44.0, 39.0, 43.0, 33.0, 46.0, 43.0, 25.0, 25.0, 22.0, 25.0, 26.0, 17.0, 14.0, 9.0, 15.0, 13.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-17.335174560546875, -16.855005264282227, -16.374835968017578, -15.894665718078613, -15.414496421813965, -14.934326171875, -14.454156875610352, -13.973987579345703, -13.493818283081055, -13.013648986816406, -12.533478736877441, -12.053309440612793, -11.573140144348145, -11.09296989440918, -10.612800598144531, -10.132631301879883, -9.652461051940918, -9.17229175567627, -8.692121505737305, -8.211952209472656, -7.731782913208008, -7.251613140106201, -6.7714433670043945, -6.291274070739746, -5.8111042976379395, -5.330934524536133, -4.850765228271484, -4.370595455169678, -3.89042592048645, -3.4102563858032227, -2.930086612701416, -2.4499170780181885, -1.9697484970092773, -1.4895789623260498, -1.0094093084335327, -0.5292396545410156, -0.049070119857788086, 0.43109941482543945, 0.9112691879272461, 1.3914387226104736, 1.8716082572937012, 2.3517777919769287, 2.8319473266601562, 3.312117099761963, 3.7922866344451904, 4.272456169128418, 4.752625942230225, 5.232795715332031, 5.71296501159668, 6.193134784698486, 6.673304080963135, 7.153473854064941, 7.63364315032959, 8.113813400268555, 8.593982696533203, 9.074151992797852, 9.5543212890625, 10.034490585327148, 10.514660835266113, 10.994830131530762, 11.47499942779541, 11.955169677734375, 12.435338973999023, 12.915508270263672, 13.395678520202637]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 13.0, 13.0, 22.0, 17.0, 32.0, 45.0, 75.0, 91.0, 160.0, 271.0, 481.0, 924.0, 1863.0, 3998.0, 8945.0, 21954.0, 59135.0, 217640.0, 505034.0, 151104.0, 45214.0, 17431.0, 7328.0, 3248.0, 1595.0, 806.0, 436.0, 262.0, 127.0, 87.0, 43.0, 45.0, 25.0, 19.0, 15.0, 14.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.546875, -8.2655029296875, -7.984130859375, -7.7027587890625, -7.42138671875, -7.1400146484375, -6.858642578125, -6.5772705078125, -6.2958984375, -6.0145263671875, -5.733154296875, -5.4517822265625, -5.17041015625, -4.8890380859375, -4.607666015625, -4.3262939453125, -4.044921875, -3.7635498046875, -3.482177734375, -3.2008056640625, -2.91943359375, -2.6380615234375, -2.356689453125, -2.0753173828125, -1.7939453125, -1.5125732421875, -1.231201171875, -0.9498291015625, -0.66845703125, -0.3870849609375, -0.105712890625, 0.1756591796875, 0.45703125, 0.7384033203125, 1.019775390625, 1.3011474609375, 1.58251953125, 1.8638916015625, 2.145263671875, 2.4266357421875, 2.7080078125, 2.9893798828125, 3.270751953125, 3.5521240234375, 3.83349609375, 4.1148681640625, 4.396240234375, 4.6776123046875, 4.958984375, 5.2403564453125, 5.521728515625, 5.8031005859375, 6.08447265625, 6.3658447265625, 6.647216796875, 6.9285888671875, 7.2099609375, 7.4913330078125, 7.772705078125, 8.0540771484375, 8.33544921875, 8.6168212890625, 8.898193359375, 9.1795654296875, 9.4609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 15.0, 14.0, 31.0, 49.0, 48.0, 63.0, 80.0, 106.0, 103.0, 114.0, 80.0, 70.0, 53.0, 38.0, 33.0, 38.0, 24.0, 12.0, 7.0, 8.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.234375, -3.125701904296875, -3.01702880859375, -2.908355712890625, -2.7996826171875, -2.691009521484375, -2.58233642578125, -2.473663330078125, -2.364990234375, -2.256317138671875, -2.14764404296875, -2.038970947265625, -1.9302978515625, -1.821624755859375, -1.71295166015625, -1.604278564453125, -1.49560546875, -1.386932373046875, -1.27825927734375, -1.169586181640625, -1.0609130859375, -0.952239990234375, -0.84356689453125, -0.734893798828125, -0.626220703125, -0.517547607421875, -0.40887451171875, -0.300201416015625, -0.1915283203125, -0.082855224609375, 0.02581787109375, 0.134490966796875, 0.2431640625, 0.351837158203125, 0.46051025390625, 0.569183349609375, 0.6778564453125, 0.786529541015625, 0.89520263671875, 1.003875732421875, 1.112548828125, 1.221221923828125, 1.32989501953125, 1.438568115234375, 1.5472412109375, 1.655914306640625, 1.76458740234375, 1.873260498046875, 1.98193359375, 2.090606689453125, 2.19927978515625, 2.307952880859375, 2.4166259765625, 2.525299072265625, 2.63397216796875, 2.742645263671875, 2.851318359375, 2.959991455078125, 3.06866455078125, 3.177337646484375, 3.2860107421875, 3.394683837890625, 3.50335693359375, 3.612030029296875, 3.720703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 6.0, 6.0, 10.0, 9.0, 15.0, 20.0, 28.0, 32.0, 37.0, 73.0, 119.0, 158.0, 232.0, 342.0, 621.0, 1048.0, 2069.0, 4200.0, 9976.0, 25603.0, 82223.0, 392792.0, 399898.0, 83949.0, 26029.0, 9955.0, 4296.0, 2017.0, 1106.0, 610.0, 344.0, 230.0, 153.0, 104.0, 75.0, 54.0, 30.0, 29.0, 18.0, 8.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6015625, -10.2596435546875, -9.917724609375, -9.5758056640625, -9.23388671875, -8.8919677734375, -8.550048828125, -8.2081298828125, -7.8662109375, -7.5242919921875, -7.182373046875, -6.8404541015625, -6.49853515625, -6.1566162109375, -5.814697265625, -5.4727783203125, -5.130859375, -4.7889404296875, -4.447021484375, -4.1051025390625, -3.76318359375, -3.4212646484375, -3.079345703125, -2.7374267578125, -2.3955078125, -2.0535888671875, -1.711669921875, -1.3697509765625, -1.02783203125, -0.6859130859375, -0.343994140625, -0.0020751953125, 0.33984375, 0.6817626953125, 1.023681640625, 1.3656005859375, 1.70751953125, 2.0494384765625, 2.391357421875, 2.7332763671875, 3.0751953125, 3.4171142578125, 3.759033203125, 4.1009521484375, 4.44287109375, 4.7847900390625, 5.126708984375, 5.4686279296875, 5.810546875, 6.1524658203125, 6.494384765625, 6.8363037109375, 7.17822265625, 7.5201416015625, 7.862060546875, 8.2039794921875, 8.5458984375, 8.8878173828125, 9.229736328125, 9.5716552734375, 9.91357421875, 10.2554931640625, 10.597412109375, 10.9393310546875, 11.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 25.0, 31.0, 28.0, 32.0, 43.0, 43.0, 47.0, 60.0, 56.0, 54.0, 50.0, 49.0, 40.0, 41.0, 45.0, 32.0, 40.0, 28.0, 26.0, 21.0, 28.0, 13.0, 15.0, 12.0, 16.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8671875, -11.483154296875, -11.09912109375, -10.715087890625, -10.3310546875, -9.947021484375, -9.56298828125, -9.178955078125, -8.794921875, -8.410888671875, -8.02685546875, -7.642822265625, -7.2587890625, -6.874755859375, -6.49072265625, -6.106689453125, -5.72265625, -5.338623046875, -4.95458984375, -4.570556640625, -4.1865234375, -3.802490234375, -3.41845703125, -3.034423828125, -2.650390625, -2.266357421875, -1.88232421875, -1.498291015625, -1.1142578125, -0.730224609375, -0.34619140625, 0.037841796875, 0.421875, 0.805908203125, 1.18994140625, 1.573974609375, 1.9580078125, 2.342041015625, 2.72607421875, 3.110107421875, 3.494140625, 3.878173828125, 4.26220703125, 4.646240234375, 5.0302734375, 5.414306640625, 5.79833984375, 6.182373046875, 6.56640625, 6.950439453125, 7.33447265625, 7.718505859375, 8.1025390625, 8.486572265625, 8.87060546875, 9.254638671875, 9.638671875, 10.022705078125, 10.40673828125, 10.790771484375, 11.1748046875, 11.558837890625, 11.94287109375, 12.326904296875, 12.7109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 14.0, 25.0, 34.0, 29.0, 70.0, 102.0, 149.0, 317.0, 687.0, 1597.0, 5266.0, 31245.0, 740977.0, 246393.0, 15831.0, 3468.0, 1190.0, 488.0, 249.0, 145.0, 78.0, 52.0, 38.0, 20.0, 26.0, 11.0, 8.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.09283447265625, -6.8380126953125, -6.58319091796875, -6.328369140625, -6.07354736328125, -5.8187255859375, -5.56390380859375, -5.30908203125, -5.05426025390625, -4.7994384765625, -4.54461669921875, -4.289794921875, -4.03497314453125, -3.7801513671875, -3.52532958984375, -3.2705078125, -3.01568603515625, -2.7608642578125, -2.50604248046875, -2.251220703125, -1.99639892578125, -1.7415771484375, -1.48675537109375, -1.23193359375, -0.97711181640625, -0.7222900390625, -0.46746826171875, -0.212646484375, 0.04217529296875, 0.2969970703125, 0.55181884765625, 0.806640625, 1.06146240234375, 1.3162841796875, 1.57110595703125, 1.825927734375, 2.08074951171875, 2.3355712890625, 2.59039306640625, 2.84521484375, 3.10003662109375, 3.3548583984375, 3.60968017578125, 3.864501953125, 4.11932373046875, 4.3741455078125, 4.62896728515625, 4.8837890625, 5.13861083984375, 5.3934326171875, 5.64825439453125, 5.903076171875, 6.15789794921875, 6.4127197265625, 6.66754150390625, 6.92236328125, 7.17718505859375, 7.4320068359375, 7.68682861328125, 7.941650390625, 8.19647216796875, 8.4512939453125, 8.70611572265625, 8.9609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 9.0, 4.0, 12.0, 18.0, 21.0, 23.0, 36.0, 47.0, 66.0, 114.0, 123.0, 124.0, 118.0, 90.0, 52.0, 41.0, 31.0, 17.0, 11.0, 5.0, 12.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005536079406738281, -0.0005363672971725464, -0.0005191266536712646, -0.0005018860101699829, -0.00048464536666870117, -0.00046740472316741943, -0.0004501640796661377, -0.00043292343616485596, -0.0004156827926635742, -0.0003984421491622925, -0.00038120150566101074, -0.000363960862159729, -0.00034672021865844727, -0.00032947957515716553, -0.0003122389316558838, -0.00029499828815460205, -0.0002777576446533203, -0.0002605170011520386, -0.00024327635765075684, -0.0002260357141494751, -0.00020879507064819336, -0.00019155442714691162, -0.00017431378364562988, -0.00015707314014434814, -0.0001398324966430664, -0.00012259185314178467, -0.00010535120964050293, -8.811056613922119e-05, -7.086992263793945e-05, -5.3629279136657715e-05, -3.6388635635375977e-05, -1.9147992134094238e-05, -1.9073486328125e-06, 1.5333294868469238e-05, 3.2573938369750977e-05, 4.9814581871032715e-05, 6.705522537231445e-05, 8.429586887359619e-05, 0.00010153651237487793, 0.00011877715587615967, 0.0001360177993774414, 0.00015325844287872314, 0.00017049908638000488, 0.00018773972988128662, 0.00020498037338256836, 0.0002222210168838501, 0.00023946166038513184, 0.0002567023038864136, 0.0002739429473876953, 0.00029118359088897705, 0.0003084242343902588, 0.00032566487789154053, 0.00034290552139282227, 0.000360146164894104, 0.00037738680839538574, 0.0003946274518966675, 0.0004118680953979492, 0.00042910873889923096, 0.0004463493824005127, 0.00046359002590179443, 0.00048083066940307617, 0.0004980713129043579, 0.0005153119564056396, 0.0005325525999069214, 0.0005497932434082031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 0.0, 5.0, 8.0, 6.0, 15.0, 19.0, 26.0, 29.0, 56.0, 81.0, 117.0, 180.0, 315.0, 504.0, 901.0, 1703.0, 3509.0, 8474.0, 24045.0, 94829.0, 522370.0, 307272.0, 55444.0, 16466.0, 6181.0, 2695.0, 1377.0, 752.0, 385.0, 267.0, 163.0, 112.0, 68.0, 55.0, 33.0, 26.0, 17.0, 9.0, 8.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.529296875, -3.421783447265625, -3.31427001953125, -3.206756591796875, -3.0992431640625, -2.991729736328125, -2.88421630859375, -2.776702880859375, -2.669189453125, -2.561676025390625, -2.45416259765625, -2.346649169921875, -2.2391357421875, -2.131622314453125, -2.02410888671875, -1.916595458984375, -1.80908203125, -1.701568603515625, -1.59405517578125, -1.486541748046875, -1.3790283203125, -1.271514892578125, -1.16400146484375, -1.056488037109375, -0.948974609375, -0.841461181640625, -0.73394775390625, -0.626434326171875, -0.5189208984375, -0.411407470703125, -0.30389404296875, -0.196380615234375, -0.0888671875, 0.018646240234375, 0.12615966796875, 0.233673095703125, 0.3411865234375, 0.448699951171875, 0.55621337890625, 0.663726806640625, 0.771240234375, 0.878753662109375, 0.98626708984375, 1.093780517578125, 1.2012939453125, 1.308807373046875, 1.41632080078125, 1.523834228515625, 1.63134765625, 1.738861083984375, 1.84637451171875, 1.953887939453125, 2.0614013671875, 2.168914794921875, 2.27642822265625, 2.383941650390625, 2.491455078125, 2.598968505859375, 2.70648193359375, 2.813995361328125, 2.9215087890625, 3.029022216796875, 3.13653564453125, 3.244049072265625, 3.3515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 12.0, 7.0, 12.0, 21.0, 30.0, 20.0, 44.0, 55.0, 63.0, 91.0, 100.0, 110.0, 95.0, 73.0, 53.0, 48.0, 26.0, 29.0, 14.0, 16.0, 13.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.921875, -3.7911376953125, -3.660400390625, -3.5296630859375, -3.39892578125, -3.2681884765625, -3.137451171875, -3.0067138671875, -2.8759765625, -2.7452392578125, -2.614501953125, -2.4837646484375, -2.35302734375, -2.2222900390625, -2.091552734375, -1.9608154296875, -1.830078125, -1.6993408203125, -1.568603515625, -1.4378662109375, -1.30712890625, -1.1763916015625, -1.045654296875, -0.9149169921875, -0.7841796875, -0.6534423828125, -0.522705078125, -0.3919677734375, -0.26123046875, -0.1304931640625, 0.000244140625, 0.1309814453125, 0.26171875, 0.3924560546875, 0.523193359375, 0.6539306640625, 0.78466796875, 0.9154052734375, 1.046142578125, 1.1768798828125, 1.3076171875, 1.4383544921875, 1.569091796875, 1.6998291015625, 1.83056640625, 1.9613037109375, 2.092041015625, 2.2227783203125, 2.353515625, 2.4842529296875, 2.614990234375, 2.7457275390625, 2.87646484375, 3.0072021484375, 3.137939453125, 3.2686767578125, 3.3994140625, 3.5301513671875, 3.660888671875, 3.7916259765625, 3.92236328125, 4.0531005859375, 4.183837890625, 4.3145751953125, 4.4453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 15.0, 15.0, 19.0, 18.0, 40.0, 55.0, 65.0, 99.0, 116.0, 122.0, 103.0, 91.0, 64.0, 47.0, 32.0, 14.0, 13.0, 15.0, 7.0, 4.0, 5.0, 5.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.342247009277344, -46.25959777832031, -44.17695236206055, -42.094303131103516, -40.011653900146484, -37.92900848388672, -35.84635925292969, -33.763710021972656, -31.681062698364258, -29.59841537475586, -27.515766143798828, -25.43311882019043, -23.35047149658203, -21.267822265625, -19.1851749420166, -17.102527618408203, -15.019878387451172, -12.937230110168457, -10.854581832885742, -8.771934509277344, -6.689286231994629, -4.606637954711914, -2.5239906311035156, -0.4413423538208008, 1.641305923461914, 3.72395396232605, 5.8066020011901855, 7.889249801635742, 9.971898078918457, 12.054546356201172, 14.13719367980957, 16.21984100341797, 18.302490234375, 20.3851375579834, 22.46778678894043, 24.550434112548828, 26.63308334350586, 28.715730667114258, 30.798377990722656, 32.88102722167969, 34.96367645263672, 37.04632568359375, 39.128971099853516, 41.21162033081055, 43.29426956176758, 45.376914978027344, 47.459564208984375, 49.542213439941406, 51.62485885620117, 53.7075080871582, 55.79015350341797, 57.872802734375, 59.95545196533203, 62.03810119628906, 64.12074279785156, 66.2033920288086, 68.28604125976562, 70.36869049072266, 72.45133972167969, 74.53398132324219, 76.61663055419922, 78.69927978515625, 80.78192901611328, 82.86457824707031, 84.94722747802734]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 9.0, 9.0, 4.0, 12.0, 11.0, 9.0, 17.0, 17.0, 27.0, 17.0, 29.0, 29.0, 24.0, 36.0, 39.0, 39.0, 42.0, 41.0, 57.0, 47.0, 51.0, 58.0, 39.0, 47.0, 39.0, 34.0, 31.0, 18.0, 23.0, 23.0, 23.0, 13.0, 15.0, 10.0, 10.0, 13.0, 9.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.44706344604492, -58.39943313598633, -56.351802825927734, -54.30417251586914, -52.25654220581055, -50.20891189575195, -48.16128158569336, -46.113651275634766, -44.06602096557617, -42.01839065551758, -39.970760345458984, -37.92313003540039, -35.8754997253418, -33.8278694152832, -31.78023910522461, -29.732608795166016, -27.684978485107422, -25.637348175048828, -23.589717864990234, -21.54208755493164, -19.494457244873047, -17.446826934814453, -15.39919662475586, -13.351566314697266, -11.303936004638672, -9.256305694580078, -7.208675384521484, -5.161045074462891, -3.113414764404297, -1.0657844543457031, 0.9818458557128906, 3.0294761657714844, 5.0771026611328125, 7.124732971191406, 9.17236328125, 11.219993591308594, 13.267623901367188, 15.315254211425781, 17.362884521484375, 19.41051483154297, 21.458145141601562, 23.505775451660156, 25.55340576171875, 27.601036071777344, 29.648666381835938, 31.69629669189453, 33.743927001953125, 35.79155731201172, 37.83918762207031, 39.886817932128906, 41.9344482421875, 43.982078552246094, 46.02970886230469, 48.07733917236328, 50.124969482421875, 52.17259979248047, 54.22023010253906, 56.267860412597656, 58.31549072265625, 60.363121032714844, 62.41075134277344, 64.45838165283203, 66.50601196289062, 68.55364227294922, 70.60127258300781]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 8.0, 7.0, 15.0, 18.0, 25.0, 24.0, 47.0, 57.0, 80.0, 119.0, 162.0, 247.0, 416.0, 659.0, 1262.0, 3001.0, 11132.0, 4136965.0, 31471.0, 4517.0, 1794.0, 802.0, 504.0, 305.0, 193.0, 130.0, 89.0, 67.0, 37.0, 46.0, 16.0, 22.0, 15.0, 9.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.015625, -19.384033203125, -18.75244140625, -18.120849609375, -17.4892578125, -16.857666015625, -16.22607421875, -15.594482421875, -14.962890625, -14.331298828125, -13.69970703125, -13.068115234375, -12.4365234375, -11.804931640625, -11.17333984375, -10.541748046875, -9.91015625, -9.278564453125, -8.64697265625, -8.015380859375, -7.3837890625, -6.752197265625, -6.12060546875, -5.489013671875, -4.857421875, -4.225830078125, -3.59423828125, -2.962646484375, -2.3310546875, -1.699462890625, -1.06787109375, -0.436279296875, 0.1953125, 0.826904296875, 1.45849609375, 2.090087890625, 2.7216796875, 3.353271484375, 3.98486328125, 4.616455078125, 5.248046875, 5.879638671875, 6.51123046875, 7.142822265625, 7.7744140625, 8.406005859375, 9.03759765625, 9.669189453125, 10.30078125, 10.932373046875, 11.56396484375, 12.195556640625, 12.8271484375, 13.458740234375, 14.09033203125, 14.721923828125, 15.353515625, 15.985107421875, 16.61669921875, 17.248291015625, 17.8798828125, 18.511474609375, 19.14306640625, 19.774658203125, 20.40625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 15.0, 24.0, 22.0, 24.0, 38.0, 54.0, 45.0, 65.0, 73.0, 71.0, 78.0, 76.0, 64.0, 64.0, 43.0, 32.0, 33.0, 50.0, 22.0, 21.0, 12.0, 14.0, 10.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.09423828125, -2.9775390625, -2.86083984375, -2.744140625, -2.62744140625, -2.5107421875, -2.39404296875, -2.27734375, -2.16064453125, -2.0439453125, -1.92724609375, -1.810546875, -1.69384765625, -1.5771484375, -1.46044921875, -1.34375, -1.22705078125, -1.1103515625, -0.99365234375, -0.876953125, -0.76025390625, -0.6435546875, -0.52685546875, -0.41015625, -0.29345703125, -0.1767578125, -0.06005859375, 0.056640625, 0.17333984375, 0.2900390625, 0.40673828125, 0.5234375, 0.64013671875, 0.7568359375, 0.87353515625, 0.990234375, 1.10693359375, 1.2236328125, 1.34033203125, 1.45703125, 1.57373046875, 1.6904296875, 1.80712890625, 1.923828125, 2.04052734375, 2.1572265625, 2.27392578125, 2.390625, 2.50732421875, 2.6240234375, 2.74072265625, 2.857421875, 2.97412109375, 3.0908203125, 3.20751953125, 3.32421875, 3.44091796875, 3.5576171875, 3.67431640625, 3.791015625, 3.90771484375, 4.0244140625, 4.14111328125, 4.2578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 5.0, 10.0, 17.0, 15.0, 32.0, 43.0, 48.0, 60.0, 100.0, 172.0, 322.0, 579.0, 1061.0, 2234.0, 6123.0, 55768.0, 4109783.0, 11512.0, 3253.0, 1406.0, 687.0, 388.0, 259.0, 139.0, 63.0, 46.0, 33.0, 25.0, 24.0, 16.0, 9.0, 7.0, 6.0, 3.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.65625, -25.93994140625, -25.2236328125, -24.50732421875, -23.791015625, -23.07470703125, -22.3583984375, -21.64208984375, -20.92578125, -20.20947265625, -19.4931640625, -18.77685546875, -18.060546875, -17.34423828125, -16.6279296875, -15.91162109375, -15.1953125, -14.47900390625, -13.7626953125, -13.04638671875, -12.330078125, -11.61376953125, -10.8974609375, -10.18115234375, -9.46484375, -8.74853515625, -8.0322265625, -7.31591796875, -6.599609375, -5.88330078125, -5.1669921875, -4.45068359375, -3.734375, -3.01806640625, -2.3017578125, -1.58544921875, -0.869140625, -0.15283203125, 0.5634765625, 1.27978515625, 1.99609375, 2.71240234375, 3.4287109375, 4.14501953125, 4.861328125, 5.57763671875, 6.2939453125, 7.01025390625, 7.7265625, 8.44287109375, 9.1591796875, 9.87548828125, 10.591796875, 11.30810546875, 12.0244140625, 12.74072265625, 13.45703125, 14.17333984375, 14.8896484375, 15.60595703125, 16.322265625, 17.03857421875, 17.7548828125, 18.47119140625, 19.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 8.0, 14.0, 40.0, 228.0, 3700.0, 36.0, 11.0, 10.0, 5.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.11328125, -5.983673095703125, -5.85406494140625, -5.724456787109375, -5.5948486328125, -5.465240478515625, -5.33563232421875, -5.206024169921875, -5.076416015625, -4.946807861328125, -4.81719970703125, -4.687591552734375, -4.5579833984375, -4.428375244140625, -4.29876708984375, -4.169158935546875, -4.03955078125, -3.909942626953125, -3.78033447265625, -3.650726318359375, -3.5211181640625, -3.391510009765625, -3.26190185546875, -3.132293701171875, -3.002685546875, -2.873077392578125, -2.74346923828125, -2.613861083984375, -2.4842529296875, -2.354644775390625, -2.22503662109375, -2.095428466796875, -1.9658203125, -1.836212158203125, -1.70660400390625, -1.576995849609375, -1.4473876953125, -1.317779541015625, -1.18817138671875, -1.058563232421875, -0.928955078125, -0.799346923828125, -0.66973876953125, -0.540130615234375, -0.4105224609375, -0.280914306640625, -0.15130615234375, -0.021697998046875, 0.10791015625, 0.237518310546875, 0.36712646484375, 0.496734619140625, 0.6263427734375, 0.755950927734375, 0.88555908203125, 1.015167236328125, 1.144775390625, 1.274383544921875, 1.40399169921875, 1.533599853515625, 1.6632080078125, 1.792816162109375, 1.92242431640625, 2.052032470703125, 2.181640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 11.0, 25.0, 34.0, 55.0, 106.0, 176.0, 224.0, 202.0, 83.0, 53.0, 20.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.095752716064453, -23.56075096130371, -23.02574920654297, -22.49074935913086, -21.955747604370117, -21.420745849609375, -20.885744094848633, -20.35074234008789, -19.81574249267578, -19.28074073791504, -18.745738983154297, -18.210739135742188, -17.675737380981445, -17.140735626220703, -16.60573387145996, -16.07073211669922, -15.535731315612793, -15.00072956085205, -14.465728759765625, -13.930727005004883, -13.395726203918457, -12.860724449157715, -12.325723648071289, -11.790721893310547, -11.255720138549805, -10.720718383789062, -10.185717582702637, -9.650715827941895, -9.115715026855469, -8.580713272094727, -8.045711517333984, -7.510710716247559, -6.975710868835449, -6.440709590911865, -5.905708312988281, -5.370706558227539, -4.835705757141113, -4.300704002380371, -3.765702724456787, -3.230701446533203, -2.695700168609619, -2.160698890686035, -1.6256974935531616, -1.090696096420288, -0.5556948184967041, -0.020693540573120117, 0.514307975769043, 1.049309253692627, 1.584310531616211, 2.119311809539795, 2.654313087463379, 3.189314603805542, 3.724315881729126, 4.259317398071289, 4.794318675994873, 5.329319953918457, 5.864321231842041, 6.399322509765625, 6.934323787689209, 7.469325065612793, 8.004326820373535, 8.539327621459961, 9.074329376220703, 9.609331130981445, 10.144331932067871]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 20.0, 15.0, 24.0, 26.0, 27.0, 18.0, 31.0, 21.0, 45.0, 27.0, 41.0, 34.0, 35.0, 39.0, 45.0, 39.0, 34.0, 36.0, 44.0, 35.0, 34.0, 33.0, 22.0, 34.0, 26.0, 22.0, 20.0, 20.0, 26.0, 12.0, 10.0, 12.0, 10.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5264129638671875, -5.336819171905518, -5.147225379943848, -4.957631587982178, -4.768037796020508, -4.578444480895996, -4.388850688934326, -4.199256896972656, -4.009663105010986, -3.8200693130493164, -3.6304755210876465, -3.4408819675445557, -3.2512881755828857, -3.061694383621216, -2.872100830078125, -2.682507038116455, -2.492913246154785, -2.3033194541931152, -2.1137256622314453, -1.9241321086883545, -1.7345383167266846, -1.5449445247650146, -1.3553508520126343, -1.165757179260254, -0.976163387298584, -0.7865696549415588, -0.5969759225845337, -0.40738219022750854, -0.2177884578704834, -0.028194725513458252, 0.1613990068435669, 0.35099267959594727, 0.5405864715576172, 0.7301802039146423, 0.9197739362716675, 1.1093676090240479, 1.2989614009857178, 1.4885551929473877, 1.678148865699768, 1.8677425384521484, 2.0573363304138184, 2.2469301223754883, 2.436523914337158, 2.626117467880249, 2.815711259841919, 3.005305051803589, 3.1948986053466797, 3.3844923973083496, 3.5740861892700195, 3.7636799812316895, 3.9532737731933594, 4.142867565155029, 4.332461357116699, 4.522054672241211, 4.711648464202881, 4.901242256164551, 5.090836048126221, 5.280429840087891, 5.4700236320495605, 5.6596174240112305, 5.849210739135742, 6.038804531097412, 6.228398323059082, 6.417992115020752, 6.607585906982422]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 9.0, 5.0, 15.0, 20.0, 26.0, 40.0, 54.0, 107.0, 133.0, 221.0, 419.0, 646.0, 1168.0, 2096.0, 3986.0, 7625.0, 16783.0, 39497.0, 110119.0, 354460.0, 337132.0, 103938.0, 37575.0, 16159.0, 7656.0, 3804.0, 2065.0, 1112.0, 635.0, 374.0, 243.0, 158.0, 99.0, 77.0, 35.0, 25.0, 14.0, 8.0, 4.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.60186767578125, -7.3092041015625, -7.01654052734375, -6.723876953125, -6.43121337890625, -6.1385498046875, -5.84588623046875, -5.55322265625, -5.26055908203125, -4.9678955078125, -4.67523193359375, -4.382568359375, -4.08990478515625, -3.7972412109375, -3.50457763671875, -3.2119140625, -2.91925048828125, -2.6265869140625, -2.33392333984375, -2.041259765625, -1.74859619140625, -1.4559326171875, -1.16326904296875, -0.87060546875, -0.57794189453125, -0.2852783203125, 0.00738525390625, 0.300048828125, 0.59271240234375, 0.8853759765625, 1.17803955078125, 1.470703125, 1.76336669921875, 2.0560302734375, 2.34869384765625, 2.641357421875, 2.93402099609375, 3.2266845703125, 3.51934814453125, 3.81201171875, 4.10467529296875, 4.3973388671875, 4.69000244140625, 4.982666015625, 5.27532958984375, 5.5679931640625, 5.86065673828125, 6.1533203125, 6.44598388671875, 6.7386474609375, 7.03131103515625, 7.323974609375, 7.61663818359375, 7.9093017578125, 8.20196533203125, 8.49462890625, 8.78729248046875, 9.0799560546875, 9.37261962890625, 9.665283203125, 9.95794677734375, 10.2506103515625, 10.54327392578125, 10.8359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 12.0, 13.0, 20.0, 25.0, 20.0, 39.0, 38.0, 66.0, 56.0, 77.0, 74.0, 72.0, 76.0, 66.0, 58.0, 47.0, 39.0, 42.0, 26.0, 34.0, 22.0, 13.0, 12.0, 10.0, 11.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.18096923828125, -3.0611572265625, -2.94134521484375, -2.821533203125, -2.70172119140625, -2.5819091796875, -2.46209716796875, -2.34228515625, -2.22247314453125, -2.1026611328125, -1.98284912109375, -1.863037109375, -1.74322509765625, -1.6234130859375, -1.50360107421875, -1.3837890625, -1.26397705078125, -1.1441650390625, -1.02435302734375, -0.904541015625, -0.78472900390625, -0.6649169921875, -0.54510498046875, -0.42529296875, -0.30548095703125, -0.1856689453125, -0.06585693359375, 0.053955078125, 0.17376708984375, 0.2935791015625, 0.41339111328125, 0.533203125, 0.65301513671875, 0.7728271484375, 0.89263916015625, 1.012451171875, 1.13226318359375, 1.2520751953125, 1.37188720703125, 1.49169921875, 1.61151123046875, 1.7313232421875, 1.85113525390625, 1.970947265625, 2.09075927734375, 2.2105712890625, 2.33038330078125, 2.4501953125, 2.57000732421875, 2.6898193359375, 2.80963134765625, 2.929443359375, 3.04925537109375, 3.1690673828125, 3.28887939453125, 3.40869140625, 3.52850341796875, 3.6483154296875, 3.76812744140625, 3.887939453125, 4.00775146484375, 4.1275634765625, 4.24737548828125, 4.3671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 11.0, 18.0, 24.0, 45.0, 37.0, 67.0, 87.0, 124.0, 211.0, 355.0, 650.0, 1151.0, 2346.0, 5335.0, 13511.0, 40259.0, 188169.0, 612403.0, 131788.0, 31884.0, 10895.0, 4505.0, 2076.0, 1014.0, 563.0, 342.0, 205.0, 135.0, 88.0, 63.0, 49.0, 38.0, 27.0, 21.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.294189453125, -14.80712890625, -14.320068359375, -13.8330078125, -13.345947265625, -12.85888671875, -12.371826171875, -11.884765625, -11.397705078125, -10.91064453125, -10.423583984375, -9.9365234375, -9.449462890625, -8.96240234375, -8.475341796875, -7.98828125, -7.501220703125, -7.01416015625, -6.527099609375, -6.0400390625, -5.552978515625, -5.06591796875, -4.578857421875, -4.091796875, -3.604736328125, -3.11767578125, -2.630615234375, -2.1435546875, -1.656494140625, -1.16943359375, -0.682373046875, -0.1953125, 0.291748046875, 0.77880859375, 1.265869140625, 1.7529296875, 2.239990234375, 2.72705078125, 3.214111328125, 3.701171875, 4.188232421875, 4.67529296875, 5.162353515625, 5.6494140625, 6.136474609375, 6.62353515625, 7.110595703125, 7.59765625, 8.084716796875, 8.57177734375, 9.058837890625, 9.5458984375, 10.032958984375, 10.52001953125, 11.007080078125, 11.494140625, 11.981201171875, 12.46826171875, 12.955322265625, 13.4423828125, 13.929443359375, 14.41650390625, 14.903564453125, 15.390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 10.0, 10.0, 12.0, 13.0, 15.0, 21.0, 18.0, 22.0, 35.0, 20.0, 35.0, 46.0, 42.0, 56.0, 66.0, 42.0, 56.0, 54.0, 51.0, 45.0, 54.0, 33.0, 37.0, 36.0, 26.0, 21.0, 26.0, 18.0, 14.0, 8.0, 16.0, 15.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.50341796875, -16.9130859375, -16.32275390625, -15.732421875, -15.14208984375, -14.5517578125, -13.96142578125, -13.37109375, -12.78076171875, -12.1904296875, -11.60009765625, -11.009765625, -10.41943359375, -9.8291015625, -9.23876953125, -8.6484375, -8.05810546875, -7.4677734375, -6.87744140625, -6.287109375, -5.69677734375, -5.1064453125, -4.51611328125, -3.92578125, -3.33544921875, -2.7451171875, -2.15478515625, -1.564453125, -0.97412109375, -0.3837890625, 0.20654296875, 0.796875, 1.38720703125, 1.9775390625, 2.56787109375, 3.158203125, 3.74853515625, 4.3388671875, 4.92919921875, 5.51953125, 6.10986328125, 6.7001953125, 7.29052734375, 7.880859375, 8.47119140625, 9.0615234375, 9.65185546875, 10.2421875, 10.83251953125, 11.4228515625, 12.01318359375, 12.603515625, 13.19384765625, 13.7841796875, 14.37451171875, 14.96484375, 15.55517578125, 16.1455078125, 16.73583984375, 17.326171875, 17.91650390625, 18.5068359375, 19.09716796875, 19.6875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 20.0, 25.0, 36.0, 54.0, 84.0, 153.0, 206.0, 353.0, 752.0, 1568.0, 4050.0, 14806.0, 122324.0, 837333.0, 51955.0, 9307.0, 2943.0, 1210.0, 558.0, 330.0, 182.0, 100.0, 79.0, 35.0, 29.0, 20.0, 14.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4853515625, -11.080078125, -10.6748046875, -10.26953125, -9.8642578125, -9.458984375, -9.0537109375, -8.6484375, -8.2431640625, -7.837890625, -7.4326171875, -7.02734375, -6.6220703125, -6.216796875, -5.8115234375, -5.40625, -5.0009765625, -4.595703125, -4.1904296875, -3.78515625, -3.3798828125, -2.974609375, -2.5693359375, -2.1640625, -1.7587890625, -1.353515625, -0.9482421875, -0.54296875, -0.1376953125, 0.267578125, 0.6728515625, 1.078125, 1.4833984375, 1.888671875, 2.2939453125, 2.69921875, 3.1044921875, 3.509765625, 3.9150390625, 4.3203125, 4.7255859375, 5.130859375, 5.5361328125, 5.94140625, 6.3466796875, 6.751953125, 7.1572265625, 7.5625, 7.9677734375, 8.373046875, 8.7783203125, 9.18359375, 9.5888671875, 9.994140625, 10.3994140625, 10.8046875, 11.2099609375, 11.615234375, 12.0205078125, 12.42578125, 12.8310546875, 13.236328125, 13.6416015625, 14.046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 4.0, 7.0, 7.0, 15.0, 30.0, 37.0, 49.0, 90.0, 167.0, 170.0, 148.0, 96.0, 59.0, 37.0, 21.0, 12.0, 7.0, 12.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001209259033203125, -0.0011729598045349121, -0.0011366605758666992, -0.0011003613471984863, -0.0010640621185302734, -0.0010277628898620605, -0.0009914636611938477, -0.0009551644325256348, -0.0009188652038574219, -0.000882565975189209, -0.0008462667465209961, -0.0008099675178527832, -0.0007736682891845703, -0.0007373690605163574, -0.0007010698318481445, -0.0006647706031799316, -0.0006284713745117188, -0.0005921721458435059, -0.000555872917175293, -0.0005195736885070801, -0.0004832744598388672, -0.0004469752311706543, -0.0004106760025024414, -0.0003743767738342285, -0.0003380775451660156, -0.00030177831649780273, -0.00026547908782958984, -0.00022917985916137695, -0.00019288063049316406, -0.00015658140182495117, -0.00012028217315673828, -8.398294448852539e-05, -4.76837158203125e-05, -1.138448715209961e-05, 2.491474151611328e-05, 6.121397018432617e-05, 9.751319885253906e-05, 0.00013381242752075195, 0.00017011165618896484, 0.00020641088485717773, 0.00024271011352539062, 0.0002790093421936035, 0.0003153085708618164, 0.0003516077995300293, 0.0003879070281982422, 0.0004242062568664551, 0.00046050548553466797, 0.0004968047142028809, 0.0005331039428710938, 0.0005694031715393066, 0.0006057024002075195, 0.0006420016288757324, 0.0006783008575439453, 0.0007146000862121582, 0.0007508993148803711, 0.000787198543548584, 0.0008234977722167969, 0.0008597970008850098, 0.0008960962295532227, 0.0009323954582214355, 0.0009686946868896484, 0.0010049939155578613, 0.0010412931442260742, 0.0010775923728942871, 0.0011138916015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 7.0, 12.0, 16.0, 15.0, 25.0, 29.0, 46.0, 71.0, 140.0, 199.0, 363.0, 710.0, 1648.0, 4599.0, 16711.0, 150058.0, 800964.0, 57410.0, 9895.0, 3068.0, 1220.0, 545.0, 289.0, 187.0, 111.0, 53.0, 47.0, 28.0, 22.0, 24.0, 11.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.671875, -10.3697509765625, -10.067626953125, -9.7655029296875, -9.46337890625, -9.1612548828125, -8.859130859375, -8.5570068359375, -8.2548828125, -7.9527587890625, -7.650634765625, -7.3485107421875, -7.04638671875, -6.7442626953125, -6.442138671875, -6.1400146484375, -5.837890625, -5.5357666015625, -5.233642578125, -4.9315185546875, -4.62939453125, -4.3272705078125, -4.025146484375, -3.7230224609375, -3.4208984375, -3.1187744140625, -2.816650390625, -2.5145263671875, -2.21240234375, -1.9102783203125, -1.608154296875, -1.3060302734375, -1.00390625, -0.7017822265625, -0.399658203125, -0.0975341796875, 0.20458984375, 0.5067138671875, 0.808837890625, 1.1109619140625, 1.4130859375, 1.7152099609375, 2.017333984375, 2.3194580078125, 2.62158203125, 2.9237060546875, 3.225830078125, 3.5279541015625, 3.830078125, 4.1322021484375, 4.434326171875, 4.7364501953125, 5.03857421875, 5.3406982421875, 5.642822265625, 5.9449462890625, 6.2470703125, 6.5491943359375, 6.851318359375, 7.1534423828125, 7.45556640625, 7.7576904296875, 8.059814453125, 8.3619384765625, 8.6640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 19.0, 18.0, 31.0, 42.0, 66.0, 134.0, 159.0, 161.0, 119.0, 79.0, 45.0, 23.0, 16.0, 14.0, 8.0, 5.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.07080078125, -10.7119140625, -10.35302734375, -9.994140625, -9.63525390625, -9.2763671875, -8.91748046875, -8.55859375, -8.19970703125, -7.8408203125, -7.48193359375, -7.123046875, -6.76416015625, -6.4052734375, -6.04638671875, -5.6875, -5.32861328125, -4.9697265625, -4.61083984375, -4.251953125, -3.89306640625, -3.5341796875, -3.17529296875, -2.81640625, -2.45751953125, -2.0986328125, -1.73974609375, -1.380859375, -1.02197265625, -0.6630859375, -0.30419921875, 0.0546875, 0.41357421875, 0.7724609375, 1.13134765625, 1.490234375, 1.84912109375, 2.2080078125, 2.56689453125, 2.92578125, 3.28466796875, 3.6435546875, 4.00244140625, 4.361328125, 4.72021484375, 5.0791015625, 5.43798828125, 5.796875, 6.15576171875, 6.5146484375, 6.87353515625, 7.232421875, 7.59130859375, 7.9501953125, 8.30908203125, 8.66796875, 9.02685546875, 9.3857421875, 9.74462890625, 10.103515625, 10.46240234375, 10.8212890625, 11.18017578125, 11.5390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 13.0, 12.0, 23.0, 28.0, 38.0, 72.0, 126.0, 171.0, 174.0, 125.0, 84.0, 61.0, 29.0, 14.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.21603393554688, -70.16384887695312, -65.11165618896484, -60.05946731567383, -55.00727844238281, -49.9550895690918, -44.90290069580078, -39.850711822509766, -34.79852294921875, -29.746334075927734, -24.69414520263672, -19.641956329345703, -14.589767456054688, -9.537578582763672, -4.485389709472656, 0.5667991638183594, 5.618988037109375, 10.67117691040039, 15.723365783691406, 20.775554656982422, 25.827743530273438, 30.879932403564453, 35.93212127685547, 40.984310150146484, 46.0364990234375, 51.088687896728516, 56.14087677001953, 61.19306564331055, 66.24525451660156, 71.29743957519531, 76.3496322631836, 81.40182495117188, 86.45399475097656, 91.50617980957031, 96.5583724975586, 101.61056518554688, 106.66275024414062, 111.71493530273438, 116.76712799072266, 121.81932067871094, 126.87150573730469, 131.92369079589844, 136.97589111328125, 142.028076171875, 147.08026123046875, 152.1324462890625, 157.18463134765625, 162.23683166503906, 167.2890167236328, 172.34120178222656, 177.39340209960938, 182.44558715820312, 187.49777221679688, 192.54995727539062, 197.60214233398438, 202.6543426513672, 207.70652770996094, 212.7587127685547, 217.8109130859375, 222.86309814453125, 227.915283203125, 232.96746826171875, 238.0196533203125, 243.0718536376953, 248.12403869628906]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 11.0, 6.0, 19.0, 5.0, 20.0, 21.0, 29.0, 29.0, 44.0, 57.0, 52.0, 57.0, 66.0, 79.0, 67.0, 77.0, 58.0, 49.0, 38.0, 35.0, 30.0, 30.0, 21.0, 17.0, 14.0, 12.0, 6.0, 10.0, 11.0, 8.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-104.96003723144531, -101.78387451171875, -98.60770416259766, -95.43153381347656, -92.25537109375, -89.07920837402344, -85.90303802490234, -82.72686767578125, -79.55070495605469, -76.37454223632812, -73.19837188720703, -70.02220153808594, -66.84603881835938, -63.66987228393555, -60.49370574951172, -57.31753921508789, -54.14137268066406, -50.965206146240234, -47.789039611816406, -44.61287307739258, -41.43670654296875, -38.26054000854492, -35.084373474121094, -31.908206939697266, -28.732040405273438, -25.55587387084961, -22.37970733642578, -19.203540802001953, -16.027374267578125, -12.851207733154297, -9.675041198730469, -6.498874664306641, -3.3227005004882812, -0.14653396606445312, 3.029632568359375, 6.205799102783203, 9.381965637207031, 12.55813217163086, 15.734298706054688, 18.910465240478516, 22.086631774902344, 25.262798309326172, 28.43896484375, 31.615131378173828, 34.791297912597656, 37.967464447021484, 41.14363098144531, 44.31979751586914, 47.49596405029297, 50.6721305847168, 53.848297119140625, 57.02446365356445, 60.20063018798828, 63.37679672241211, 66.55296325683594, 69.7291259765625, 72.9052963256836, 76.08146667480469, 79.25762939453125, 82.43379211425781, 85.6099624633789, 88.7861328125, 91.96229553222656, 95.13845825195312, 98.31462860107422]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 4.0, 2.0, 3.0, 6.0, 6.0, 11.0, 16.0, 22.0, 24.0, 28.0, 21.0, 48.0, 67.0, 89.0, 147.0, 201.0, 318.0, 543.0, 877.0, 1721.0, 3927.0, 13676.0, 4106130.0, 53724.0, 7000.0, 2649.0, 1256.0, 683.0, 405.0, 230.0, 157.0, 90.0, 61.0, 36.0, 23.0, 25.0, 16.0, 9.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.5625, -31.72216796875, -30.8818359375, -30.04150390625, -29.201171875, -28.36083984375, -27.5205078125, -26.68017578125, -25.83984375, -24.99951171875, -24.1591796875, -23.31884765625, -22.478515625, -21.63818359375, -20.7978515625, -19.95751953125, -19.1171875, -18.27685546875, -17.4365234375, -16.59619140625, -15.755859375, -14.91552734375, -14.0751953125, -13.23486328125, -12.39453125, -11.55419921875, -10.7138671875, -9.87353515625, -9.033203125, -8.19287109375, -7.3525390625, -6.51220703125, -5.671875, -4.83154296875, -3.9912109375, -3.15087890625, -2.310546875, -1.47021484375, -0.6298828125, 0.21044921875, 1.05078125, 1.89111328125, 2.7314453125, 3.57177734375, 4.412109375, 5.25244140625, 6.0927734375, 6.93310546875, 7.7734375, 8.61376953125, 9.4541015625, 10.29443359375, 11.134765625, 11.97509765625, 12.8154296875, 13.65576171875, 14.49609375, 15.33642578125, 16.1767578125, 17.01708984375, 17.857421875, 18.69775390625, 19.5380859375, 20.37841796875, 21.21875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 7.0, 4.0, 8.0, 10.0, 12.0, 12.0, 16.0, 26.0, 36.0, 46.0, 49.0, 52.0, 54.0, 82.0, 66.0, 70.0, 82.0, 58.0, 58.0, 38.0, 41.0, 35.0, 35.0, 17.0, 13.0, 16.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.048095703125, -3.91259765625, -3.777099609375, -3.6416015625, -3.506103515625, -3.37060546875, -3.235107421875, -3.099609375, -2.964111328125, -2.82861328125, -2.693115234375, -2.5576171875, -2.422119140625, -2.28662109375, -2.151123046875, -2.015625, -1.880126953125, -1.74462890625, -1.609130859375, -1.4736328125, -1.338134765625, -1.20263671875, -1.067138671875, -0.931640625, -0.796142578125, -0.66064453125, -0.525146484375, -0.3896484375, -0.254150390625, -0.11865234375, 0.016845703125, 0.15234375, 0.287841796875, 0.42333984375, 0.558837890625, 0.6943359375, 0.829833984375, 0.96533203125, 1.100830078125, 1.236328125, 1.371826171875, 1.50732421875, 1.642822265625, 1.7783203125, 1.913818359375, 2.04931640625, 2.184814453125, 2.3203125, 2.455810546875, 2.59130859375, 2.726806640625, 2.8623046875, 2.997802734375, 3.13330078125, 3.268798828125, 3.404296875, 3.539794921875, 3.67529296875, 3.810791015625, 3.9462890625, 4.081787109375, 4.21728515625, 4.352783203125, 4.48828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 7.0, 18.0, 18.0, 25.0, 40.0, 33.0, 58.0, 70.0, 60.0, 92.0, 148.0, 181.0, 234.0, 370.0, 466.0, 728.0, 1084.0, 1732.0, 2822.0, 5112.0, 10057.0, 24703.0, 3546364.0, 554011.0, 22768.0, 9845.0, 5097.0, 2885.0, 1658.0, 1040.0, 732.0, 501.0, 323.0, 229.0, 164.0, 127.0, 108.0, 74.0, 71.0, 55.0, 35.0, 37.0, 31.0, 15.0, 15.0, 5.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.265625, -19.6318359375, -18.998046875, -18.3642578125, -17.73046875, -17.0966796875, -16.462890625, -15.8291015625, -15.1953125, -14.5615234375, -13.927734375, -13.2939453125, -12.66015625, -12.0263671875, -11.392578125, -10.7587890625, -10.125, -9.4912109375, -8.857421875, -8.2236328125, -7.58984375, -6.9560546875, -6.322265625, -5.6884765625, -5.0546875, -4.4208984375, -3.787109375, -3.1533203125, -2.51953125, -1.8857421875, -1.251953125, -0.6181640625, 0.015625, 0.6494140625, 1.283203125, 1.9169921875, 2.55078125, 3.1845703125, 3.818359375, 4.4521484375, 5.0859375, 5.7197265625, 6.353515625, 6.9873046875, 7.62109375, 8.2548828125, 8.888671875, 9.5224609375, 10.15625, 10.7900390625, 11.423828125, 12.0576171875, 12.69140625, 13.3251953125, 13.958984375, 14.5927734375, 15.2265625, 15.8603515625, 16.494140625, 17.1279296875, 17.76171875, 18.3955078125, 19.029296875, 19.6630859375, 20.296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 16.0, 6.0, 12.0, 45.0, 223.0, 3526.0, 116.0, 28.0, 17.0, 9.0, 15.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.31640625, -7.1036376953125, -6.890869140625, -6.6781005859375, -6.46533203125, -6.2525634765625, -6.039794921875, -5.8270263671875, -5.6142578125, -5.4014892578125, -5.188720703125, -4.9759521484375, -4.76318359375, -4.5504150390625, -4.337646484375, -4.1248779296875, -3.912109375, -3.6993408203125, -3.486572265625, -3.2738037109375, -3.06103515625, -2.8482666015625, -2.635498046875, -2.4227294921875, -2.2099609375, -1.9971923828125, -1.784423828125, -1.5716552734375, -1.35888671875, -1.1461181640625, -0.933349609375, -0.7205810546875, -0.5078125, -0.2950439453125, -0.082275390625, 0.1304931640625, 0.34326171875, 0.5560302734375, 0.768798828125, 0.9815673828125, 1.1943359375, 1.4071044921875, 1.619873046875, 1.8326416015625, 2.04541015625, 2.2581787109375, 2.470947265625, 2.6837158203125, 2.896484375, 3.1092529296875, 3.322021484375, 3.5347900390625, 3.74755859375, 3.9603271484375, 4.173095703125, 4.3858642578125, 4.5986328125, 4.8114013671875, 5.024169921875, 5.2369384765625, 5.44970703125, 5.6624755859375, 5.875244140625, 6.0880126953125, 6.30078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 11.0, 11.0, 13.0, 29.0, 62.0, 84.0, 118.0, 167.0, 151.0, 145.0, 71.0, 60.0, 34.0, 21.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.697967529296875, -42.713932037353516, -41.72990036010742, -40.74586486816406, -39.7618293762207, -38.77779769897461, -37.79376220703125, -36.809730529785156, -35.8256950378418, -34.84165954589844, -33.857627868652344, -32.873592376708984, -31.889558792114258, -30.90552520751953, -29.921489715576172, -28.937456130981445, -27.95342254638672, -26.969388961791992, -25.985353469848633, -25.001319885253906, -24.01728630065918, -23.033252716064453, -22.049217224121094, -21.065183639526367, -20.081148147583008, -19.09711456298828, -18.113079071044922, -17.129045486450195, -16.14501190185547, -15.160977363586426, -14.176942825317383, -13.192909240722656, -12.20887565612793, -11.224841117858887, -10.24080753326416, -9.256772994995117, -8.27273941040039, -7.288704872131348, -6.304670810699463, -5.320636749267578, -4.336602687835693, -3.3525686264038086, -2.368534564971924, -1.38450026512146, -0.4004662036895752, 0.5835680961608887, 1.5676021575927734, 2.551636219024658, 3.535670280456543, 4.519704341888428, 5.5037384033203125, 6.4877729415893555, 7.471806526184082, 8.455841064453125, 9.439874649047852, 10.423909187316895, 11.407943725585938, 12.39197826385498, 13.376011848449707, 14.36004638671875, 15.344079971313477, 16.328113555908203, 17.312149047851562, 18.29618263244629, 19.280216217041016]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 10.0, 11.0, 14.0, 18.0, 14.0, 13.0, 30.0, 22.0, 26.0, 21.0, 34.0, 36.0, 32.0, 40.0, 46.0, 51.0, 38.0, 55.0, 42.0, 51.0, 53.0, 38.0, 28.0, 26.0, 36.0, 25.0, 33.0, 22.0, 14.0, 22.0, 13.0, 10.0, 9.0, 12.0, 4.0, 6.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.77127742767334, -14.33841323852539, -13.905550003051758, -13.472685813903809, -13.03982162475586, -12.606958389282227, -12.174094200134277, -11.741230010986328, -11.308366775512695, -10.875502586364746, -10.442639350891113, -10.009775161743164, -9.576910972595215, -9.144046783447266, -8.711183547973633, -8.278319358825684, -7.845455169677734, -7.412591457366943, -6.979727268218994, -6.546863555908203, -6.113999366760254, -5.681135654449463, -5.248271942138672, -4.815407752990723, -4.382544040679932, -3.9496800899505615, -3.5168161392211914, -3.0839524269104004, -2.6510884761810303, -2.21822452545166, -1.7853608131408691, -1.352496862411499, -0.9196319580078125, -0.48676806688308716, -0.053904175758361816, 0.37895965576171875, 0.8118236064910889, 1.244687557220459, 1.67755126953125, 2.11041522026062, 2.5432791709899902, 2.9761431217193604, 3.4090070724487305, 3.8418707847595215, 4.2747344970703125, 4.707598686218262, 5.140462398529053, 5.573326110839844, 6.006190299987793, 6.439054012298584, 6.871918201446533, 7.304781913757324, 7.737646102905273, 8.170509338378906, 8.603373527526855, 9.036237716674805, 9.469100952148438, 9.901965141296387, 10.33482837677002, 10.767692565917969, 11.200556755065918, 11.633420944213867, 12.0662841796875, 12.49914836883545, 12.932012557983398]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 4.0, 10.0, 14.0, 23.0, 36.0, 46.0, 68.0, 102.0, 109.0, 138.0, 218.0, 273.0, 432.0, 640.0, 1065.0, 1800.0, 3115.0, 5864.0, 11952.0, 27123.0, 71720.0, 226178.0, 419859.0, 176193.0, 57022.0, 22134.0, 10208.0, 5064.0, 2709.0, 1528.0, 954.0, 629.0, 392.0, 287.0, 191.0, 122.0, 92.0, 59.0, 49.0, 31.0, 19.0, 23.0, 20.0, 10.0, 8.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.01324462890625, -6.7257080078125, -6.43817138671875, -6.150634765625, -5.86309814453125, -5.5755615234375, -5.28802490234375, -5.00048828125, -4.71295166015625, -4.4254150390625, -4.13787841796875, -3.850341796875, -3.56280517578125, -3.2752685546875, -2.98773193359375, -2.7001953125, -2.41265869140625, -2.1251220703125, -1.83758544921875, -1.550048828125, -1.26251220703125, -0.9749755859375, -0.68743896484375, -0.39990234375, -0.11236572265625, 0.1751708984375, 0.46270751953125, 0.750244140625, 1.03778076171875, 1.3253173828125, 1.61285400390625, 1.900390625, 2.18792724609375, 2.4754638671875, 2.76300048828125, 3.050537109375, 3.33807373046875, 3.6256103515625, 3.91314697265625, 4.20068359375, 4.48822021484375, 4.7757568359375, 5.06329345703125, 5.350830078125, 5.63836669921875, 5.9259033203125, 6.21343994140625, 6.5009765625, 6.78851318359375, 7.0760498046875, 7.36358642578125, 7.651123046875, 7.93865966796875, 8.2261962890625, 8.51373291015625, 8.80126953125, 9.08880615234375, 9.3763427734375, 9.66387939453125, 9.951416015625, 10.23895263671875, 10.5264892578125, 10.81402587890625, 11.1015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 16.0, 19.0, 11.0, 28.0, 33.0, 39.0, 44.0, 60.0, 46.0, 50.0, 49.0, 56.0, 65.0, 48.0, 50.0, 64.0, 46.0, 44.0, 44.0, 21.0, 27.0, 17.0, 11.0, 7.0, 10.0, 13.0, 7.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.71075439453125, -3.5816650390625, -3.45257568359375, -3.323486328125, -3.19439697265625, -3.0653076171875, -2.93621826171875, -2.80712890625, -2.67803955078125, -2.5489501953125, -2.41986083984375, -2.290771484375, -2.16168212890625, -2.0325927734375, -1.90350341796875, -1.7744140625, -1.64532470703125, -1.5162353515625, -1.38714599609375, -1.258056640625, -1.12896728515625, -0.9998779296875, -0.87078857421875, -0.74169921875, -0.61260986328125, -0.4835205078125, -0.35443115234375, -0.225341796875, -0.09625244140625, 0.0328369140625, 0.16192626953125, 0.291015625, 0.42010498046875, 0.5491943359375, 0.67828369140625, 0.807373046875, 0.93646240234375, 1.0655517578125, 1.19464111328125, 1.32373046875, 1.45281982421875, 1.5819091796875, 1.71099853515625, 1.840087890625, 1.96917724609375, 2.0982666015625, 2.22735595703125, 2.3564453125, 2.48553466796875, 2.6146240234375, 2.74371337890625, 2.872802734375, 3.00189208984375, 3.1309814453125, 3.26007080078125, 3.38916015625, 3.51824951171875, 3.6473388671875, 3.77642822265625, 3.905517578125, 4.03460693359375, 4.1636962890625, 4.29278564453125, 4.421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 1.0, 7.0, 10.0, 18.0, 23.0, 34.0, 62.0, 93.0, 218.0, 416.0, 1122.0, 3464.0, 19165.0, 366662.0, 624335.0, 26346.0, 4336.0, 1207.0, 499.0, 217.0, 123.0, 64.0, 37.0, 21.0, 21.0, 21.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -26.941162109375, -25.86669921875, -24.792236328125, -23.7177734375, -22.643310546875, -21.56884765625, -20.494384765625, -19.419921875, -18.345458984375, -17.27099609375, -16.196533203125, -15.1220703125, -14.047607421875, -12.97314453125, -11.898681640625, -10.82421875, -9.749755859375, -8.67529296875, -7.600830078125, -6.5263671875, -5.451904296875, -4.37744140625, -3.302978515625, -2.228515625, -1.154052734375, -0.07958984375, 0.994873046875, 2.0693359375, 3.143798828125, 4.21826171875, 5.292724609375, 6.3671875, 7.441650390625, 8.51611328125, 9.590576171875, 10.6650390625, 11.739501953125, 12.81396484375, 13.888427734375, 14.962890625, 16.037353515625, 17.11181640625, 18.186279296875, 19.2607421875, 20.335205078125, 21.40966796875, 22.484130859375, 23.55859375, 24.633056640625, 25.70751953125, 26.781982421875, 27.8564453125, 28.930908203125, 30.00537109375, 31.079833984375, 32.154296875, 33.228759765625, 34.30322265625, 35.377685546875, 36.4521484375, 37.526611328125, 38.60107421875, 39.675537109375, 40.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 8.0, 10.0, 17.0, 20.0, 13.0, 40.0, 50.0, 44.0, 48.0, 54.0, 64.0, 63.0, 62.0, 45.0, 69.0, 58.0, 41.0, 54.0, 41.0, 35.0, 23.0, 21.0, 16.0, 17.0, 18.0, 10.0, 6.0, 8.0, 9.0, 0.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.8388671875, -20.990234375, -20.1416015625, -19.29296875, -18.4443359375, -17.595703125, -16.7470703125, -15.8984375, -15.0498046875, -14.201171875, -13.3525390625, -12.50390625, -11.6552734375, -10.806640625, -9.9580078125, -9.109375, -8.2607421875, -7.412109375, -6.5634765625, -5.71484375, -4.8662109375, -4.017578125, -3.1689453125, -2.3203125, -1.4716796875, -0.623046875, 0.2255859375, 1.07421875, 1.9228515625, 2.771484375, 3.6201171875, 4.46875, 5.3173828125, 6.166015625, 7.0146484375, 7.86328125, 8.7119140625, 9.560546875, 10.4091796875, 11.2578125, 12.1064453125, 12.955078125, 13.8037109375, 14.65234375, 15.5009765625, 16.349609375, 17.1982421875, 18.046875, 18.8955078125, 19.744140625, 20.5927734375, 21.44140625, 22.2900390625, 23.138671875, 23.9873046875, 24.8359375, 25.6845703125, 26.533203125, 27.3818359375, 28.23046875, 29.0791015625, 29.927734375, 30.7763671875, 31.625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 9.0, 20.0, 25.0, 44.0, 61.0, 92.0, 174.0, 308.0, 690.0, 1977.0, 8953.0, 110569.0, 889094.0, 29881.0, 4290.0, 1211.0, 489.0, 238.0, 131.0, 55.0, 47.0, 38.0, 26.0, 30.0, 12.0, 6.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.125, -27.3046875, -26.484375, -25.6640625, -24.84375, -24.0234375, -23.203125, -22.3828125, -21.5625, -20.7421875, -19.921875, -19.1015625, -18.28125, -17.4609375, -16.640625, -15.8203125, -15.0, -14.1796875, -13.359375, -12.5390625, -11.71875, -10.8984375, -10.078125, -9.2578125, -8.4375, -7.6171875, -6.796875, -5.9765625, -5.15625, -4.3359375, -3.515625, -2.6953125, -1.875, -1.0546875, -0.234375, 0.5859375, 1.40625, 2.2265625, 3.046875, 3.8671875, 4.6875, 5.5078125, 6.328125, 7.1484375, 7.96875, 8.7890625, 9.609375, 10.4296875, 11.25, 12.0703125, 12.890625, 13.7109375, 14.53125, 15.3515625, 16.171875, 16.9921875, 17.8125, 18.6328125, 19.453125, 20.2734375, 21.09375, 21.9140625, 22.734375, 23.5546875, 24.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 9.0, 17.0, 20.0, 29.0, 44.0, 72.0, 114.0, 156.0, 191.0, 121.0, 65.0, 52.0, 22.0, 13.0, 15.0, 9.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0023288726806640625, -0.002264544367790222, -0.002200216054916382, -0.0021358877420425415, -0.002071559429168701, -0.002007231116294861, -0.0019429028034210205, -0.0018785744905471802, -0.0018142461776733398, -0.0017499178647994995, -0.0016855895519256592, -0.0016212612390518188, -0.0015569329261779785, -0.0014926046133041382, -0.0014282763004302979, -0.0013639479875564575, -0.0012996196746826172, -0.0012352913618087769, -0.0011709630489349365, -0.0011066347360610962, -0.0010423064231872559, -0.0009779781103134155, -0.0009136497974395752, -0.0008493214845657349, -0.0007849931716918945, -0.0007206648588180542, -0.0006563365459442139, -0.0005920082330703735, -0.0005276799201965332, -0.00046335160732269287, -0.00039902329444885254, -0.0003346949815750122, -0.0002703666687011719, -0.00020603835582733154, -0.0001417100429534912, -7.738173007965088e-05, -1.3053417205810547e-05, 5.1274895668029785e-05, 0.00011560320854187012, 0.00017993152141571045, 0.0002442598342895508, 0.0003085881471633911, 0.00037291646003723145, 0.0004372447729110718, 0.0005015730857849121, 0.0005659013986587524, 0.0006302297115325928, 0.0006945580244064331, 0.0007588863372802734, 0.0008232146501541138, 0.0008875429630279541, 0.0009518712759017944, 0.0010161995887756348, 0.001080527901649475, 0.0011448562145233154, 0.0012091845273971558, 0.001273512840270996, 0.0013378411531448364, 0.0014021694660186768, 0.001466497778892517, 0.0015308260917663574, 0.0015951544046401978, 0.001659482717514038, 0.0017238110303878784, 0.0017881393432617188]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 16.0, 29.0, 35.0, 40.0, 63.0, 82.0, 197.0, 629.0, 3830.0, 97136.0, 929900.0, 14573.0, 1335.0, 318.0, 112.0, 62.0, 52.0, 35.0, 30.0, 13.0, 15.0, 5.0, 11.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.2734375, -33.015625, -31.7578125, -30.5, -29.2421875, -27.984375, -26.7265625, -25.46875, -24.2109375, -22.953125, -21.6953125, -20.4375, -19.1796875, -17.921875, -16.6640625, -15.40625, -14.1484375, -12.890625, -11.6328125, -10.375, -9.1171875, -7.859375, -6.6015625, -5.34375, -4.0859375, -2.828125, -1.5703125, -0.3125, 0.9453125, 2.203125, 3.4609375, 4.71875, 5.9765625, 7.234375, 8.4921875, 9.75, 11.0078125, 12.265625, 13.5234375, 14.78125, 16.0390625, 17.296875, 18.5546875, 19.8125, 21.0703125, 22.328125, 23.5859375, 24.84375, 26.1015625, 27.359375, 28.6171875, 29.875, 31.1328125, 32.390625, 33.6484375, 34.90625, 36.1640625, 37.421875, 38.6796875, 39.9375, 41.1953125, 42.453125, 43.7109375, 44.96875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 4.0, 6.0, 17.0, 16.0, 26.0, 38.0, 65.0, 98.0, 154.0, 159.0, 151.0, 63.0, 67.0, 46.0, 28.0, 20.0, 9.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-25.359375, -24.835693359375, -24.31201171875, -23.788330078125, -23.2646484375, -22.740966796875, -22.21728515625, -21.693603515625, -21.169921875, -20.646240234375, -20.12255859375, -19.598876953125, -19.0751953125, -18.551513671875, -18.02783203125, -17.504150390625, -16.98046875, -16.456787109375, -15.93310546875, -15.409423828125, -14.8857421875, -14.362060546875, -13.83837890625, -13.314697265625, -12.791015625, -12.267333984375, -11.74365234375, -11.219970703125, -10.6962890625, -10.172607421875, -9.64892578125, -9.125244140625, -8.6015625, -8.077880859375, -7.55419921875, -7.030517578125, -6.5068359375, -5.983154296875, -5.45947265625, -4.935791015625, -4.412109375, -3.888427734375, -3.36474609375, -2.841064453125, -2.3173828125, -1.793701171875, -1.27001953125, -0.746337890625, -0.22265625, 0.301025390625, 0.82470703125, 1.348388671875, 1.8720703125, 2.395751953125, 2.91943359375, 3.443115234375, 3.966796875, 4.490478515625, 5.01416015625, 5.537841796875, 6.0615234375, 6.585205078125, 7.10888671875, 7.632568359375, 8.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 4.0, 19.0, 27.0, 39.0, 76.0, 123.0, 181.0, 175.0, 155.0, 94.0, 45.0, 26.0, 18.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-308.2944030761719, -300.6241455078125, -292.9538879394531, -285.2835998535156, -277.61334228515625, -269.9430847167969, -262.2728271484375, -254.60255432128906, -246.93228149414062, -239.26202392578125, -231.5917510986328, -223.92149353027344, -216.251220703125, -208.58096313476562, -200.9106903076172, -193.2404327392578, -185.57015991210938, -177.89990234375, -170.22962951660156, -162.5593719482422, -154.88909912109375, -147.21884155273438, -139.54856872558594, -131.87831115722656, -124.20805358886719, -116.53778839111328, -108.86752319335938, -101.19725799560547, -93.52699279785156, -85.85673522949219, -78.18646240234375, -70.51620483398438, -62.84593200683594, -55.17566680908203, -47.505401611328125, -39.83513641357422, -32.16487121582031, -24.494609832763672, -16.824344635009766, -9.15407943725586, -1.4838142395019531, 6.186450481414795, 13.856715202331543, 21.526979446411133, 29.19724464416504, 36.86750793457031, 44.53777313232422, 52.208038330078125, 59.87830352783203, 67.54856872558594, 75.21883392333984, 82.88909912109375, 90.55936431884766, 98.22962951660156, 105.89988708496094, 113.57015991210938, 121.24041748046875, 128.91067504882812, 136.58094787597656, 144.25120544433594, 151.92147827148438, 159.59173583984375, 167.2620086669922, 174.93226623535156, 182.6025390625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 9.0, 11.0, 11.0, 11.0, 13.0, 22.0, 28.0, 30.0, 23.0, 29.0, 41.0, 36.0, 46.0, 47.0, 56.0, 56.0, 64.0, 48.0, 46.0, 37.0, 49.0, 31.0, 34.0, 31.0, 31.0, 27.0, 22.0, 13.0, 16.0, 8.0, 6.0, 8.0, 9.0, 9.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-109.64665222167969, -106.50016021728516, -103.35367584228516, -100.20718383789062, -97.06069946289062, -93.9142074584961, -90.7677230834961, -87.62123107910156, -84.47474670410156, -81.32825469970703, -78.18177032470703, -75.0352783203125, -71.8887939453125, -68.74230194091797, -65.59581756591797, -62.44932556152344, -59.30283737182617, -56.156349182128906, -53.00986099243164, -49.863372802734375, -46.71688461303711, -43.570396423339844, -40.42390441894531, -37.27742004394531, -34.13092803955078, -30.984439849853516, -27.83795166015625, -24.691463470458984, -21.54497528076172, -18.398487091064453, -15.251996994018555, -12.105508804321289, -8.959022521972656, -5.812534332275391, -2.666045665740967, 0.48044300079345703, 3.6269311904907227, 6.773419380187988, 9.91990852355957, 13.066396713256836, 16.2128849029541, 19.359373092651367, 22.505861282348633, 25.65235137939453, 28.798839569091797, 31.945327758789062, 35.09181594848633, 38.238304138183594, 41.38479232788086, 44.531280517578125, 47.67776870727539, 50.824256896972656, 53.97074508666992, 57.11723327636719, 60.26372528076172, 63.41020965576172, 66.55670166015625, 69.70319366455078, 72.84967803955078, 75.99617004394531, 79.14265441894531, 82.28914642333984, 85.43563079833984, 88.58212280273438, 91.72860717773438]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 5.0, 11.0, 9.0, 12.0, 19.0, 27.0, 28.0, 56.0, 75.0, 108.0, 237.0, 415.0, 1121.0, 7294.0, 4178126.0, 4788.0, 1020.0, 378.0, 209.0, 118.0, 76.0, 38.0, 28.0, 23.0, 17.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-93.625, -91.46875, -89.3125, -87.15625, -85.0, -82.84375, -80.6875, -78.53125, -76.375, -74.21875, -72.0625, -69.90625, -67.75, -65.59375, -63.4375, -61.28125, -59.125, -56.96875, -54.8125, -52.65625, -50.5, -48.34375, -46.1875, -44.03125, -41.875, -39.71875, -37.5625, -35.40625, -33.25, -31.09375, -28.9375, -26.78125, -24.625, -22.46875, -20.3125, -18.15625, -16.0, -13.84375, -11.6875, -9.53125, -7.375, -5.21875, -3.0625, -0.90625, 1.25, 3.40625, 5.5625, 7.71875, 9.875, 12.03125, 14.1875, 16.34375, 18.5, 20.65625, 22.8125, 24.96875, 27.125, 29.28125, 31.4375, 33.59375, 35.75, 37.90625, 40.0625, 42.21875, 44.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 9.0, 10.0, 21.0, 33.0, 41.0, 52.0, 55.0, 68.0, 87.0, 92.0, 77.0, 87.0, 83.0, 62.0, 60.0, 38.0, 22.0, 19.0, 17.0, 10.0, 10.0, 4.0, 2.0, 11.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6953125, -7.4923095703125, -7.289306640625, -7.0863037109375, -6.88330078125, -6.6802978515625, -6.477294921875, -6.2742919921875, -6.0712890625, -5.8682861328125, -5.665283203125, -5.4622802734375, -5.25927734375, -5.0562744140625, -4.853271484375, -4.6502685546875, -4.447265625, -4.2442626953125, -4.041259765625, -3.8382568359375, -3.63525390625, -3.4322509765625, -3.229248046875, -3.0262451171875, -2.8232421875, -2.6202392578125, -2.417236328125, -2.2142333984375, -2.01123046875, -1.8082275390625, -1.605224609375, -1.4022216796875, -1.19921875, -0.9962158203125, -0.793212890625, -0.5902099609375, -0.38720703125, -0.1842041015625, 0.018798828125, 0.2218017578125, 0.4248046875, 0.6278076171875, 0.830810546875, 1.0338134765625, 1.23681640625, 1.4398193359375, 1.642822265625, 1.8458251953125, 2.048828125, 2.2518310546875, 2.454833984375, 2.6578369140625, 2.86083984375, 3.0638427734375, 3.266845703125, 3.4698486328125, 3.6728515625, 3.8758544921875, 4.078857421875, 4.2818603515625, 4.48486328125, 4.6878662109375, 4.890869140625, 5.0938720703125, 5.296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 9.0, 8.0, 8.0, 24.0, 25.0, 32.0, 36.0, 52.0, 52.0, 103.0, 167.0, 220.0, 382.0, 733.0, 1641.0, 5734.0, 4160723.0, 19232.0, 2675.0, 1023.0, 520.0, 297.0, 160.0, 107.0, 82.0, 48.0, 35.0, 28.0, 20.0, 19.0, 12.0, 17.0, 8.0, 10.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.4375, -56.330078125, -54.22265625, -52.115234375, -50.0078125, -47.900390625, -45.79296875, -43.685546875, -41.578125, -39.470703125, -37.36328125, -35.255859375, -33.1484375, -31.041015625, -28.93359375, -26.826171875, -24.71875, -22.611328125, -20.50390625, -18.396484375, -16.2890625, -14.181640625, -12.07421875, -9.966796875, -7.859375, -5.751953125, -3.64453125, -1.537109375, 0.5703125, 2.677734375, 4.78515625, 6.892578125, 9.0, 11.107421875, 13.21484375, 15.322265625, 17.4296875, 19.537109375, 21.64453125, 23.751953125, 25.859375, 27.966796875, 30.07421875, 32.181640625, 34.2890625, 36.396484375, 38.50390625, 40.611328125, 42.71875, 44.826171875, 46.93359375, 49.041015625, 51.1484375, 53.255859375, 55.36328125, 57.470703125, 59.578125, 61.685546875, 63.79296875, 65.900390625, 68.0078125, 70.115234375, 72.22265625, 74.330078125, 76.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 14.0, 35.0, 3900.0, 97.0, 14.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -17.053955078125, -16.65478515625, -16.255615234375, -15.8564453125, -15.457275390625, -15.05810546875, -14.658935546875, -14.259765625, -13.860595703125, -13.46142578125, -13.062255859375, -12.6630859375, -12.263916015625, -11.86474609375, -11.465576171875, -11.06640625, -10.667236328125, -10.26806640625, -9.868896484375, -9.4697265625, -9.070556640625, -8.67138671875, -8.272216796875, -7.873046875, -7.473876953125, -7.07470703125, -6.675537109375, -6.2763671875, -5.877197265625, -5.47802734375, -5.078857421875, -4.6796875, -4.280517578125, -3.88134765625, -3.482177734375, -3.0830078125, -2.683837890625, -2.28466796875, -1.885498046875, -1.486328125, -1.087158203125, -0.68798828125, -0.288818359375, 0.1103515625, 0.509521484375, 0.90869140625, 1.307861328125, 1.70703125, 2.106201171875, 2.50537109375, 2.904541015625, 3.3037109375, 3.702880859375, 4.10205078125, 4.501220703125, 4.900390625, 5.299560546875, 5.69873046875, 6.097900390625, 6.4970703125, 6.896240234375, 7.29541015625, 7.694580078125, 8.09375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 9.0, 14.0, 17.0, 21.0, 24.0, 30.0, 48.0, 64.0, 65.0, 94.0, 104.0, 109.0, 88.0, 73.0, 56.0, 40.0, 33.0, 22.0, 13.0, 12.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.995750427246094, -16.414566040039062, -15.833379745483398, -15.252195358276367, -14.67101001739502, -14.089824676513672, -13.50864028930664, -12.927454948425293, -12.346269607543945, -11.765084266662598, -11.18389892578125, -10.602714538574219, -10.021529197692871, -9.440343856811523, -8.859159469604492, -8.277974128723145, -7.696788787841797, -7.115603446960449, -6.53441858291626, -5.95323371887207, -5.372048377990723, -4.790863037109375, -4.2096781730651855, -3.628493309020996, -3.0473079681396484, -2.46612286567688, -1.8849377632141113, -1.3037526607513428, -0.7225675582885742, -0.14138245582580566, 0.4398026466369629, 1.0209875106811523, 1.6021728515625, 2.1833579540252686, 2.764543056488037, 3.3457281589508057, 3.926913261413574, 4.508098602294922, 5.089283466339111, 5.670468330383301, 6.251653671264648, 6.832839012145996, 7.4140238761901855, 7.995208740234375, 8.576394081115723, 9.15757942199707, 9.738763809204102, 10.31994915008545, 10.901134490966797, 11.482319831848145, 12.063505172729492, 12.644689559936523, 13.225874900817871, 13.807060241699219, 14.38824462890625, 14.969429969787598, 15.550615310668945, 16.131799697875977, 16.71298599243164, 17.294170379638672, 17.875354766845703, 18.456541061401367, 19.0377254486084, 19.618911743164062, 20.200096130371094]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 16.0, 13.0, 10.0, 18.0, 19.0, 15.0, 39.0, 37.0, 39.0, 41.0, 37.0, 49.0, 66.0, 58.0, 49.0, 52.0, 54.0, 48.0, 47.0, 49.0, 47.0, 31.0, 32.0, 29.0, 23.0, 20.0, 11.0, 14.0, 9.0, 8.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.9779052734375, -19.417823791503906, -18.85774040222168, -18.297658920288086, -17.737577438354492, -17.177494049072266, -16.617412567138672, -16.057331085205078, -15.497248649597168, -14.937166213989258, -14.377084732055664, -13.817002296447754, -13.256919860839844, -12.69683837890625, -12.13675594329834, -11.57667350769043, -11.016592025756836, -10.456509590148926, -9.896428108215332, -9.336345672607422, -8.776264190673828, -8.216181755065918, -7.656099319458008, -7.096017360687256, -6.535935401916504, -5.975853443145752, -5.415771484375, -4.85568904876709, -4.295607089996338, -3.735525131225586, -3.175442934036255, -2.615360736846924, -2.0552806854248047, -1.4951986074447632, -0.9351165294647217, -0.3750344514846802, 0.18504762649536133, 0.7451295852661133, 1.3052117824554443, 1.8652939796447754, 2.4253759384155273, 2.9854578971862793, 3.5455400943756104, 4.105622291564941, 4.665704250335693, 5.225786209106445, 5.7858686447143555, 6.345950603485107, 6.906032562255859, 7.466114521026611, 8.026196479797363, 8.586278915405273, 9.146360397338867, 9.706442832946777, 10.266525268554688, 10.826606750488281, 11.386689186096191, 11.946771621704102, 12.506853103637695, 13.066935539245605, 13.627017974853516, 14.18709945678711, 14.74718189239502, 15.30726432800293, 15.867345809936523]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 17.0, 27.0, 24.0, 32.0, 63.0, 76.0, 135.0, 199.0, 298.0, 606.0, 1121.0, 2248.0, 4866.0, 13002.0, 41640.0, 179553.0, 575664.0, 167660.0, 39306.0, 12591.0, 4739.0, 2115.0, 1056.0, 564.0, 327.0, 211.0, 129.0, 81.0, 58.0, 45.0, 31.0, 14.0, 17.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -14.15283203125, -13.6884765625, -13.22412109375, -12.759765625, -12.29541015625, -11.8310546875, -11.36669921875, -10.90234375, -10.43798828125, -9.9736328125, -9.50927734375, -9.044921875, -8.58056640625, -8.1162109375, -7.65185546875, -7.1875, -6.72314453125, -6.2587890625, -5.79443359375, -5.330078125, -4.86572265625, -4.4013671875, -3.93701171875, -3.47265625, -3.00830078125, -2.5439453125, -2.07958984375, -1.615234375, -1.15087890625, -0.6865234375, -0.22216796875, 0.2421875, 0.70654296875, 1.1708984375, 1.63525390625, 2.099609375, 2.56396484375, 3.0283203125, 3.49267578125, 3.95703125, 4.42138671875, 4.8857421875, 5.35009765625, 5.814453125, 6.27880859375, 6.7431640625, 7.20751953125, 7.671875, 8.13623046875, 8.6005859375, 9.06494140625, 9.529296875, 9.99365234375, 10.4580078125, 10.92236328125, 11.38671875, 11.85107421875, 12.3154296875, 12.77978515625, 13.244140625, 13.70849609375, 14.1728515625, 14.63720703125, 15.1015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 4.0, 9.0, 16.0, 20.0, 33.0, 37.0, 48.0, 49.0, 61.0, 64.0, 52.0, 71.0, 78.0, 72.0, 53.0, 50.0, 56.0, 38.0, 34.0, 35.0, 26.0, 15.0, 12.0, 3.0, 8.0, 7.0, 5.0, 2.0, 9.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.3780517578125, -5.177978515625, -4.9779052734375, -4.77783203125, -4.5777587890625, -4.377685546875, -4.1776123046875, -3.9775390625, -3.7774658203125, -3.577392578125, -3.3773193359375, -3.17724609375, -2.9771728515625, -2.777099609375, -2.5770263671875, -2.376953125, -2.1768798828125, -1.976806640625, -1.7767333984375, -1.57666015625, -1.3765869140625, -1.176513671875, -0.9764404296875, -0.7763671875, -0.5762939453125, -0.376220703125, -0.1761474609375, 0.02392578125, 0.2239990234375, 0.424072265625, 0.6241455078125, 0.82421875, 1.0242919921875, 1.224365234375, 1.4244384765625, 1.62451171875, 1.8245849609375, 2.024658203125, 2.2247314453125, 2.4248046875, 2.6248779296875, 2.824951171875, 3.0250244140625, 3.22509765625, 3.4251708984375, 3.625244140625, 3.8253173828125, 4.025390625, 4.2254638671875, 4.425537109375, 4.6256103515625, 4.82568359375, 5.0257568359375, 5.225830078125, 5.4259033203125, 5.6259765625, 5.8260498046875, 6.026123046875, 6.2261962890625, 6.42626953125, 6.6263427734375, 6.826416015625, 7.0264892578125, 7.2265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 8.0, 8.0, 8.0, 12.0, 13.0, 13.0, 23.0, 47.0, 55.0, 94.0, 150.0, 206.0, 335.0, 619.0, 1195.0, 3170.0, 11152.0, 63258.0, 704314.0, 227953.0, 25942.0, 5892.0, 1984.0, 817.0, 464.0, 268.0, 175.0, 125.0, 85.0, 39.0, 44.0, 20.0, 14.0, 14.0, 7.0, 6.0, 10.0, 9.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.03125, -21.265380859375, -20.49951171875, -19.733642578125, -18.9677734375, -18.201904296875, -17.43603515625, -16.670166015625, -15.904296875, -15.138427734375, -14.37255859375, -13.606689453125, -12.8408203125, -12.074951171875, -11.30908203125, -10.543212890625, -9.77734375, -9.011474609375, -8.24560546875, -7.479736328125, -6.7138671875, -5.947998046875, -5.18212890625, -4.416259765625, -3.650390625, -2.884521484375, -2.11865234375, -1.352783203125, -0.5869140625, 0.178955078125, 0.94482421875, 1.710693359375, 2.4765625, 3.242431640625, 4.00830078125, 4.774169921875, 5.5400390625, 6.305908203125, 7.07177734375, 7.837646484375, 8.603515625, 9.369384765625, 10.13525390625, 10.901123046875, 11.6669921875, 12.432861328125, 13.19873046875, 13.964599609375, 14.73046875, 15.496337890625, 16.26220703125, 17.028076171875, 17.7939453125, 18.559814453125, 19.32568359375, 20.091552734375, 20.857421875, 21.623291015625, 22.38916015625, 23.155029296875, 23.9208984375, 24.686767578125, 25.45263671875, 26.218505859375, 26.984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 4.0, 10.0, 16.0, 15.0, 21.0, 27.0, 34.0, 35.0, 49.0, 53.0, 70.0, 75.0, 66.0, 61.0, 80.0, 66.0, 56.0, 45.0, 43.0, 32.0, 40.0, 31.0, 28.0, 13.0, 11.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.390625, -23.256591796875, -22.12255859375, -20.988525390625, -19.8544921875, -18.720458984375, -17.58642578125, -16.452392578125, -15.318359375, -14.184326171875, -13.05029296875, -11.916259765625, -10.7822265625, -9.648193359375, -8.51416015625, -7.380126953125, -6.24609375, -5.112060546875, -3.97802734375, -2.843994140625, -1.7099609375, -0.575927734375, 0.55810546875, 1.692138671875, 2.826171875, 3.960205078125, 5.09423828125, 6.228271484375, 7.3623046875, 8.496337890625, 9.63037109375, 10.764404296875, 11.8984375, 13.032470703125, 14.16650390625, 15.300537109375, 16.4345703125, 17.568603515625, 18.70263671875, 19.836669921875, 20.970703125, 22.104736328125, 23.23876953125, 24.372802734375, 25.5068359375, 26.640869140625, 27.77490234375, 28.908935546875, 30.04296875, 31.177001953125, 32.31103515625, 33.445068359375, 34.5791015625, 35.713134765625, 36.84716796875, 37.981201171875, 39.115234375, 40.249267578125, 41.38330078125, 42.517333984375, 43.6513671875, 44.785400390625, 45.91943359375, 47.053466796875, 48.1875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 9.0, 14.0, 22.0, 35.0, 78.0, 149.0, 353.0, 996.0, 3632.0, 35996.0, 978331.0, 24359.0, 3083.0, 856.0, 302.0, 160.0, 69.0, 35.0, 26.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.1875, -23.30615234375, -22.4248046875, -21.54345703125, -20.662109375, -19.78076171875, -18.8994140625, -18.01806640625, -17.13671875, -16.25537109375, -15.3740234375, -14.49267578125, -13.611328125, -12.72998046875, -11.8486328125, -10.96728515625, -10.0859375, -9.20458984375, -8.3232421875, -7.44189453125, -6.560546875, -5.67919921875, -4.7978515625, -3.91650390625, -3.03515625, -2.15380859375, -1.2724609375, -0.39111328125, 0.490234375, 1.37158203125, 2.2529296875, 3.13427734375, 4.015625, 4.89697265625, 5.7783203125, 6.65966796875, 7.541015625, 8.42236328125, 9.3037109375, 10.18505859375, 11.06640625, 11.94775390625, 12.8291015625, 13.71044921875, 14.591796875, 15.47314453125, 16.3544921875, 17.23583984375, 18.1171875, 18.99853515625, 19.8798828125, 20.76123046875, 21.642578125, 22.52392578125, 23.4052734375, 24.28662109375, 25.16796875, 26.04931640625, 26.9306640625, 27.81201171875, 28.693359375, 29.57470703125, 30.4560546875, 31.33740234375, 32.21875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 14.0, 19.0, 32.0, 32.0, 49.0, 72.0, 128.0, 164.0, 158.0, 101.0, 71.0, 42.0, 18.0, 28.0, 10.0, 8.0, 12.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018277913331985474, -0.001772075891494751, -0.0017163604497909546, -0.0016606450080871582, -0.0016049295663833618, -0.0015492141246795654, -0.001493498682975769, -0.0014377832412719727, -0.0013820677995681763, -0.0013263523578643799, -0.0012706369161605835, -0.0012149214744567871, -0.0011592060327529907, -0.0011034905910491943, -0.001047775149345398, -0.0009920597076416016, -0.0009363442659378052, -0.0008806288242340088, -0.0008249133825302124, -0.000769197940826416, -0.0007134824991226196, -0.0006577670574188232, -0.0006020516157150269, -0.0005463361740112305, -0.0004906207323074341, -0.0004349052906036377, -0.0003791898488998413, -0.0003234744071960449, -0.00026775896549224854, -0.00021204352378845215, -0.00015632808208465576, -0.00010061264038085938, -4.489719867706299e-05, 1.0818243026733398e-05, 6.653368473052979e-05, 0.00012224912643432617, 0.00017796456813812256, 0.00023368000984191895, 0.00028939545154571533, 0.0003451108932495117, 0.0004008263349533081, 0.0004565417766571045, 0.0005122572183609009, 0.0005679726600646973, 0.0006236881017684937, 0.00067940354347229, 0.0007351189851760864, 0.0007908344268798828, 0.0008465498685836792, 0.0009022653102874756, 0.000957980751991272, 0.0010136961936950684, 0.0010694116353988647, 0.0011251270771026611, 0.0011808425188064575, 0.001236557960510254, 0.0012922734022140503, 0.0013479888439178467, 0.001403704285621643, 0.0014594197273254395, 0.0015151351690292358, 0.0015708506107330322, 0.0016265660524368286, 0.001682281494140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 1.0, 7.0, 11.0, 14.0, 9.0, 22.0, 41.0, 74.0, 112.0, 230.0, 476.0, 1127.0, 3137.0, 17472.0, 935932.0, 81137.0, 5649.0, 1688.0, 691.0, 290.0, 167.0, 83.0, 63.0, 38.0, 16.0, 20.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.21875, -34.30908203125, -33.3994140625, -32.48974609375, -31.580078125, -30.67041015625, -29.7607421875, -28.85107421875, -27.94140625, -27.03173828125, -26.1220703125, -25.21240234375, -24.302734375, -23.39306640625, -22.4833984375, -21.57373046875, -20.6640625, -19.75439453125, -18.8447265625, -17.93505859375, -17.025390625, -16.11572265625, -15.2060546875, -14.29638671875, -13.38671875, -12.47705078125, -11.5673828125, -10.65771484375, -9.748046875, -8.83837890625, -7.9287109375, -7.01904296875, -6.109375, -5.19970703125, -4.2900390625, -3.38037109375, -2.470703125, -1.56103515625, -0.6513671875, 0.25830078125, 1.16796875, 2.07763671875, 2.9873046875, 3.89697265625, 4.806640625, 5.71630859375, 6.6259765625, 7.53564453125, 8.4453125, 9.35498046875, 10.2646484375, 11.17431640625, 12.083984375, 12.99365234375, 13.9033203125, 14.81298828125, 15.72265625, 16.63232421875, 17.5419921875, 18.45166015625, 19.361328125, 20.27099609375, 21.1806640625, 22.09033203125, 23.0]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 17.0, 49.0, 127.0, 222.0, 310.0, 133.0, 57.0, 34.0, 14.0, 7.0, 3.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.71875, -35.886962890625, -35.05517578125, -34.223388671875, -33.3916015625, -32.559814453125, -31.72802734375, -30.896240234375, -30.064453125, -29.232666015625, -28.40087890625, -27.569091796875, -26.7373046875, -25.905517578125, -25.07373046875, -24.241943359375, -23.41015625, -22.578369140625, -21.74658203125, -20.914794921875, -20.0830078125, -19.251220703125, -18.41943359375, -17.587646484375, -16.755859375, -15.924072265625, -15.09228515625, -14.260498046875, -13.4287109375, -12.596923828125, -11.76513671875, -10.933349609375, -10.1015625, -9.269775390625, -8.43798828125, -7.606201171875, -6.7744140625, -5.942626953125, -5.11083984375, -4.279052734375, -3.447265625, -2.615478515625, -1.78369140625, -0.951904296875, -0.1201171875, 0.711669921875, 1.54345703125, 2.375244140625, 3.20703125, 4.038818359375, 4.87060546875, 5.702392578125, 6.5341796875, 7.365966796875, 8.19775390625, 9.029541015625, 9.861328125, 10.693115234375, 11.52490234375, 12.356689453125, 13.1884765625, 14.020263671875, 14.85205078125, 15.683837890625, 16.515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 15.0, 25.0, 38.0, 54.0, 86.0, 144.0, 203.0, 147.0, 104.0, 75.0, 40.0, 23.0, 15.0, 12.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5213623046875, -258.6152648925781, -251.70919799804688, -244.80311584472656, -237.89703369140625, -230.99093627929688, -224.08486938476562, -217.17877197265625, -210.27268981933594, -203.36660766601562, -196.4605255126953, -189.554443359375, -182.6483612060547, -175.74227905273438, -168.836181640625, -161.9300994873047, -155.02401733398438, -148.11793518066406, -141.21185302734375, -134.30577087402344, -127.3996810913086, -120.49359893798828, -113.58751678466797, -106.68142700195312, -99.77536010742188, -92.86927795410156, -85.96319580078125, -79.05711364746094, -72.1510238647461, -65.24494171142578, -58.33885955810547, -51.43277359008789, -44.52668762207031, -37.62060546875, -30.714519500732422, -23.80843734741211, -16.902353286743164, -9.996269226074219, -3.0901870727539062, 3.815898895263672, 10.721981048583984, 17.62806510925293, 24.534149169921875, 31.440231323242188, 38.3463134765625, 45.25239944458008, 52.15848159790039, 59.06456756591797, 65.97064971923828, 72.8767318725586, 79.7828140258789, 86.68890380859375, 93.59498596191406, 100.50106811523438, 107.40715026855469, 114.313232421875, 121.21931457519531, 128.12539672851562, 135.03147888183594, 141.93756103515625, 148.84364318847656, 155.74972534179688, 162.65582275390625, 169.56190490722656, 176.46798706054688]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 8.0, 10.0, 14.0, 14.0, 7.0, 14.0, 8.0, 18.0, 29.0, 27.0, 40.0, 45.0, 31.0, 54.0, 42.0, 64.0, 70.0, 66.0, 50.0, 59.0, 42.0, 42.0, 35.0, 30.0, 37.0, 31.0, 18.0, 21.0, 18.0, 14.0, 9.0, 7.0, 7.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-143.69024658203125, -139.3070526123047, -134.92384338378906, -130.5406494140625, -126.1574478149414, -121.77424621582031, -117.39105224609375, -113.00785064697266, -108.62464904785156, -104.24144744873047, -99.85824584960938, -95.47505187988281, -91.09185028076172, -86.70864868164062, -82.32545471191406, -77.94225311279297, -73.55905151367188, -69.17584991455078, -64.79264831542969, -60.409454345703125, -56.02625274658203, -51.64305114746094, -47.25985336303711, -42.87665557861328, -38.49345397949219, -34.110252380371094, -29.727054595947266, -25.343854904174805, -20.960655212402344, -16.577455520629883, -12.194255828857422, -7.811056137084961, -3.4278411865234375, 0.9553585052490234, 5.338558197021484, 9.721757888793945, 14.104957580566406, 18.488157272338867, 22.871356964111328, 27.25455665588379, 31.63775634765625, 36.020957946777344, 40.40415573120117, 44.787353515625, 49.170555114746094, 53.55375671386719, 57.936954498291016, 62.320152282714844, 66.70335388183594, 71.08655548095703, 75.46975708007812, 79.85295104980469, 84.23615264892578, 88.61935424804688, 93.00254821777344, 97.38574981689453, 101.76895141601562, 106.15215301513672, 110.53535461425781, 114.91854858398438, 119.30175018310547, 123.68495178222656, 128.06814575195312, 132.45135498046875, 136.8345489501953]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 10.0, 9.0, 14.0, 22.0, 31.0, 43.0, 61.0, 79.0, 121.0, 170.0, 353.0, 618.0, 1320.0, 4245.0, 90417.0, 4087750.0, 5651.0, 1608.0, 732.0, 352.0, 237.0, 141.0, 90.0, 55.0, 41.0, 24.0, 19.0, 11.0, 15.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-52.65625, -51.19677734375, -49.7373046875, -48.27783203125, -46.818359375, -45.35888671875, -43.8994140625, -42.43994140625, -40.98046875, -39.52099609375, -38.0615234375, -36.60205078125, -35.142578125, -33.68310546875, -32.2236328125, -30.76416015625, -29.3046875, -27.84521484375, -26.3857421875, -24.92626953125, -23.466796875, -22.00732421875, -20.5478515625, -19.08837890625, -17.62890625, -16.16943359375, -14.7099609375, -13.25048828125, -11.791015625, -10.33154296875, -8.8720703125, -7.41259765625, -5.953125, -4.49365234375, -3.0341796875, -1.57470703125, -0.115234375, 1.34423828125, 2.8037109375, 4.26318359375, 5.72265625, 7.18212890625, 8.6416015625, 10.10107421875, 11.560546875, 13.02001953125, 14.4794921875, 15.93896484375, 17.3984375, 18.85791015625, 20.3173828125, 21.77685546875, 23.236328125, 24.69580078125, 26.1552734375, 27.61474609375, 29.07421875, 30.53369140625, 31.9931640625, 33.45263671875, 34.912109375, 36.37158203125, 37.8310546875, 39.29052734375, 40.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 6.0, 18.0, 17.0, 24.0, 32.0, 63.0, 84.0, 89.0, 109.0, 105.0, 102.0, 75.0, 64.0, 49.0, 50.0, 29.0, 28.0, 10.0, 13.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.950927734375, -8.68310546875, -8.415283203125, -8.1474609375, -7.879638671875, -7.61181640625, -7.343994140625, -7.076171875, -6.808349609375, -6.54052734375, -6.272705078125, -6.0048828125, -5.737060546875, -5.46923828125, -5.201416015625, -4.93359375, -4.665771484375, -4.39794921875, -4.130126953125, -3.8623046875, -3.594482421875, -3.32666015625, -3.058837890625, -2.791015625, -2.523193359375, -2.25537109375, -1.987548828125, -1.7197265625, -1.451904296875, -1.18408203125, -0.916259765625, -0.6484375, -0.380615234375, -0.11279296875, 0.155029296875, 0.4228515625, 0.690673828125, 0.95849609375, 1.226318359375, 1.494140625, 1.761962890625, 2.02978515625, 2.297607421875, 2.5654296875, 2.833251953125, 3.10107421875, 3.368896484375, 3.63671875, 3.904541015625, 4.17236328125, 4.440185546875, 4.7080078125, 4.975830078125, 5.24365234375, 5.511474609375, 5.779296875, 6.047119140625, 6.31494140625, 6.582763671875, 6.8505859375, 7.118408203125, 7.38623046875, 7.654052734375, 7.921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 10.0, 22.0, 27.0, 34.0, 44.0, 60.0, 71.0, 105.0, 153.0, 235.0, 345.0, 516.0, 841.0, 1326.0, 2641.0, 5967.0, 23169.0, 4097367.0, 45575.0, 8015.0, 3295.0, 1616.0, 916.0, 605.0, 379.0, 263.0, 189.0, 130.0, 83.0, 78.0, 44.0, 37.0, 16.0, 20.0, 12.0, 17.0, 5.0, 9.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.733642578125, -27.76416015625, -26.794677734375, -25.8251953125, -24.855712890625, -23.88623046875, -22.916748046875, -21.947265625, -20.977783203125, -20.00830078125, -19.038818359375, -18.0693359375, -17.099853515625, -16.13037109375, -15.160888671875, -14.19140625, -13.221923828125, -12.25244140625, -11.282958984375, -10.3134765625, -9.343994140625, -8.37451171875, -7.405029296875, -6.435546875, -5.466064453125, -4.49658203125, -3.527099609375, -2.5576171875, -1.588134765625, -0.61865234375, 0.350830078125, 1.3203125, 2.289794921875, 3.25927734375, 4.228759765625, 5.1982421875, 6.167724609375, 7.13720703125, 8.106689453125, 9.076171875, 10.045654296875, 11.01513671875, 11.984619140625, 12.9541015625, 13.923583984375, 14.89306640625, 15.862548828125, 16.83203125, 17.801513671875, 18.77099609375, 19.740478515625, 20.7099609375, 21.679443359375, 22.64892578125, 23.618408203125, 24.587890625, 25.557373046875, 26.52685546875, 27.496337890625, 28.4658203125, 29.435302734375, 30.40478515625, 31.374267578125, 32.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 15.0, 18.0, 91.0, 3646.0, 191.0, 43.0, 19.0, 11.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75, -15.2679443359375, -14.785888671875, -14.3038330078125, -13.82177734375, -13.3397216796875, -12.857666015625, -12.3756103515625, -11.8935546875, -11.4114990234375, -10.929443359375, -10.4473876953125, -9.96533203125, -9.4832763671875, -9.001220703125, -8.5191650390625, -8.037109375, -7.5550537109375, -7.072998046875, -6.5909423828125, -6.10888671875, -5.6268310546875, -5.144775390625, -4.6627197265625, -4.1806640625, -3.6986083984375, -3.216552734375, -2.7344970703125, -2.25244140625, -1.7703857421875, -1.288330078125, -0.8062744140625, -0.32421875, 0.1578369140625, 0.639892578125, 1.1219482421875, 1.60400390625, 2.0860595703125, 2.568115234375, 3.0501708984375, 3.5322265625, 4.0142822265625, 4.496337890625, 4.9783935546875, 5.46044921875, 5.9425048828125, 6.424560546875, 6.9066162109375, 7.388671875, 7.8707275390625, 8.352783203125, 8.8348388671875, 9.31689453125, 9.7989501953125, 10.281005859375, 10.7630615234375, 11.2451171875, 11.7271728515625, 12.209228515625, 12.6912841796875, 13.17333984375, 13.6553955078125, 14.137451171875, 14.6195068359375, 15.1015625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 28.0, 62.0, 126.0, 214.0, 201.0, 149.0, 82.0, 43.0, 26.0, 13.0, 12.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.55660629272461, -35.55962371826172, -33.56264114379883, -31.56566047668457, -29.56867790222168, -27.57169532775879, -25.57471466064453, -23.57773208618164, -21.58074951171875, -19.58376693725586, -17.58678436279297, -15.589803695678711, -13.59282112121582, -11.59583854675293, -9.598856925964355, -7.601875305175781, -5.604892730712891, -3.607910633087158, -1.6109285354614258, 0.38605356216430664, 2.383035659790039, 4.38001823425293, 6.376999855041504, 8.373981475830078, 10.370964050292969, 12.36794662475586, 14.364928245544434, 16.361909866333008, 18.3588924407959, 20.35587501525879, 22.352855682373047, 24.349838256835938, 26.346817016601562, 28.343799591064453, 30.340782165527344, 32.337764739990234, 34.334747314453125, 36.33172607421875, 38.32870864868164, 40.32569122314453, 42.32267379760742, 44.31965637207031, 46.3166389465332, 48.313621520996094, 50.31060028076172, 52.307586669921875, 54.3045654296875, 56.30154800415039, 58.29853057861328, 60.29551315307617, 62.29249572753906, 64.28947448730469, 66.28646087646484, 68.28343963623047, 70.28042602539062, 72.27740478515625, 74.27438354492188, 76.2713623046875, 78.26834869384766, 80.26532745361328, 82.26231384277344, 84.25929260253906, 86.25627899169922, 88.25325775146484, 90.250244140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 6.0, 7.0, 4.0, 2.0, 6.0, 7.0, 14.0, 19.0, 15.0, 18.0, 19.0, 22.0, 21.0, 31.0, 23.0, 33.0, 35.0, 48.0, 37.0, 50.0, 32.0, 50.0, 36.0, 37.0, 38.0, 29.0, 40.0, 37.0, 30.0, 40.0, 31.0, 23.0, 29.0, 24.0, 20.0, 16.0, 14.0, 11.0, 12.0, 9.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.404634475708008, -23.700088500976562, -22.995542526245117, -22.290996551513672, -21.58645248413086, -20.881906509399414, -20.17736053466797, -19.472814559936523, -18.768268585205078, -18.063722610473633, -17.359176635742188, -16.654630661010742, -15.950085639953613, -15.245539665222168, -14.540994644165039, -13.836448669433594, -13.131902694702148, -12.427356719970703, -11.722810745239258, -11.018265724182129, -10.313719749450684, -9.609173774719238, -8.90462875366211, -8.200082778930664, -7.495536804199219, -6.790990829467773, -6.086445331573486, -5.381899833679199, -4.677353858947754, -3.9728081226348877, -3.2682623863220215, -2.5637168884277344, -1.8591728210449219, -1.1546270847320557, -0.45008134841918945, 0.25446438789367676, 0.959010124206543, 1.6635558605194092, 2.3681015968322754, 3.0726470947265625, 3.777193069458008, 4.481739044189453, 5.18628454208374, 5.890830039978027, 6.595376014709473, 7.299921989440918, 8.004467010498047, 8.709012985229492, 9.413558959960938, 10.118104934692383, 10.822650909423828, 11.527195930480957, 12.231741905212402, 12.936287879943848, 13.640832901000977, 14.345378875732422, 15.049924850463867, 15.754470825195312, 16.459016799926758, 17.163562774658203, 17.868106842041016, 18.57265281677246, 19.277198791503906, 19.98174476623535, 20.686290740966797]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 17.0, 23.0, 36.0, 77.0, 149.0, 262.0, 535.0, 1116.0, 2816.0, 8535.0, 34441.0, 240255.0, 647535.0, 87678.0, 16869.0, 4805.0, 1803.0, 756.0, 374.0, 194.0, 96.0, 76.0, 35.0, 25.0, 10.0, 8.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.515625, -23.648193359375, -22.78076171875, -21.913330078125, -21.0458984375, -20.178466796875, -19.31103515625, -18.443603515625, -17.576171875, -16.708740234375, -15.84130859375, -14.973876953125, -14.1064453125, -13.239013671875, -12.37158203125, -11.504150390625, -10.63671875, -9.769287109375, -8.90185546875, -8.034423828125, -7.1669921875, -6.299560546875, -5.43212890625, -4.564697265625, -3.697265625, -2.829833984375, -1.96240234375, -1.094970703125, -0.2275390625, 0.639892578125, 1.50732421875, 2.374755859375, 3.2421875, 4.109619140625, 4.97705078125, 5.844482421875, 6.7119140625, 7.579345703125, 8.44677734375, 9.314208984375, 10.181640625, 11.049072265625, 11.91650390625, 12.783935546875, 13.6513671875, 14.518798828125, 15.38623046875, 16.253662109375, 17.12109375, 17.988525390625, 18.85595703125, 19.723388671875, 20.5908203125, 21.458251953125, 22.32568359375, 23.193115234375, 24.060546875, 24.927978515625, 25.79541015625, 26.662841796875, 27.5302734375, 28.397705078125, 29.26513671875, 30.132568359375, 31.0]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 14.0, 10.0, 8.0, 16.0, 27.0, 28.0, 48.0, 62.0, 52.0, 72.0, 75.0, 106.0, 86.0, 79.0, 71.0, 45.0, 48.0, 37.0, 28.0, 24.0, 13.0, 9.0, 7.0, 10.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.2578125, -8.00439453125, -7.7509765625, -7.49755859375, -7.244140625, -6.99072265625, -6.7373046875, -6.48388671875, -6.23046875, -5.97705078125, -5.7236328125, -5.47021484375, -5.216796875, -4.96337890625, -4.7099609375, -4.45654296875, -4.203125, -3.94970703125, -3.6962890625, -3.44287109375, -3.189453125, -2.93603515625, -2.6826171875, -2.42919921875, -2.17578125, -1.92236328125, -1.6689453125, -1.41552734375, -1.162109375, -0.90869140625, -0.6552734375, -0.40185546875, -0.1484375, 0.10498046875, 0.3583984375, 0.61181640625, 0.865234375, 1.11865234375, 1.3720703125, 1.62548828125, 1.87890625, 2.13232421875, 2.3857421875, 2.63916015625, 2.892578125, 3.14599609375, 3.3994140625, 3.65283203125, 3.90625, 4.15966796875, 4.4130859375, 4.66650390625, 4.919921875, 5.17333984375, 5.4267578125, 5.68017578125, 5.93359375, 6.18701171875, 6.4404296875, 6.69384765625, 6.947265625, 7.20068359375, 7.4541015625, 7.70751953125, 7.9609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 12.0, 13.0, 32.0, 39.0, 46.0, 78.0, 134.0, 220.0, 456.0, 894.0, 2364.0, 8110.0, 47372.0, 635730.0, 315899.0, 27946.0, 5710.0, 1829.0, 702.0, 374.0, 212.0, 127.0, 76.0, 44.0, 29.0, 25.0, 15.0, 12.0, 12.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.171875, -21.202392578125, -20.23291015625, -19.263427734375, -18.2939453125, -17.324462890625, -16.35498046875, -15.385498046875, -14.416015625, -13.446533203125, -12.47705078125, -11.507568359375, -10.5380859375, -9.568603515625, -8.59912109375, -7.629638671875, -6.66015625, -5.690673828125, -4.72119140625, -3.751708984375, -2.7822265625, -1.812744140625, -0.84326171875, 0.126220703125, 1.095703125, 2.065185546875, 3.03466796875, 4.004150390625, 4.9736328125, 5.943115234375, 6.91259765625, 7.882080078125, 8.8515625, 9.821044921875, 10.79052734375, 11.760009765625, 12.7294921875, 13.698974609375, 14.66845703125, 15.637939453125, 16.607421875, 17.576904296875, 18.54638671875, 19.515869140625, 20.4853515625, 21.454833984375, 22.42431640625, 23.393798828125, 24.36328125, 25.332763671875, 26.30224609375, 27.271728515625, 28.2412109375, 29.210693359375, 30.18017578125, 31.149658203125, 32.119140625, 33.088623046875, 34.05810546875, 35.027587890625, 35.9970703125, 36.966552734375, 37.93603515625, 38.905517578125, 39.875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 5.0, 6.0, 9.0, 13.0, 8.0, 9.0, 12.0, 21.0, 26.0, 28.0, 25.0, 28.0, 34.0, 38.0, 31.0, 38.0, 35.0, 38.0, 45.0, 44.0, 34.0, 40.0, 39.0, 48.0, 41.0, 38.0, 34.0, 32.0, 27.0, 24.0, 24.0, 16.0, 15.0, 13.0, 15.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.9267578125, -17.275390625, -16.6240234375, -15.97265625, -15.3212890625, -14.669921875, -14.0185546875, -13.3671875, -12.7158203125, -12.064453125, -11.4130859375, -10.76171875, -10.1103515625, -9.458984375, -8.8076171875, -8.15625, -7.5048828125, -6.853515625, -6.2021484375, -5.55078125, -4.8994140625, -4.248046875, -3.5966796875, -2.9453125, -2.2939453125, -1.642578125, -0.9912109375, -0.33984375, 0.3115234375, 0.962890625, 1.6142578125, 2.265625, 2.9169921875, 3.568359375, 4.2197265625, 4.87109375, 5.5224609375, 6.173828125, 6.8251953125, 7.4765625, 8.1279296875, 8.779296875, 9.4306640625, 10.08203125, 10.7333984375, 11.384765625, 12.0361328125, 12.6875, 13.3388671875, 13.990234375, 14.6416015625, 15.29296875, 15.9443359375, 16.595703125, 17.2470703125, 17.8984375, 18.5498046875, 19.201171875, 19.8525390625, 20.50390625, 21.1552734375, 21.806640625, 22.4580078125, 23.109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 5.0, 6.0, 16.0, 13.0, 13.0, 21.0, 29.0, 49.0, 65.0, 102.0, 214.0, 406.0, 987.0, 2993.0, 13089.0, 151561.0, 806377.0, 61336.0, 7768.0, 1992.0, 734.0, 354.0, 145.0, 99.0, 67.0, 28.0, 26.0, 10.0, 14.0, 7.0, 7.0, 1.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87109375, -7.57232666015625, -7.2735595703125, -6.97479248046875, -6.676025390625, -6.37725830078125, -6.0784912109375, -5.77972412109375, -5.48095703125, -5.18218994140625, -4.8834228515625, -4.58465576171875, -4.285888671875, -3.98712158203125, -3.6883544921875, -3.38958740234375, -3.0908203125, -2.79205322265625, -2.4932861328125, -2.19451904296875, -1.895751953125, -1.59698486328125, -1.2982177734375, -0.99945068359375, -0.70068359375, -0.40191650390625, -0.1031494140625, 0.19561767578125, 0.494384765625, 0.79315185546875, 1.0919189453125, 1.39068603515625, 1.689453125, 1.98822021484375, 2.2869873046875, 2.58575439453125, 2.884521484375, 3.18328857421875, 3.4820556640625, 3.78082275390625, 4.07958984375, 4.37835693359375, 4.6771240234375, 4.97589111328125, 5.274658203125, 5.57342529296875, 5.8721923828125, 6.17095947265625, 6.4697265625, 6.76849365234375, 7.0672607421875, 7.36602783203125, 7.664794921875, 7.96356201171875, 8.2623291015625, 8.56109619140625, 8.85986328125, 9.15863037109375, 9.4573974609375, 9.75616455078125, 10.054931640625, 10.35369873046875, 10.6524658203125, 10.95123291015625, 11.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 10.0, 13.0, 10.0, 15.0, 24.0, 24.0, 49.0, 43.0, 45.0, 86.0, 75.0, 82.0, 88.0, 67.0, 64.0, 66.0, 47.0, 34.0, 22.0, 19.0, 14.0, 13.0, 13.0, 10.0, 9.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.0009570121765136719, -0.0009287819266319275, -0.0009005516767501831, -0.0008723214268684387, -0.0008440911769866943, -0.00081586092710495, -0.0007876306772232056, -0.0007594004273414612, -0.0007311701774597168, -0.0007029399275779724, -0.000674709677696228, -0.0006464794278144836, -0.0006182491779327393, -0.0005900189280509949, -0.0005617886781692505, -0.0005335584282875061, -0.0005053281784057617, -0.00047709792852401733, -0.00044886767864227295, -0.00042063742876052856, -0.0003924071788787842, -0.0003641769289970398, -0.0003359466791152954, -0.000307716429233551, -0.00027948617935180664, -0.00025125592947006226, -0.00022302567958831787, -0.00019479542970657349, -0.0001665651798248291, -0.00013833492994308472, -0.00011010468006134033, -8.187443017959595e-05, -5.364418029785156e-05, -2.5413930416107178e-05, 2.816319465637207e-06, 3.104656934738159e-05, 5.9276819229125977e-05, 8.750706911087036e-05, 0.00011573731899261475, 0.00014396756887435913, 0.00017219781875610352, 0.0002004280686378479, 0.00022865831851959229, 0.00025688856840133667, 0.00028511881828308105, 0.00031334906816482544, 0.0003415793180465698, 0.0003698095679283142, 0.0003980398178100586, 0.000426270067691803, 0.00045450031757354736, 0.00048273056745529175, 0.0005109608173370361, 0.0005391910672187805, 0.0005674213171005249, 0.0005956515669822693, 0.0006238818168640137, 0.0006521120667457581, 0.0006803423166275024, 0.0007085725665092468, 0.0007368028163909912, 0.0007650330662727356, 0.00079326331615448, 0.0008214935660362244, 0.0008497238159179688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 30.0, 47.0, 119.0, 201.0, 544.0, 2076.0, 17988.0, 875212.0, 145020.0, 5560.0, 1049.0, 327.0, 154.0, 90.0, 39.0, 27.0, 19.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -9.9466552734375, -9.416748046875, -8.8868408203125, -8.35693359375, -7.8270263671875, -7.297119140625, -6.7672119140625, -6.2373046875, -5.7073974609375, -5.177490234375, -4.6475830078125, -4.11767578125, -3.5877685546875, -3.057861328125, -2.5279541015625, -1.998046875, -1.4681396484375, -0.938232421875, -0.4083251953125, 0.12158203125, 0.6514892578125, 1.181396484375, 1.7113037109375, 2.2412109375, 2.7711181640625, 3.301025390625, 3.8309326171875, 4.36083984375, 4.8907470703125, 5.420654296875, 5.9505615234375, 6.48046875, 7.0103759765625, 7.540283203125, 8.0701904296875, 8.60009765625, 9.1300048828125, 9.659912109375, 10.1898193359375, 10.7197265625, 11.2496337890625, 11.779541015625, 12.3094482421875, 12.83935546875, 13.3692626953125, 13.899169921875, 14.4290771484375, 14.958984375, 15.4888916015625, 16.018798828125, 16.5487060546875, 17.07861328125, 17.6085205078125, 18.138427734375, 18.6683349609375, 19.1982421875, 19.7281494140625, 20.258056640625, 20.7879638671875, 21.31787109375, 21.8477783203125, 22.377685546875, 22.9075927734375, 23.4375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 9.0, 18.0, 24.0, 34.0, 69.0, 79.0, 106.0, 132.0, 131.0, 125.0, 86.0, 56.0, 39.0, 29.0, 20.0, 18.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.7703857421875, -7.447021484375, -7.1236572265625, -6.80029296875, -6.4769287109375, -6.153564453125, -5.8302001953125, -5.5068359375, -5.1834716796875, -4.860107421875, -4.5367431640625, -4.21337890625, -3.8900146484375, -3.566650390625, -3.2432861328125, -2.919921875, -2.5965576171875, -2.273193359375, -1.9498291015625, -1.62646484375, -1.3031005859375, -0.979736328125, -0.6563720703125, -0.3330078125, -0.0096435546875, 0.313720703125, 0.6370849609375, 0.96044921875, 1.2838134765625, 1.607177734375, 1.9305419921875, 2.25390625, 2.5772705078125, 2.900634765625, 3.2239990234375, 3.54736328125, 3.8707275390625, 4.194091796875, 4.5174560546875, 4.8408203125, 5.1641845703125, 5.487548828125, 5.8109130859375, 6.13427734375, 6.4576416015625, 6.781005859375, 7.1043701171875, 7.427734375, 7.7510986328125, 8.074462890625, 8.3978271484375, 8.72119140625, 9.0445556640625, 9.367919921875, 9.6912841796875, 10.0146484375, 10.3380126953125, 10.661376953125, 10.9847412109375, 11.30810546875, 11.6314697265625, 11.954833984375, 12.2781982421875, 12.6015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 15.0, 53.0, 106.0, 207.0, 299.0, 202.0, 74.0, 21.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.8743896484375, -358.4471740722656, -348.01995849609375, -337.59271240234375, -327.1654968261719, -316.73828125, -306.31103515625, -295.8838195800781, -285.45660400390625, -275.0293884277344, -264.6021728515625, -254.1749267578125, -243.74771118164062, -233.32049560546875, -222.8932647705078, -212.46603393554688, -202.038818359375, -191.61160278320312, -181.1843719482422, -170.75714111328125, -160.32992553710938, -149.9027099609375, -139.47547912597656, -129.04824829101562, -118.62103271484375, -108.19380950927734, -97.76658630371094, -87.33936309814453, -76.91213989257812, -66.48491668701172, -56.05769348144531, -45.630470275878906, -35.203216552734375, -24.77599334716797, -14.348770141601562, -3.9215469360351562, 6.50567626953125, 16.932899475097656, 27.360122680664062, 37.78734588623047, 48.214569091796875, 58.64179229736328, 69.06901550292969, 79.4962387084961, 89.9234619140625, 100.3506851196289, 110.77790832519531, 121.20513153076172, 131.63235473632812, 142.0595703125, 152.48680114746094, 162.91403198242188, 173.34124755859375, 183.76846313476562, 194.19569396972656, 204.6229248046875, 215.05014038085938, 225.47735595703125, 235.9045867919922, 246.33181762695312, 256.759033203125, 267.1862487792969, 277.61346435546875, 288.04071044921875, 298.4679260253906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 6.0, 9.0, 8.0, 12.0, 8.0, 9.0, 15.0, 20.0, 22.0, 26.0, 29.0, 37.0, 34.0, 42.0, 40.0, 45.0, 47.0, 44.0, 51.0, 59.0, 45.0, 40.0, 32.0, 40.0, 42.0, 39.0, 30.0, 22.0, 18.0, 24.0, 17.0, 23.0, 9.0, 8.0, 3.0, 8.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-106.68327331542969, -103.49650573730469, -100.30973052978516, -97.12296295166016, -93.93618774414062, -90.74942016601562, -87.56265258789062, -84.3758773803711, -81.1891098022461, -78.0023422241211, -74.81556701660156, -71.62879943847656, -68.44202423095703, -65.25525665283203, -62.068485260009766, -58.8817138671875, -55.694942474365234, -52.50817108154297, -49.3213996887207, -46.13462829589844, -42.94786071777344, -39.76108932495117, -36.574317932128906, -33.387550354003906, -30.200777053833008, -27.014005661010742, -23.82723617553711, -20.640464782714844, -17.453693389892578, -14.266923904418945, -11.08015251159668, -7.893383026123047, -4.706611633300781, -1.519840955734253, 1.6669297218322754, 4.853700637817383, 8.040471076965332, 11.227241516113281, 14.414012908935547, 17.60078239440918, 20.787553787231445, 23.97432518005371, 27.161094665527344, 30.34786605834961, 33.534637451171875, 36.721405029296875, 39.908180236816406, 43.094947814941406, 46.28171920776367, 49.46849060058594, 52.6552619934082, 55.84203338623047, 59.02880096435547, 62.215572357177734, 65.40234375, 68.589111328125, 71.77588653564453, 74.96265411376953, 78.14942932128906, 81.33619689941406, 84.5229721069336, 87.7097396850586, 90.89651489257812, 94.08328247070312, 97.27005004882812]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 22.0, 33.0, 62.0, 89.0, 132.0, 203.0, 345.0, 588.0, 925.0, 1791.0, 3531.0, 7863.0, 21478.0, 97236.0, 3593024.0, 406738.0, 37408.0, 12195.0, 5113.0, 2503.0, 1245.0, 677.0, 412.0, 252.0, 146.0, 85.0, 58.0, 31.0, 27.0, 16.0, 3.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.7327880859375, -13.254638671875, -12.7764892578125, -12.29833984375, -11.8201904296875, -11.342041015625, -10.8638916015625, -10.3857421875, -9.9075927734375, -9.429443359375, -8.9512939453125, -8.47314453125, -7.9949951171875, -7.516845703125, -7.0386962890625, -6.560546875, -6.0823974609375, -5.604248046875, -5.1260986328125, -4.64794921875, -4.1697998046875, -3.691650390625, -3.2135009765625, -2.7353515625, -2.2572021484375, -1.779052734375, -1.3009033203125, -0.82275390625, -0.3446044921875, 0.133544921875, 0.6116943359375, 1.08984375, 1.5679931640625, 2.046142578125, 2.5242919921875, 3.00244140625, 3.4805908203125, 3.958740234375, 4.4368896484375, 4.9150390625, 5.3931884765625, 5.871337890625, 6.3494873046875, 6.82763671875, 7.3057861328125, 7.783935546875, 8.2620849609375, 8.740234375, 9.2183837890625, 9.696533203125, 10.1746826171875, 10.65283203125, 11.1309814453125, 11.609130859375, 12.0872802734375, 12.5654296875, 13.0435791015625, 13.521728515625, 13.9998779296875, 14.47802734375, 14.9561767578125, 15.434326171875, 15.9124755859375, 16.390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 10.0, 15.0, 25.0, 28.0, 34.0, 51.0, 50.0, 73.0, 62.0, 57.0, 75.0, 66.0, 70.0, 70.0, 54.0, 49.0, 41.0, 28.0, 26.0, 23.0, 17.0, 16.0, 10.0, 12.0, 7.0, 6.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.6953125, -6.49884033203125, -6.3023681640625, -6.10589599609375, -5.909423828125, -5.71295166015625, -5.5164794921875, -5.32000732421875, -5.12353515625, -4.92706298828125, -4.7305908203125, -4.53411865234375, -4.337646484375, -4.14117431640625, -3.9447021484375, -3.74822998046875, -3.5517578125, -3.35528564453125, -3.1588134765625, -2.96234130859375, -2.765869140625, -2.56939697265625, -2.3729248046875, -2.17645263671875, -1.97998046875, -1.78350830078125, -1.5870361328125, -1.39056396484375, -1.194091796875, -0.99761962890625, -0.8011474609375, -0.60467529296875, -0.408203125, -0.21173095703125, -0.0152587890625, 0.18121337890625, 0.377685546875, 0.57415771484375, 0.7706298828125, 0.96710205078125, 1.16357421875, 1.36004638671875, 1.5565185546875, 1.75299072265625, 1.949462890625, 2.14593505859375, 2.3424072265625, 2.53887939453125, 2.7353515625, 2.93182373046875, 3.1282958984375, 3.32476806640625, 3.521240234375, 3.71771240234375, 3.9141845703125, 4.11065673828125, 4.30712890625, 4.50360107421875, 4.7000732421875, 4.89654541015625, 5.093017578125, 5.28948974609375, 5.4859619140625, 5.68243408203125, 5.87890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 18.0, 19.0, 25.0, 27.0, 39.0, 47.0, 80.0, 115.0, 225.0, 322.0, 613.0, 1142.0, 2011.0, 4016.0, 8066.0, 18718.0, 55971.0, 355818.0, 3504023.0, 175654.0, 39531.0, 14345.0, 6205.0, 3238.0, 1681.0, 895.0, 572.0, 278.0, 197.0, 117.0, 88.0, 51.0, 36.0, 22.0, 21.0, 15.0, 6.0, 10.0, 7.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.4114990234375, -12.002685546875, -11.5938720703125, -11.18505859375, -10.7762451171875, -10.367431640625, -9.9586181640625, -9.5498046875, -9.1409912109375, -8.732177734375, -8.3233642578125, -7.91455078125, -7.5057373046875, -7.096923828125, -6.6881103515625, -6.279296875, -5.8704833984375, -5.461669921875, -5.0528564453125, -4.64404296875, -4.2352294921875, -3.826416015625, -3.4176025390625, -3.0087890625, -2.5999755859375, -2.191162109375, -1.7823486328125, -1.37353515625, -0.9647216796875, -0.555908203125, -0.1470947265625, 0.26171875, 0.6705322265625, 1.079345703125, 1.4881591796875, 1.89697265625, 2.3057861328125, 2.714599609375, 3.1234130859375, 3.5322265625, 3.9410400390625, 4.349853515625, 4.7586669921875, 5.16748046875, 5.5762939453125, 5.985107421875, 6.3939208984375, 6.802734375, 7.2115478515625, 7.620361328125, 8.0291748046875, 8.43798828125, 8.8468017578125, 9.255615234375, 9.6644287109375, 10.0732421875, 10.4820556640625, 10.890869140625, 11.2996826171875, 11.70849609375, 12.1173095703125, 12.526123046875, 12.9349365234375, 13.34375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 7.0, 3.0, 15.0, 7.0, 17.0, 19.0, 25.0, 41.0, 52.0, 93.0, 117.0, 271.0, 761.0, 1416.0, 603.0, 241.0, 104.0, 59.0, 60.0, 29.0, 27.0, 20.0, 17.0, 9.0, 11.0, 4.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.703125, -13.20263671875, -12.7021484375, -12.20166015625, -11.701171875, -11.20068359375, -10.7001953125, -10.19970703125, -9.69921875, -9.19873046875, -8.6982421875, -8.19775390625, -7.697265625, -7.19677734375, -6.6962890625, -6.19580078125, -5.6953125, -5.19482421875, -4.6943359375, -4.19384765625, -3.693359375, -3.19287109375, -2.6923828125, -2.19189453125, -1.69140625, -1.19091796875, -0.6904296875, -0.18994140625, 0.310546875, 0.81103515625, 1.3115234375, 1.81201171875, 2.3125, 2.81298828125, 3.3134765625, 3.81396484375, 4.314453125, 4.81494140625, 5.3154296875, 5.81591796875, 6.31640625, 6.81689453125, 7.3173828125, 7.81787109375, 8.318359375, 8.81884765625, 9.3193359375, 9.81982421875, 10.3203125, 10.82080078125, 11.3212890625, 11.82177734375, 12.322265625, 12.82275390625, 13.3232421875, 13.82373046875, 14.32421875, 14.82470703125, 15.3251953125, 15.82568359375, 16.326171875, 16.82666015625, 17.3271484375, 17.82763671875, 18.328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 21.0, 43.0, 154.0, 282.0, 272.0, 125.0, 44.0, 20.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-323.97894287109375, -317.2300720214844, -310.481201171875, -303.7322998046875, -296.9834289550781, -290.23455810546875, -283.4856872558594, -276.73681640625, -269.9879455566406, -263.23907470703125, -256.4902038574219, -249.74131774902344, -242.99244689941406, -236.24356079101562, -229.49468994140625, -222.74581909179688, -215.99691772460938, -209.248046875, -202.49916076660156, -195.7502899169922, -189.0014190673828, -182.25253295898438, -175.503662109375, -168.75479125976562, -162.00592041015625, -155.25704956054688, -148.50816345214844, -141.75929260253906, -135.0104217529297, -128.26153564453125, -121.51266479492188, -114.76378631591797, -108.01490783691406, -101.26602935791016, -94.51715850830078, -87.76828002929688, -81.01940155029297, -74.27052307128906, -67.52165222167969, -60.77277374267578, -54.02389907836914, -47.2750244140625, -40.526145935058594, -33.77727127075195, -27.02839469909668, -20.279518127441406, -13.530643463134766, -6.781764984130859, -0.03289031982421875, 6.7159857749938965, 13.464861869812012, 20.21373748779297, 26.962614059448242, 33.711490631103516, 40.460365295410156, 47.20924377441406, 53.9581184387207, 60.706993103027344, 67.45587158203125, 74.20474243164062, 80.95362091064453, 87.70249938964844, 94.45137023925781, 101.20025634765625, 107.94912719726562]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 7.0, 11.0, 14.0, 15.0, 23.0, 34.0, 22.0, 30.0, 40.0, 46.0, 46.0, 50.0, 44.0, 53.0, 58.0, 57.0, 53.0, 53.0, 47.0, 42.0, 38.0, 32.0, 33.0, 34.0, 23.0, 21.0, 8.0, 14.0, 10.0, 8.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.70966339111328, -71.57650756835938, -69.443359375, -67.3102035522461, -65.17705535888672, -63.04389953613281, -60.91074752807617, -58.77759552001953, -56.644439697265625, -54.511287689208984, -52.378135681152344, -50.24497985839844, -48.1118278503418, -45.978675842285156, -43.845523834228516, -41.712371826171875, -39.579219818115234, -37.446067810058594, -35.31291580200195, -33.17976379394531, -31.046607971191406, -28.913455963134766, -26.780303955078125, -24.647151947021484, -22.51399803161621, -20.38084602355957, -18.247692108154297, -16.114540100097656, -13.9813871383667, -11.848234176635742, -9.715082168579102, -7.5819292068481445, -5.4487762451171875, -3.3156235218048096, -1.1824707984924316, 0.9506816864013672, 3.083834648132324, 5.216987609863281, 7.350139617919922, 9.483292579650879, 11.616445541381836, 13.749598503112793, 15.88275146484375, 18.01590347290039, 20.14905548095703, 22.282209396362305, 24.415361404418945, 26.54851531982422, 28.68166732788086, 30.8148193359375, 32.94797134399414, 35.08112335205078, 37.21427917480469, 39.34743118286133, 41.48058319091797, 43.61373519897461, 45.74688720703125, 47.88003921508789, 50.01319122314453, 52.14634704589844, 54.27949905395508, 56.41265106201172, 58.54580307006836, 60.678955078125, 62.812110900878906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 16.0, 15.0, 17.0, 37.0, 48.0, 85.0, 76.0, 147.0, 238.0, 336.0, 501.0, 745.0, 1242.0, 1971.0, 3649.0, 7057.0, 14776.0, 34832.0, 88901.0, 253111.0, 387278.0, 152252.0, 55972.0, 22783.0, 10280.0, 4995.0, 2783.0, 1562.0, 975.0, 630.0, 388.0, 263.0, 185.0, 112.0, 90.0, 63.0, 44.0, 23.0, 26.0, 12.0, 8.0, 5.0, 1.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6622314453125, -8.355712890625, -8.0491943359375, -7.74267578125, -7.4361572265625, -7.129638671875, -6.8231201171875, -6.5166015625, -6.2100830078125, -5.903564453125, -5.5970458984375, -5.29052734375, -4.9840087890625, -4.677490234375, -4.3709716796875, -4.064453125, -3.7579345703125, -3.451416015625, -3.1448974609375, -2.83837890625, -2.5318603515625, -2.225341796875, -1.9188232421875, -1.6123046875, -1.3057861328125, -0.999267578125, -0.6927490234375, -0.38623046875, -0.0797119140625, 0.226806640625, 0.5333251953125, 0.83984375, 1.1463623046875, 1.452880859375, 1.7593994140625, 2.06591796875, 2.3724365234375, 2.678955078125, 2.9854736328125, 3.2919921875, 3.5985107421875, 3.905029296875, 4.2115478515625, 4.51806640625, 4.8245849609375, 5.131103515625, 5.4376220703125, 5.744140625, 6.0506591796875, 6.357177734375, 6.6636962890625, 6.97021484375, 7.2767333984375, 7.583251953125, 7.8897705078125, 8.1962890625, 8.5028076171875, 8.809326171875, 9.1158447265625, 9.42236328125, 9.7288818359375, 10.035400390625, 10.3419189453125, 10.6484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 0.0, 7.0, 15.0, 13.0, 21.0, 23.0, 21.0, 35.0, 46.0, 46.0, 55.0, 49.0, 50.0, 53.0, 51.0, 59.0, 74.0, 57.0, 41.0, 45.0, 34.0, 40.0, 30.0, 21.0, 17.0, 24.0, 13.0, 17.0, 7.0, 10.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.9298095703125, -3.765869140625, -3.6019287109375, -3.43798828125, -3.2740478515625, -3.110107421875, -2.9461669921875, -2.7822265625, -2.6182861328125, -2.454345703125, -2.2904052734375, -2.12646484375, -1.9625244140625, -1.798583984375, -1.6346435546875, -1.470703125, -1.3067626953125, -1.142822265625, -0.9788818359375, -0.81494140625, -0.6510009765625, -0.487060546875, -0.3231201171875, -0.1591796875, 0.0047607421875, 0.168701171875, 0.3326416015625, 0.49658203125, 0.6605224609375, 0.824462890625, 0.9884033203125, 1.15234375, 1.3162841796875, 1.480224609375, 1.6441650390625, 1.80810546875, 1.9720458984375, 2.135986328125, 2.2999267578125, 2.4638671875, 2.6278076171875, 2.791748046875, 2.9556884765625, 3.11962890625, 3.2835693359375, 3.447509765625, 3.6114501953125, 3.775390625, 3.9393310546875, 4.103271484375, 4.2672119140625, 4.43115234375, 4.5950927734375, 4.759033203125, 4.9229736328125, 5.0869140625, 5.2508544921875, 5.414794921875, 5.5787353515625, 5.74267578125, 5.9066162109375, 6.070556640625, 6.2344970703125, 6.3984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 12.0, 13.0, 14.0, 25.0, 31.0, 63.0, 86.0, 128.0, 231.0, 403.0, 819.0, 2017.0, 6475.0, 39311.0, 649931.0, 316538.0, 24226.0, 4852.0, 1627.0, 765.0, 387.0, 213.0, 128.0, 82.0, 58.0, 33.0, 22.0, 12.0, 11.0, 11.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.765625, -20.02099609375, -19.2763671875, -18.53173828125, -17.787109375, -17.04248046875, -16.2978515625, -15.55322265625, -14.80859375, -14.06396484375, -13.3193359375, -12.57470703125, -11.830078125, -11.08544921875, -10.3408203125, -9.59619140625, -8.8515625, -8.10693359375, -7.3623046875, -6.61767578125, -5.873046875, -5.12841796875, -4.3837890625, -3.63916015625, -2.89453125, -2.14990234375, -1.4052734375, -0.66064453125, 0.083984375, 0.82861328125, 1.5732421875, 2.31787109375, 3.0625, 3.80712890625, 4.5517578125, 5.29638671875, 6.041015625, 6.78564453125, 7.5302734375, 8.27490234375, 9.01953125, 9.76416015625, 10.5087890625, 11.25341796875, 11.998046875, 12.74267578125, 13.4873046875, 14.23193359375, 14.9765625, 15.72119140625, 16.4658203125, 17.21044921875, 17.955078125, 18.69970703125, 19.4443359375, 20.18896484375, 20.93359375, 21.67822265625, 22.4228515625, 23.16748046875, 23.912109375, 24.65673828125, 25.4013671875, 26.14599609375, 26.890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 6.0, 14.0, 9.0, 8.0, 12.0, 15.0, 16.0, 20.0, 21.0, 35.0, 37.0, 35.0, 38.0, 57.0, 61.0, 58.0, 60.0, 59.0, 54.0, 46.0, 56.0, 52.0, 33.0, 26.0, 33.0, 25.0, 22.0, 20.0, 18.0, 15.0, 12.0, 8.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.953125, -18.265625, -17.578125, -16.890625, -16.203125, -15.515625, -14.828125, -14.140625, -13.453125, -12.765625, -12.078125, -11.390625, -10.703125, -10.015625, -9.328125, -8.640625, -7.953125, -7.265625, -6.578125, -5.890625, -5.203125, -4.515625, -3.828125, -3.140625, -2.453125, -1.765625, -1.078125, -0.390625, 0.296875, 0.984375, 1.671875, 2.359375, 3.046875, 3.734375, 4.421875, 5.109375, 5.796875, 6.484375, 7.171875, 7.859375, 8.546875, 9.234375, 9.921875, 10.609375, 11.296875, 11.984375, 12.671875, 13.359375, 14.046875, 14.734375, 15.421875, 16.109375, 16.796875, 17.484375, 18.171875, 18.859375, 19.546875, 20.234375, 20.921875, 21.609375, 22.296875, 22.984375, 23.671875, 24.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 12.0, 16.0, 31.0, 40.0, 77.0, 137.0, 272.0, 585.0, 1412.0, 4773.0, 24360.0, 398572.0, 581404.0, 28568.0, 5431.0, 1610.0, 603.0, 265.0, 150.0, 85.0, 46.0, 33.0, 23.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.4129638671875, -10.146240234375, -9.8795166015625, -9.61279296875, -9.3460693359375, -9.079345703125, -8.8126220703125, -8.5458984375, -8.2791748046875, -8.012451171875, -7.7457275390625, -7.47900390625, -7.2122802734375, -6.945556640625, -6.6788330078125, -6.412109375, -6.1453857421875, -5.878662109375, -5.6119384765625, -5.34521484375, -5.0784912109375, -4.811767578125, -4.5450439453125, -4.2783203125, -4.0115966796875, -3.744873046875, -3.4781494140625, -3.21142578125, -2.9447021484375, -2.677978515625, -2.4112548828125, -2.14453125, -1.8778076171875, -1.611083984375, -1.3443603515625, -1.07763671875, -0.8109130859375, -0.544189453125, -0.2774658203125, -0.0107421875, 0.2559814453125, 0.522705078125, 0.7894287109375, 1.05615234375, 1.3228759765625, 1.589599609375, 1.8563232421875, 2.123046875, 2.3897705078125, 2.656494140625, 2.9232177734375, 3.18994140625, 3.4566650390625, 3.723388671875, 3.9901123046875, 4.2568359375, 4.5235595703125, 4.790283203125, 5.0570068359375, 5.32373046875, 5.5904541015625, 5.857177734375, 6.1239013671875, 6.390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 15.0, 17.0, 16.0, 27.0, 45.0, 58.0, 69.0, 109.0, 131.0, 128.0, 90.0, 66.0, 59.0, 33.0, 35.0, 19.0, 8.0, 7.0, 8.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001041412353515625, -0.0010052919387817383, -0.0009691715240478516, -0.0009330511093139648, -0.0008969306945800781, -0.0008608102798461914, -0.0008246898651123047, -0.000788569450378418, -0.0007524490356445312, -0.0007163286209106445, -0.0006802082061767578, -0.0006440877914428711, -0.0006079673767089844, -0.0005718469619750977, -0.0005357265472412109, -0.0004996061325073242, -0.0004634857177734375, -0.0004273653030395508, -0.00039124488830566406, -0.00035512447357177734, -0.0003190040588378906, -0.0002828836441040039, -0.0002467632293701172, -0.00021064281463623047, -0.00017452239990234375, -0.00013840198516845703, -0.00010228157043457031, -6.61611557006836e-05, -3.0040740966796875e-05, 6.079673767089844e-06, 4.220008850097656e-05, 7.832050323486328e-05, 0.00011444091796875, 0.00015056133270263672, 0.00018668174743652344, 0.00022280216217041016, 0.0002589225769042969, 0.0002950429916381836, 0.0003311634063720703, 0.00036728382110595703, 0.00040340423583984375, 0.00043952465057373047, 0.0004756450653076172, 0.0005117654800415039, 0.0005478858947753906, 0.0005840063095092773, 0.0006201267242431641, 0.0006562471389770508, 0.0006923675537109375, 0.0007284879684448242, 0.0007646083831787109, 0.0008007287979125977, 0.0008368492126464844, 0.0008729696273803711, 0.0009090900421142578, 0.0009452104568481445, 0.0009813308715820312, 0.001017451286315918, 0.0010535717010498047, 0.0010896921157836914, 0.0011258125305175781, 0.0011619329452514648, 0.0011980533599853516, 0.0012341737747192383, 0.001270294189453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 8.0, 5.0, 9.0, 17.0, 13.0, 31.0, 59.0, 63.0, 69.0, 97.0, 178.0, 308.0, 546.0, 1081.0, 2134.0, 6084.0, 23758.0, 171669.0, 727649.0, 91078.0, 15430.0, 4560.0, 1693.0, 786.0, 424.0, 241.0, 166.0, 110.0, 72.0, 54.0, 47.0, 27.0, 20.0, 16.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.00921630859375, -4.8035888671875, -4.59796142578125, -4.392333984375, -4.18670654296875, -3.9810791015625, -3.77545166015625, -3.56982421875, -3.36419677734375, -3.1585693359375, -2.95294189453125, -2.747314453125, -2.54168701171875, -2.3360595703125, -2.13043212890625, -1.9248046875, -1.71917724609375, -1.5135498046875, -1.30792236328125, -1.102294921875, -0.89666748046875, -0.6910400390625, -0.48541259765625, -0.27978515625, -0.07415771484375, 0.1314697265625, 0.33709716796875, 0.542724609375, 0.74835205078125, 0.9539794921875, 1.15960693359375, 1.365234375, 1.57086181640625, 1.7764892578125, 1.98211669921875, 2.187744140625, 2.39337158203125, 2.5989990234375, 2.80462646484375, 3.01025390625, 3.21588134765625, 3.4215087890625, 3.62713623046875, 3.832763671875, 4.03839111328125, 4.2440185546875, 4.44964599609375, 4.6552734375, 4.86090087890625, 5.0665283203125, 5.27215576171875, 5.477783203125, 5.68341064453125, 5.8890380859375, 6.09466552734375, 6.30029296875, 6.50592041015625, 6.7115478515625, 6.91717529296875, 7.122802734375, 7.32843017578125, 7.5340576171875, 7.73968505859375, 7.9453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 3.0, 10.0, 10.0, 10.0, 16.0, 22.0, 19.0, 28.0, 34.0, 55.0, 51.0, 63.0, 85.0, 91.0, 88.0, 76.0, 78.0, 35.0, 36.0, 35.0, 26.0, 23.0, 24.0, 25.0, 12.0, 12.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.43359375, -5.245361328125, -5.05712890625, -4.868896484375, -4.6806640625, -4.492431640625, -4.30419921875, -4.115966796875, -3.927734375, -3.739501953125, -3.55126953125, -3.363037109375, -3.1748046875, -2.986572265625, -2.79833984375, -2.610107421875, -2.421875, -2.233642578125, -2.04541015625, -1.857177734375, -1.6689453125, -1.480712890625, -1.29248046875, -1.104248046875, -0.916015625, -0.727783203125, -0.53955078125, -0.351318359375, -0.1630859375, 0.025146484375, 0.21337890625, 0.401611328125, 0.58984375, 0.778076171875, 0.96630859375, 1.154541015625, 1.3427734375, 1.531005859375, 1.71923828125, 1.907470703125, 2.095703125, 2.283935546875, 2.47216796875, 2.660400390625, 2.8486328125, 3.036865234375, 3.22509765625, 3.413330078125, 3.6015625, 3.789794921875, 3.97802734375, 4.166259765625, 4.3544921875, 4.542724609375, 4.73095703125, 4.919189453125, 5.107421875, 5.295654296875, 5.48388671875, 5.672119140625, 5.8603515625, 6.048583984375, 6.23681640625, 6.425048828125, 6.61328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 11.0, 29.0, 47.0, 97.0, 130.0, 207.0, 184.0, 134.0, 52.0, 39.0, 22.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.02127075195312, -166.4908447265625, -161.96041870117188, -157.42999267578125, -152.89956665039062, -148.369140625, -143.83871459960938, -139.30828857421875, -134.77786254882812, -130.2474365234375, -125.71701049804688, -121.18658447265625, -116.65615844726562, -112.125732421875, -107.5953140258789, -103.06488800048828, -98.53446960449219, -94.00404357910156, -89.47361755371094, -84.94319152832031, -80.41276550292969, -75.88233947753906, -71.35192108154297, -66.82149505615234, -62.29106903076172, -57.760643005371094, -53.23021697998047, -48.69979476928711, -44.169368743896484, -39.63894271850586, -35.1085205078125, -30.578094482421875, -26.047653198242188, -21.517227172851562, -16.98680305480957, -12.456377983093262, -7.925952911376953, -3.395526885986328, 1.134897232055664, 5.665321350097656, 10.195747375488281, 14.72617244720459, 19.2565975189209, 23.78702163696289, 28.317447662353516, 32.84787368774414, 37.3782958984375, 41.908721923828125, 46.43914794921875, 50.969573974609375, 55.5, 60.03042221069336, 64.56085205078125, 69.09127807617188, 73.62169647216797, 78.1521224975586, 82.68254852294922, 87.21297454833984, 91.74340057373047, 96.2738265991211, 100.80424499511719, 105.33467102050781, 109.86509704589844, 114.39552307128906, 118.92594909667969]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 5.0, 15.0, 13.0, 17.0, 15.0, 27.0, 20.0, 26.0, 30.0, 24.0, 41.0, 31.0, 50.0, 44.0, 67.0, 65.0, 52.0, 65.0, 58.0, 35.0, 43.0, 32.0, 41.0, 31.0, 24.0, 16.0, 23.0, 18.0, 15.0, 11.0, 8.0, 3.0, 9.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-89.40168762207031, -86.83890533447266, -84.27611541748047, -81.71333312988281, -79.15055084228516, -76.5877685546875, -74.02497863769531, -71.46219635009766, -68.8994140625, -66.33663177490234, -63.77384567260742, -61.2110595703125, -58.648277282714844, -56.08549118041992, -53.522705078125, -50.959922790527344, -48.39713668823242, -45.8343505859375, -43.271568298339844, -40.70878219604492, -38.145999908447266, -35.583213806152344, -33.02043151855469, -30.457645416259766, -27.894861221313477, -25.332077026367188, -22.7692928314209, -20.20650863647461, -17.643722534179688, -15.080939292907715, -12.51815414428711, -9.95536994934082, -7.392585754394531, -4.829801559448242, -2.267016887664795, 0.29576778411865234, 2.8585519790649414, 5.4213361740112305, 7.984121322631836, 10.546905517578125, 13.109689712524414, 15.672473907470703, 18.235258102416992, 20.79804229736328, 23.360828399658203, 25.92361068725586, 28.48639678955078, 31.04918098449707, 33.61196517944336, 36.17475128173828, 38.73753356933594, 41.30031967163086, 43.863101959228516, 46.42588806152344, 48.988670349121094, 51.551456451416016, 54.11424255371094, 56.67702865600586, 59.239810943603516, 61.80259704589844, 64.3653793334961, 66.92816162109375, 69.49095153808594, 72.0537338256836, 74.61651611328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 2.0, 14.0, 13.0, 19.0, 33.0, 51.0, 83.0, 178.0, 494.0, 3460.0, 3793231.0, 393432.0, 2491.0, 407.0, 148.0, 76.0, 43.0, 30.0, 20.0, 15.0, 8.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.69580078125, -62.0166015625, -60.33740234375, -58.658203125, -56.97900390625, -55.2998046875, -53.62060546875, -51.94140625, -50.26220703125, -48.5830078125, -46.90380859375, -45.224609375, -43.54541015625, -41.8662109375, -40.18701171875, -38.5078125, -36.82861328125, -35.1494140625, -33.47021484375, -31.791015625, -30.11181640625, -28.4326171875, -26.75341796875, -25.07421875, -23.39501953125, -21.7158203125, -20.03662109375, -18.357421875, -16.67822265625, -14.9990234375, -13.31982421875, -11.640625, -9.96142578125, -8.2822265625, -6.60302734375, -4.923828125, -3.24462890625, -1.5654296875, 0.11376953125, 1.79296875, 3.47216796875, 5.1513671875, 6.83056640625, 8.509765625, 10.18896484375, 11.8681640625, 13.54736328125, 15.2265625, 16.90576171875, 18.5849609375, 20.26416015625, 21.943359375, 23.62255859375, 25.3017578125, 26.98095703125, 28.66015625, 30.33935546875, 32.0185546875, 33.69775390625, 35.376953125, 37.05615234375, 38.7353515625, 40.41455078125, 42.09375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 17.0, 22.0, 22.0, 44.0, 52.0, 69.0, 86.0, 84.0, 86.0, 104.0, 82.0, 85.0, 55.0, 57.0, 31.0, 35.0, 26.0, 19.0, 13.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0078125, -9.75823974609375, -9.5086669921875, -9.25909423828125, -9.009521484375, -8.75994873046875, -8.5103759765625, -8.26080322265625, -8.01123046875, -7.76165771484375, -7.5120849609375, -7.26251220703125, -7.012939453125, -6.76336669921875, -6.5137939453125, -6.26422119140625, -6.0146484375, -5.76507568359375, -5.5155029296875, -5.26593017578125, -5.016357421875, -4.76678466796875, -4.5172119140625, -4.26763916015625, -4.01806640625, -3.76849365234375, -3.5189208984375, -3.26934814453125, -3.019775390625, -2.77020263671875, -2.5206298828125, -2.27105712890625, -2.021484375, -1.77191162109375, -1.5223388671875, -1.27276611328125, -1.023193359375, -0.77362060546875, -0.5240478515625, -0.27447509765625, -0.02490234375, 0.22467041015625, 0.4742431640625, 0.72381591796875, 0.973388671875, 1.22296142578125, 1.4725341796875, 1.72210693359375, 1.9716796875, 2.22125244140625, 2.4708251953125, 2.72039794921875, 2.969970703125, 3.21954345703125, 3.4691162109375, 3.71868896484375, 3.96826171875, 4.21783447265625, 4.4674072265625, 4.71697998046875, 4.966552734375, 5.21612548828125, 5.4656982421875, 5.71527099609375, 5.96484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 15.0, 16.0, 25.0, 34.0, 60.0, 64.0, 128.0, 195.0, 379.0, 677.0, 1309.0, 2739.0, 6917.0, 20299.0, 85019.0, 2219743.0, 1741078.0, 81150.0, 20670.0, 7291.0, 3142.0, 1461.0, 740.0, 410.0, 251.0, 133.0, 100.0, 64.0, 51.0, 29.0, 29.0, 14.0, 17.0, 5.0, 9.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.951171875, -10.59765625, -10.244140625, -9.890625, -9.537109375, -9.18359375, -8.830078125, -8.4765625, -8.123046875, -7.76953125, -7.416015625, -7.0625, -6.708984375, -6.35546875, -6.001953125, -5.6484375, -5.294921875, -4.94140625, -4.587890625, -4.234375, -3.880859375, -3.52734375, -3.173828125, -2.8203125, -2.466796875, -2.11328125, -1.759765625, -1.40625, -1.052734375, -0.69921875, -0.345703125, 0.0078125, 0.361328125, 0.71484375, 1.068359375, 1.421875, 1.775390625, 2.12890625, 2.482421875, 2.8359375, 3.189453125, 3.54296875, 3.896484375, 4.25, 4.603515625, 4.95703125, 5.310546875, 5.6640625, 6.017578125, 6.37109375, 6.724609375, 7.078125, 7.431640625, 7.78515625, 8.138671875, 8.4921875, 8.845703125, 9.19921875, 9.552734375, 9.90625, 10.259765625, 10.61328125, 10.966796875, 11.3203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 7.0, 16.0, 17.0, 32.0, 36.0, 67.0, 110.0, 327.0, 902.0, 1487.0, 575.0, 196.0, 82.0, 62.0, 48.0, 30.0, 14.0, 19.0, 8.0, 11.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.9921875, -13.530029296875, -13.06787109375, -12.605712890625, -12.1435546875, -11.681396484375, -11.21923828125, -10.757080078125, -10.294921875, -9.832763671875, -9.37060546875, -8.908447265625, -8.4462890625, -7.984130859375, -7.52197265625, -7.059814453125, -6.59765625, -6.135498046875, -5.67333984375, -5.211181640625, -4.7490234375, -4.286865234375, -3.82470703125, -3.362548828125, -2.900390625, -2.438232421875, -1.97607421875, -1.513916015625, -1.0517578125, -0.589599609375, -0.12744140625, 0.334716796875, 0.796875, 1.259033203125, 1.72119140625, 2.183349609375, 2.6455078125, 3.107666015625, 3.56982421875, 4.031982421875, 4.494140625, 4.956298828125, 5.41845703125, 5.880615234375, 6.3427734375, 6.804931640625, 7.26708984375, 7.729248046875, 8.19140625, 8.653564453125, 9.11572265625, 9.577880859375, 10.0400390625, 10.502197265625, 10.96435546875, 11.426513671875, 11.888671875, 12.350830078125, 12.81298828125, 13.275146484375, 13.7373046875, 14.199462890625, 14.66162109375, 15.123779296875, 15.5859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 17.0, 54.0, 273.0, 391.0, 174.0, 39.0, 22.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.26020812988281, -61.57416534423828, -54.88812255859375, -48.202083587646484, -41.51604080200195, -34.82999801635742, -28.143959045410156, -21.457916259765625, -14.771873474121094, -8.085831642150879, -1.399789810180664, 5.286251068115234, 11.972293853759766, 18.658336639404297, 25.344375610351562, 32.030418395996094, 38.716461181640625, 45.402503967285156, 52.08854675292969, 58.77458572387695, 65.46063232421875, 72.14666748046875, 78.83271026611328, 85.51875305175781, 92.20479583740234, 98.89083862304688, 105.5768814086914, 112.26292419433594, 118.94895935058594, 125.635009765625, 132.321044921875, 139.007080078125, 145.69314575195312, 152.37918090820312, 159.0652313232422, 165.7512664794922, 172.43731689453125, 179.12335205078125, 185.80938720703125, 192.4954376220703, 199.18148803710938, 205.86752319335938, 212.55357360839844, 219.23960876464844, 225.9256591796875, 232.6116943359375, 239.2977294921875, 245.98377990722656, 252.66981506347656, 259.3558654785156, 266.0419006347656, 272.7279357910156, 279.4139709472656, 286.10003662109375, 292.78607177734375, 299.47210693359375, 306.15814208984375, 312.84417724609375, 319.53021240234375, 326.2162780761719, 332.9023132324219, 339.5883483886719, 346.2743835449219, 352.96044921875, 359.646484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 9.0, 17.0, 17.0, 25.0, 41.0, 32.0, 44.0, 41.0, 52.0, 78.0, 62.0, 58.0, 62.0, 57.0, 41.0, 58.0, 54.0, 49.0, 40.0, 35.0, 30.0, 21.0, 16.0, 14.0, 16.0, 6.0, 7.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.45680236816406, -48.3878173828125, -46.3188362121582, -44.24985122680664, -42.180870056152344, -40.11188507080078, -38.04290008544922, -35.973915100097656, -33.90493392944336, -31.83595085144043, -29.7669677734375, -27.697982788085938, -25.628999710083008, -23.560016632080078, -21.491031646728516, -19.422048568725586, -17.353065490722656, -15.284082412719727, -13.21509838104248, -11.146114349365234, -9.077131271362305, -7.008148193359375, -4.939164161682129, -2.870180130004883, -0.8011970520019531, 1.2677865028381348, 3.3367700576782227, 5.4057536125183105, 7.474737167358398, 9.543720245361328, 11.612704277038574, 13.68168830871582, 15.75067138671875, 17.81965446472168, 19.88863754272461, 21.957622528076172, 24.0266056060791, 26.09558868408203, 28.164573669433594, 30.233556747436523, 32.30253982543945, 34.371524810791016, 36.44050598144531, 38.509490966796875, 40.57847595214844, 42.647457122802734, 44.7164421081543, 46.785423278808594, 48.854408264160156, 50.92339324951172, 52.992374420166016, 55.06135940551758, 57.130340576171875, 59.19932556152344, 61.268310546875, 63.33729553222656, 65.40628051757812, 67.47526550292969, 69.54425048828125, 71.61322784423828, 73.68221282958984, 75.7511978149414, 77.82018280029297, 79.88916778564453, 81.95814514160156]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 10.0, 7.0, 21.0, 26.0, 20.0, 27.0, 63.0, 66.0, 108.0, 155.0, 214.0, 355.0, 631.0, 1005.0, 1784.0, 3622.0, 7951.0, 19529.0, 54320.0, 168365.0, 445453.0, 228857.0, 71076.0, 25298.0, 9821.0, 4516.0, 2157.0, 1185.0, 683.0, 400.0, 278.0, 173.0, 120.0, 87.0, 43.0, 32.0, 21.0, 28.0, 13.0, 6.0, 5.0, 4.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.25, -9.9451904296875, -9.640380859375, -9.3355712890625, -9.03076171875, -8.7259521484375, -8.421142578125, -8.1163330078125, -7.8115234375, -7.5067138671875, -7.201904296875, -6.8970947265625, -6.59228515625, -6.2874755859375, -5.982666015625, -5.6778564453125, -5.373046875, -5.0682373046875, -4.763427734375, -4.4586181640625, -4.15380859375, -3.8489990234375, -3.544189453125, -3.2393798828125, -2.9345703125, -2.6297607421875, -2.324951171875, -2.0201416015625, -1.71533203125, -1.4105224609375, -1.105712890625, -0.8009033203125, -0.49609375, -0.1912841796875, 0.113525390625, 0.4183349609375, 0.72314453125, 1.0279541015625, 1.332763671875, 1.6375732421875, 1.9423828125, 2.2471923828125, 2.552001953125, 2.8568115234375, 3.16162109375, 3.4664306640625, 3.771240234375, 4.0760498046875, 4.380859375, 4.6856689453125, 4.990478515625, 5.2952880859375, 5.60009765625, 5.9049072265625, 6.209716796875, 6.5145263671875, 6.8193359375, 7.1241455078125, 7.428955078125, 7.7337646484375, 8.03857421875, 8.3433837890625, 8.648193359375, 8.9530029296875, 9.2578125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 10.0, 11.0, 13.0, 15.0, 25.0, 27.0, 26.0, 34.0, 40.0, 37.0, 38.0, 41.0, 52.0, 58.0, 55.0, 54.0, 52.0, 56.0, 55.0, 30.0, 40.0, 40.0, 35.0, 22.0, 29.0, 26.0, 17.0, 14.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.260223388671875, -3.11224365234375, -2.964263916015625, -2.8162841796875, -2.668304443359375, -2.52032470703125, -2.372344970703125, -2.224365234375, -2.076385498046875, -1.92840576171875, -1.780426025390625, -1.6324462890625, -1.484466552734375, -1.33648681640625, -1.188507080078125, -1.04052734375, -0.892547607421875, -0.74456787109375, -0.596588134765625, -0.4486083984375, -0.300628662109375, -0.15264892578125, -0.004669189453125, 0.143310546875, 0.291290283203125, 0.43927001953125, 0.587249755859375, 0.7352294921875, 0.883209228515625, 1.03118896484375, 1.179168701171875, 1.3271484375, 1.475128173828125, 1.62310791015625, 1.771087646484375, 1.9190673828125, 2.067047119140625, 2.21502685546875, 2.363006591796875, 2.510986328125, 2.658966064453125, 2.80694580078125, 2.954925537109375, 3.1029052734375, 3.250885009765625, 3.39886474609375, 3.546844482421875, 3.69482421875, 3.842803955078125, 3.99078369140625, 4.138763427734375, 4.2867431640625, 4.434722900390625, 4.58270263671875, 4.730682373046875, 4.878662109375, 5.026641845703125, 5.17462158203125, 5.322601318359375, 5.4705810546875, 5.618560791015625, 5.76654052734375, 5.914520263671875, 6.0625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 8.0, 13.0, 19.0, 39.0, 36.0, 47.0, 101.0, 170.0, 259.0, 524.0, 1001.0, 2405.0, 7045.0, 31429.0, 233871.0, 672907.0, 77990.0, 13779.0, 3884.0, 1423.0, 639.0, 370.0, 196.0, 132.0, 70.0, 52.0, 39.0, 27.0, 10.0, 17.0, 11.0, 12.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.6875, -16.1357421875, -15.583984375, -15.0322265625, -14.48046875, -13.9287109375, -13.376953125, -12.8251953125, -12.2734375, -11.7216796875, -11.169921875, -10.6181640625, -10.06640625, -9.5146484375, -8.962890625, -8.4111328125, -7.859375, -7.3076171875, -6.755859375, -6.2041015625, -5.65234375, -5.1005859375, -4.548828125, -3.9970703125, -3.4453125, -2.8935546875, -2.341796875, -1.7900390625, -1.23828125, -0.6865234375, -0.134765625, 0.4169921875, 0.96875, 1.5205078125, 2.072265625, 2.6240234375, 3.17578125, 3.7275390625, 4.279296875, 4.8310546875, 5.3828125, 5.9345703125, 6.486328125, 7.0380859375, 7.58984375, 8.1416015625, 8.693359375, 9.2451171875, 9.796875, 10.3486328125, 10.900390625, 11.4521484375, 12.00390625, 12.5556640625, 13.107421875, 13.6591796875, 14.2109375, 14.7626953125, 15.314453125, 15.8662109375, 16.41796875, 16.9697265625, 17.521484375, 18.0732421875, 18.625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 6.0, 17.0, 12.0, 17.0, 29.0, 23.0, 34.0, 33.0, 37.0, 45.0, 38.0, 50.0, 44.0, 40.0, 52.0, 46.0, 45.0, 31.0, 44.0, 49.0, 35.0, 30.0, 43.0, 33.0, 25.0, 22.0, 14.0, 8.0, 12.0, 11.0, 11.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.046875, -14.549560546875, -14.05224609375, -13.554931640625, -13.0576171875, -12.560302734375, -12.06298828125, -11.565673828125, -11.068359375, -10.571044921875, -10.07373046875, -9.576416015625, -9.0791015625, -8.581787109375, -8.08447265625, -7.587158203125, -7.08984375, -6.592529296875, -6.09521484375, -5.597900390625, -5.1005859375, -4.603271484375, -4.10595703125, -3.608642578125, -3.111328125, -2.614013671875, -2.11669921875, -1.619384765625, -1.1220703125, -0.624755859375, -0.12744140625, 0.369873046875, 0.8671875, 1.364501953125, 1.86181640625, 2.359130859375, 2.8564453125, 3.353759765625, 3.85107421875, 4.348388671875, 4.845703125, 5.343017578125, 5.84033203125, 6.337646484375, 6.8349609375, 7.332275390625, 7.82958984375, 8.326904296875, 8.82421875, 9.321533203125, 9.81884765625, 10.316162109375, 10.8134765625, 11.310791015625, 11.80810546875, 12.305419921875, 12.802734375, 13.300048828125, 13.79736328125, 14.294677734375, 14.7919921875, 15.289306640625, 15.78662109375, 16.283935546875, 16.78125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 15.0, 21.0, 22.0, 26.0, 43.0, 87.0, 144.0, 362.0, 999.0, 4004.0, 29955.0, 794061.0, 204478.0, 11049.0, 2086.0, 599.0, 262.0, 137.0, 66.0, 39.0, 31.0, 16.0, 9.0, 6.0, 11.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.7578125, -7.505859375, -7.25390625, -7.001953125, -6.75, -6.498046875, -6.24609375, -5.994140625, -5.7421875, -5.490234375, -5.23828125, -4.986328125, -4.734375, -4.482421875, -4.23046875, -3.978515625, -3.7265625, -3.474609375, -3.22265625, -2.970703125, -2.71875, -2.466796875, -2.21484375, -1.962890625, -1.7109375, -1.458984375, -1.20703125, -0.955078125, -0.703125, -0.451171875, -0.19921875, 0.052734375, 0.3046875, 0.556640625, 0.80859375, 1.060546875, 1.3125, 1.564453125, 1.81640625, 2.068359375, 2.3203125, 2.572265625, 2.82421875, 3.076171875, 3.328125, 3.580078125, 3.83203125, 4.083984375, 4.3359375, 4.587890625, 4.83984375, 5.091796875, 5.34375, 5.595703125, 5.84765625, 6.099609375, 6.3515625, 6.603515625, 6.85546875, 7.107421875, 7.359375, 7.611328125, 7.86328125, 8.115234375, 8.3671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 12.0, 6.0, 9.0, 19.0, 29.0, 50.0, 62.0, 87.0, 150.0, 134.0, 145.0, 106.0, 84.0, 26.0, 26.0, 25.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.002086639404296875, -0.002041757106781006, -0.0019968748092651367, -0.0019519925117492676, -0.0019071102142333984, -0.0018622279167175293, -0.0018173456192016602, -0.001772463321685791, -0.0017275810241699219, -0.0016826987266540527, -0.0016378164291381836, -0.0015929341316223145, -0.0015480518341064453, -0.0015031695365905762, -0.001458287239074707, -0.0014134049415588379, -0.0013685226440429688, -0.0013236403465270996, -0.0012787580490112305, -0.0012338757514953613, -0.0011889934539794922, -0.001144111156463623, -0.001099228858947754, -0.0010543465614318848, -0.0010094642639160156, -0.0009645819664001465, -0.0009196996688842773, -0.0008748173713684082, -0.0008299350738525391, -0.0007850527763366699, -0.0007401704788208008, -0.0006952881813049316, -0.0006504058837890625, -0.0006055235862731934, -0.0005606412887573242, -0.0005157589912414551, -0.00047087669372558594, -0.0004259943962097168, -0.00038111209869384766, -0.0003362298011779785, -0.0002913475036621094, -0.00024646520614624023, -0.0002015829086303711, -0.00015670061111450195, -0.00011181831359863281, -6.693601608276367e-05, -2.205371856689453e-05, 2.282857894897461e-05, 6.771087646484375e-05, 0.00011259317398071289, 0.00015747547149658203, 0.00020235776901245117, 0.0002472400665283203, 0.00029212236404418945, 0.0003370046615600586, 0.00038188695907592773, 0.0004267692565917969, 0.000471651554107666, 0.0005165338516235352, 0.0005614161491394043, 0.0006062984466552734, 0.0006511807441711426, 0.0006960630416870117, 0.0007409453392028809, 0.00078582763671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 7.0, 8.0, 11.0, 18.0, 18.0, 36.0, 63.0, 89.0, 153.0, 333.0, 825.0, 2465.0, 12026.0, 147405.0, 827352.0, 48874.0, 6090.0, 1576.0, 583.0, 263.0, 129.0, 83.0, 54.0, 32.0, 20.0, 12.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.72265625, -7.49761962890625, -7.2725830078125, -7.04754638671875, -6.822509765625, -6.59747314453125, -6.3724365234375, -6.14739990234375, -5.92236328125, -5.69732666015625, -5.4722900390625, -5.24725341796875, -5.022216796875, -4.79718017578125, -4.5721435546875, -4.34710693359375, -4.1220703125, -3.89703369140625, -3.6719970703125, -3.44696044921875, -3.221923828125, -2.99688720703125, -2.7718505859375, -2.54681396484375, -2.32177734375, -2.09674072265625, -1.8717041015625, -1.64666748046875, -1.421630859375, -1.19659423828125, -0.9715576171875, -0.74652099609375, -0.521484375, -0.29644775390625, -0.0714111328125, 0.15362548828125, 0.378662109375, 0.60369873046875, 0.8287353515625, 1.05377197265625, 1.27880859375, 1.50384521484375, 1.7288818359375, 1.95391845703125, 2.178955078125, 2.40399169921875, 2.6290283203125, 2.85406494140625, 3.0791015625, 3.30413818359375, 3.5291748046875, 3.75421142578125, 3.979248046875, 4.20428466796875, 4.4293212890625, 4.65435791015625, 4.87939453125, 5.10443115234375, 5.3294677734375, 5.55450439453125, 5.779541015625, 6.00457763671875, 6.2296142578125, 6.45465087890625, 6.6796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 15.0, 11.0, 13.0, 21.0, 21.0, 38.0, 59.0, 51.0, 88.0, 73.0, 96.0, 89.0, 81.0, 65.0, 41.0, 47.0, 41.0, 24.0, 26.0, 12.0, 16.0, 11.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.43359375, -4.2994384765625, -4.165283203125, -4.0311279296875, -3.89697265625, -3.7628173828125, -3.628662109375, -3.4945068359375, -3.3603515625, -3.2261962890625, -3.092041015625, -2.9578857421875, -2.82373046875, -2.6895751953125, -2.555419921875, -2.4212646484375, -2.287109375, -2.1529541015625, -2.018798828125, -1.8846435546875, -1.75048828125, -1.6163330078125, -1.482177734375, -1.3480224609375, -1.2138671875, -1.0797119140625, -0.945556640625, -0.8114013671875, -0.67724609375, -0.5430908203125, -0.408935546875, -0.2747802734375, -0.140625, -0.0064697265625, 0.127685546875, 0.2618408203125, 0.39599609375, 0.5301513671875, 0.664306640625, 0.7984619140625, 0.9326171875, 1.0667724609375, 1.200927734375, 1.3350830078125, 1.46923828125, 1.6033935546875, 1.737548828125, 1.8717041015625, 2.005859375, 2.1400146484375, 2.274169921875, 2.4083251953125, 2.54248046875, 2.6766357421875, 2.810791015625, 2.9449462890625, 3.0791015625, 3.2132568359375, 3.347412109375, 3.4815673828125, 3.61572265625, 3.7498779296875, 3.884033203125, 4.0181884765625, 4.15234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 13.0, 34.0, 83.0, 250.0, 362.0, 166.0, 54.0, 21.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-200.30690002441406, -194.11257934570312, -187.9182586669922, -181.72393798828125, -175.5296173095703, -169.33529663085938, -163.1409912109375, -156.9466552734375, -150.75234985351562, -144.5580291748047, -138.36370849609375, -132.1693878173828, -125.97506713867188, -119.78074645996094, -113.58643341064453, -107.3921127319336, -101.19778442382812, -95.00346374511719, -88.80914306640625, -82.61482238769531, -76.42050170898438, -70.22618103027344, -64.03186798095703, -57.837547302246094, -51.643226623535156, -45.44890594482422, -39.25458526611328, -33.06026840209961, -26.865947723388672, -20.671627044677734, -14.477310180664062, -8.282989501953125, -2.08868408203125, 4.105635643005371, 10.299955368041992, 16.494274139404297, 22.688594818115234, 28.882915496826172, 35.077232360839844, 41.27155303955078, 47.46587371826172, 53.660194396972656, 59.854515075683594, 66.048828125, 72.24314880371094, 78.43746948242188, 84.63179016113281, 90.82611083984375, 97.02043151855469, 103.21475219726562, 109.40907287597656, 115.6033935546875, 121.79771423339844, 127.99203491210938, 134.18634033203125, 140.38067626953125, 146.57498168945312, 152.76930236816406, 158.963623046875, 165.15794372558594, 171.35226440429688, 177.5465850830078, 183.74090576171875, 189.93521118164062, 196.12954711914062]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 8.0, 6.0, 10.0, 7.0, 13.0, 13.0, 10.0, 11.0, 19.0, 19.0, 20.0, 26.0, 24.0, 26.0, 35.0, 21.0, 44.0, 44.0, 51.0, 54.0, 47.0, 53.0, 43.0, 35.0, 44.0, 37.0, 33.0, 21.0, 36.0, 32.0, 18.0, 22.0, 24.0, 12.0, 13.0, 8.0, 10.0, 9.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-57.63092041015625, -55.8527717590332, -54.07462692260742, -52.296478271484375, -50.51832962036133, -48.74018096923828, -46.9620361328125, -45.18388748168945, -43.405738830566406, -41.62759017944336, -39.84944534301758, -38.07129669189453, -36.293148040771484, -34.51499938964844, -32.736854553222656, -30.95870590209961, -29.180559158325195, -27.40241241455078, -25.624263763427734, -23.84611701965332, -22.067968368530273, -20.28982162475586, -18.511672973632812, -16.7335262298584, -14.955378532409668, -13.177230834960938, -11.399083137512207, -9.620935440063477, -7.842788219451904, -6.064640998840332, -4.286493301391602, -2.508345603942871, -0.7301979064941406, 1.0479496717453003, 2.826097249984741, 4.604244709014893, 6.382392406463623, 8.160539627075195, 9.938687324523926, 11.716835021972656, 13.494982719421387, 15.273130416870117, 17.05127716064453, 18.829425811767578, 20.607572555541992, 22.385719299316406, 24.163867950439453, 25.9420166015625, 27.720163345336914, 29.498310089111328, 31.276458740234375, 33.05460739135742, 34.8327522277832, 36.61090087890625, 38.3890495300293, 40.167198181152344, 41.945343017578125, 43.72349166870117, 45.50163650512695, 47.27978515625, 49.05793380737305, 50.836082458496094, 52.614227294921875, 54.39237594604492, 56.17052459716797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 9.0, 7.0, 11.0, 5.0, 9.0, 13.0, 12.0, 36.0, 53.0, 76.0, 121.0, 192.0, 285.0, 397.0, 677.0, 1142.0, 2128.0, 3796.0, 7970.0, 18394.0, 58882.0, 329741.0, 2413627.0, 1148182.0, 148708.0, 34141.0, 12719.0, 5903.0, 2937.0, 1662.0, 911.0, 538.0, 354.0, 206.0, 134.0, 109.0, 77.0, 47.0, 21.0, 19.0, 13.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.578125, -4.429443359375, -4.28076171875, -4.132080078125, -3.9833984375, -3.834716796875, -3.68603515625, -3.537353515625, -3.388671875, -3.239990234375, -3.09130859375, -2.942626953125, -2.7939453125, -2.645263671875, -2.49658203125, -2.347900390625, -2.19921875, -2.050537109375, -1.90185546875, -1.753173828125, -1.6044921875, -1.455810546875, -1.30712890625, -1.158447265625, -1.009765625, -0.861083984375, -0.71240234375, -0.563720703125, -0.4150390625, -0.266357421875, -0.11767578125, 0.031005859375, 0.1796875, 0.328369140625, 0.47705078125, 0.625732421875, 0.7744140625, 0.923095703125, 1.07177734375, 1.220458984375, 1.369140625, 1.517822265625, 1.66650390625, 1.815185546875, 1.9638671875, 2.112548828125, 2.26123046875, 2.409912109375, 2.55859375, 2.707275390625, 2.85595703125, 3.004638671875, 3.1533203125, 3.302001953125, 3.45068359375, 3.599365234375, 3.748046875, 3.896728515625, 4.04541015625, 4.194091796875, 4.3427734375, 4.491455078125, 4.64013671875, 4.788818359375, 4.9375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 12.0, 8.0, 15.0, 20.0, 38.0, 45.0, 39.0, 39.0, 41.0, 46.0, 60.0, 61.0, 60.0, 54.0, 59.0, 64.0, 51.0, 57.0, 35.0, 46.0, 34.0, 23.0, 18.0, 19.0, 18.0, 4.0, 8.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.26953125, -3.12109375, -2.97265625, -2.82421875, -2.67578125, -2.52734375, -2.37890625, -2.23046875, -2.08203125, -1.93359375, -1.78515625, -1.63671875, -1.48828125, -1.33984375, -1.19140625, -1.04296875, -0.89453125, -0.74609375, -0.59765625, -0.44921875, -0.30078125, -0.15234375, -0.00390625, 0.14453125, 0.29296875, 0.44140625, 0.58984375, 0.73828125, 0.88671875, 1.03515625, 1.18359375, 1.33203125, 1.48046875, 1.62890625, 1.77734375, 1.92578125, 2.07421875, 2.22265625, 2.37109375, 2.51953125, 2.66796875, 2.81640625, 2.96484375, 3.11328125, 3.26171875, 3.41015625, 3.55859375, 3.70703125, 3.85546875, 4.00390625, 4.15234375, 4.30078125, 4.44921875, 4.59765625, 4.74609375, 4.89453125, 5.04296875, 5.19140625, 5.33984375, 5.48828125, 5.63671875, 5.78515625, 5.93359375, 6.08203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 19.0, 23.0, 29.0, 40.0, 68.0, 101.0, 159.0, 262.0, 485.0, 890.0, 1756.0, 3827.0, 9148.0, 27427.0, 117659.0, 2225243.0, 1667582.0, 99855.0, 24875.0, 8317.0, 3246.0, 1529.0, 723.0, 398.0, 218.0, 113.0, 76.0, 49.0, 29.0, 31.0, 17.0, 16.0, 5.0, 7.0, 11.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62445068359375, -7.3699951171875, -7.11553955078125, -6.861083984375, -6.60662841796875, -6.3521728515625, -6.09771728515625, -5.84326171875, -5.58880615234375, -5.3343505859375, -5.07989501953125, -4.825439453125, -4.57098388671875, -4.3165283203125, -4.06207275390625, -3.8076171875, -3.55316162109375, -3.2987060546875, -3.04425048828125, -2.789794921875, -2.53533935546875, -2.2808837890625, -2.02642822265625, -1.77197265625, -1.51751708984375, -1.2630615234375, -1.00860595703125, -0.754150390625, -0.49969482421875, -0.2452392578125, 0.00921630859375, 0.263671875, 0.51812744140625, 0.7725830078125, 1.02703857421875, 1.281494140625, 1.53594970703125, 1.7904052734375, 2.04486083984375, 2.29931640625, 2.55377197265625, 2.8082275390625, 3.06268310546875, 3.317138671875, 3.57159423828125, 3.8260498046875, 4.08050537109375, 4.3349609375, 4.58941650390625, 4.8438720703125, 5.09832763671875, 5.352783203125, 5.60723876953125, 5.8616943359375, 6.11614990234375, 6.37060546875, 6.62506103515625, 6.8795166015625, 7.13397216796875, 7.388427734375, 7.64288330078125, 7.8973388671875, 8.15179443359375, 8.40625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 10.0, 15.0, 18.0, 24.0, 48.0, 57.0, 91.0, 125.0, 278.0, 583.0, 984.0, 871.0, 411.0, 200.0, 106.0, 60.0, 37.0, 37.0, 22.0, 16.0, 9.0, 15.0, 8.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.7734375, -13.43603515625, -13.0986328125, -12.76123046875, -12.423828125, -12.08642578125, -11.7490234375, -11.41162109375, -11.07421875, -10.73681640625, -10.3994140625, -10.06201171875, -9.724609375, -9.38720703125, -9.0498046875, -8.71240234375, -8.375, -8.03759765625, -7.7001953125, -7.36279296875, -7.025390625, -6.68798828125, -6.3505859375, -6.01318359375, -5.67578125, -5.33837890625, -5.0009765625, -4.66357421875, -4.326171875, -3.98876953125, -3.6513671875, -3.31396484375, -2.9765625, -2.63916015625, -2.3017578125, -1.96435546875, -1.626953125, -1.28955078125, -0.9521484375, -0.61474609375, -0.27734375, 0.06005859375, 0.3974609375, 0.73486328125, 1.072265625, 1.40966796875, 1.7470703125, 2.08447265625, 2.421875, 2.75927734375, 3.0966796875, 3.43408203125, 3.771484375, 4.10888671875, 4.4462890625, 4.78369140625, 5.12109375, 5.45849609375, 5.7958984375, 6.13330078125, 6.470703125, 6.80810546875, 7.1455078125, 7.48291015625, 7.8203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 12.0, 31.0, 102.0, 258.0, 297.0, 184.0, 64.0, 16.0, 12.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.27273559570312, -101.88432312011719, -97.49591827392578, -93.10751342773438, -88.71910095214844, -84.3306884765625, -79.9422836303711, -75.55387878417969, -71.16546630859375, -66.77705383300781, -62.388648986816406, -58.000240325927734, -53.61183166503906, -49.22342300415039, -44.83501434326172, -40.44660568237305, -36.058197021484375, -31.669788360595703, -27.28137969970703, -22.89297103881836, -18.504562377929688, -14.116153717041016, -9.727745056152344, -5.339336395263672, -0.950927734375, 3.437480926513672, 7.825889587402344, 12.214298248291016, 16.602706909179688, 20.99111557006836, 25.37952423095703, 29.767932891845703, 34.15635681152344, 38.54476547241211, 42.93317413330078, 47.32158279418945, 51.709991455078125, 56.0984001159668, 60.48680877685547, 64.87521362304688, 69.26362609863281, 73.65203857421875, 78.04044342041016, 82.42884826660156, 86.8172607421875, 91.20567321777344, 95.59407806396484, 99.98248291015625, 104.37089538574219, 108.75930786132812, 113.14771270751953, 117.53611755371094, 121.92453002929688, 126.31294250488281, 130.70135498046875, 135.08975219726562, 139.47816467285156, 143.8665771484375, 148.25497436523438, 152.6433868408203, 157.03179931640625, 161.4202117919922, 165.80862426757812, 170.197021484375, 174.58543395996094]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 16.0, 13.0, 9.0, 7.0, 15.0, 27.0, 24.0, 22.0, 41.0, 38.0, 32.0, 41.0, 35.0, 50.0, 49.0, 59.0, 56.0, 52.0, 48.0, 47.0, 48.0, 38.0, 45.0, 21.0, 37.0, 24.0, 17.0, 9.0, 16.0, 3.0, 15.0, 13.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.043025970458984, -42.64542007446289, -41.24781799316406, -39.85021209716797, -38.452606201171875, -37.05500411987305, -35.65739822387695, -34.259796142578125, -32.86219024658203, -31.46458625793457, -30.06698226928711, -28.669376373291016, -27.271772384643555, -25.874168395996094, -24.4765625, -23.07895851135254, -21.681354522705078, -20.283750534057617, -18.886146545410156, -17.488540649414062, -16.0909366607666, -14.69333267211914, -13.295727729797363, -11.898122787475586, -10.500518798828125, -9.102914810180664, -7.705309867858887, -6.307705402374268, -4.910100936889648, -3.5124964714050293, -2.11489200592041, -0.7172870635986328, 0.6803131103515625, 2.0779175758361816, 3.475522041320801, 4.87312650680542, 6.270730972290039, 7.668335437774658, 9.065939903259277, 10.463544845581055, 11.861148834228516, 13.258752822875977, 14.656357765197754, 16.05396270751953, 17.451566696166992, 18.849170684814453, 20.246776580810547, 21.644380569458008, 23.04198455810547, 24.43958854675293, 25.83719253540039, 27.234798431396484, 28.632402420043945, 30.030006408691406, 31.4276123046875, 32.825218200683594, 34.22282028198242, 35.620426177978516, 37.018028259277344, 38.41563415527344, 39.81324005126953, 41.21084213256836, 42.60844802856445, 44.00605010986328, 45.403656005859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 7.0, 14.0, 16.0, 20.0, 25.0, 26.0, 49.0, 70.0, 97.0, 170.0, 266.0, 482.0, 975.0, 1803.0, 4049.0, 9232.0, 23951.0, 65819.0, 185850.0, 404627.0, 222924.0, 79324.0, 28678.0, 11078.0, 4576.0, 2007.0, 1034.0, 525.0, 285.0, 179.0, 115.0, 69.0, 65.0, 37.0, 22.0, 21.0, 10.0, 11.0, 8.0, 6.0, 12.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71875, -7.4578857421875, -7.197021484375, -6.9361572265625, -6.67529296875, -6.4144287109375, -6.153564453125, -5.8927001953125, -5.6318359375, -5.3709716796875, -5.110107421875, -4.8492431640625, -4.58837890625, -4.3275146484375, -4.066650390625, -3.8057861328125, -3.544921875, -3.2840576171875, -3.023193359375, -2.7623291015625, -2.50146484375, -2.2406005859375, -1.979736328125, -1.7188720703125, -1.4580078125, -1.1971435546875, -0.936279296875, -0.6754150390625, -0.41455078125, -0.1536865234375, 0.107177734375, 0.3680419921875, 0.62890625, 0.8897705078125, 1.150634765625, 1.4114990234375, 1.67236328125, 1.9332275390625, 2.194091796875, 2.4549560546875, 2.7158203125, 2.9766845703125, 3.237548828125, 3.4984130859375, 3.75927734375, 4.0201416015625, 4.281005859375, 4.5418701171875, 4.802734375, 5.0635986328125, 5.324462890625, 5.5853271484375, 5.84619140625, 6.1070556640625, 6.367919921875, 6.6287841796875, 6.8896484375, 7.1505126953125, 7.411376953125, 7.6722412109375, 7.93310546875, 8.1939697265625, 8.454833984375, 8.7156982421875, 8.9765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 9.0, 10.0, 21.0, 27.0, 22.0, 39.0, 36.0, 49.0, 60.0, 78.0, 62.0, 56.0, 61.0, 65.0, 64.0, 58.0, 62.0, 43.0, 37.0, 23.0, 28.0, 21.0, 20.0, 11.0, 11.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.71368408203125, -3.5601806640625, -3.40667724609375, -3.253173828125, -3.09967041015625, -2.9461669921875, -2.79266357421875, -2.63916015625, -2.48565673828125, -2.3321533203125, -2.17864990234375, -2.025146484375, -1.87164306640625, -1.7181396484375, -1.56463623046875, -1.4111328125, -1.25762939453125, -1.1041259765625, -0.95062255859375, -0.797119140625, -0.64361572265625, -0.4901123046875, -0.33660888671875, -0.18310546875, -0.02960205078125, 0.1239013671875, 0.27740478515625, 0.430908203125, 0.58441162109375, 0.7379150390625, 0.89141845703125, 1.044921875, 1.19842529296875, 1.3519287109375, 1.50543212890625, 1.658935546875, 1.81243896484375, 1.9659423828125, 2.11944580078125, 2.27294921875, 2.42645263671875, 2.5799560546875, 2.73345947265625, 2.886962890625, 3.04046630859375, 3.1939697265625, 3.34747314453125, 3.5009765625, 3.65447998046875, 3.8079833984375, 3.96148681640625, 4.114990234375, 4.26849365234375, 4.4219970703125, 4.57550048828125, 4.72900390625, 4.88250732421875, 5.0360107421875, 5.18951416015625, 5.343017578125, 5.49652099609375, 5.6500244140625, 5.80352783203125, 5.95703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 14.0, 13.0, 17.0, 23.0, 34.0, 53.0, 80.0, 95.0, 146.0, 188.0, 246.0, 322.0, 479.0, 744.0, 1230.0, 2182.0, 4448.0, 11747.0, 45063.0, 228653.0, 606220.0, 107417.0, 23808.0, 7355.0, 3126.0, 1712.0, 1008.0, 661.0, 409.0, 266.0, 225.0, 145.0, 122.0, 73.0, 52.0, 49.0, 29.0, 23.0, 20.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.3671875, -9.035888671875, -8.70458984375, -8.373291015625, -8.0419921875, -7.710693359375, -7.37939453125, -7.048095703125, -6.716796875, -6.385498046875, -6.05419921875, -5.722900390625, -5.3916015625, -5.060302734375, -4.72900390625, -4.397705078125, -4.06640625, -3.735107421875, -3.40380859375, -3.072509765625, -2.7412109375, -2.409912109375, -2.07861328125, -1.747314453125, -1.416015625, -1.084716796875, -0.75341796875, -0.422119140625, -0.0908203125, 0.240478515625, 0.57177734375, 0.903076171875, 1.234375, 1.565673828125, 1.89697265625, 2.228271484375, 2.5595703125, 2.890869140625, 3.22216796875, 3.553466796875, 3.884765625, 4.216064453125, 4.54736328125, 4.878662109375, 5.2099609375, 5.541259765625, 5.87255859375, 6.203857421875, 6.53515625, 6.866455078125, 7.19775390625, 7.529052734375, 7.8603515625, 8.191650390625, 8.52294921875, 8.854248046875, 9.185546875, 9.516845703125, 9.84814453125, 10.179443359375, 10.5107421875, 10.842041015625, 11.17333984375, 11.504638671875, 11.8359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 6.0, 10.0, 6.0, 11.0, 19.0, 11.0, 9.0, 21.0, 17.0, 21.0, 21.0, 23.0, 28.0, 33.0, 33.0, 30.0, 34.0, 33.0, 32.0, 34.0, 32.0, 39.0, 47.0, 34.0, 31.0, 38.0, 34.0, 39.0, 27.0, 33.0, 30.0, 25.0, 30.0, 16.0, 17.0, 8.0, 13.0, 11.0, 11.0, 7.0, 7.0, 3.0, 7.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.6171875, -12.2425537109375, -11.867919921875, -11.4932861328125, -11.11865234375, -10.7440185546875, -10.369384765625, -9.9947509765625, -9.6201171875, -9.2454833984375, -8.870849609375, -8.4962158203125, -8.12158203125, -7.7469482421875, -7.372314453125, -6.9976806640625, -6.623046875, -6.2484130859375, -5.873779296875, -5.4991455078125, -5.12451171875, -4.7498779296875, -4.375244140625, -4.0006103515625, -3.6259765625, -3.2513427734375, -2.876708984375, -2.5020751953125, -2.12744140625, -1.7528076171875, -1.378173828125, -1.0035400390625, -0.62890625, -0.2542724609375, 0.120361328125, 0.4949951171875, 0.86962890625, 1.2442626953125, 1.618896484375, 1.9935302734375, 2.3681640625, 2.7427978515625, 3.117431640625, 3.4920654296875, 3.86669921875, 4.2413330078125, 4.615966796875, 4.9906005859375, 5.365234375, 5.7398681640625, 6.114501953125, 6.4891357421875, 6.86376953125, 7.2384033203125, 7.613037109375, 7.9876708984375, 8.3623046875, 8.7369384765625, 9.111572265625, 9.4862060546875, 9.86083984375, 10.2354736328125, 10.610107421875, 10.9847412109375, 11.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 19.0, 15.0, 36.0, 47.0, 44.0, 71.0, 129.0, 226.0, 380.0, 806.0, 2167.0, 8019.0, 57290.0, 807187.0, 152048.0, 14558.0, 3094.0, 1099.0, 506.0, 261.0, 183.0, 113.0, 71.0, 36.0, 43.0, 21.0, 20.0, 12.0, 3.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.51171875, -5.352783203125, -5.19384765625, -5.034912109375, -4.8759765625, -4.717041015625, -4.55810546875, -4.399169921875, -4.240234375, -4.081298828125, -3.92236328125, -3.763427734375, -3.6044921875, -3.445556640625, -3.28662109375, -3.127685546875, -2.96875, -2.809814453125, -2.65087890625, -2.491943359375, -2.3330078125, -2.174072265625, -2.01513671875, -1.856201171875, -1.697265625, -1.538330078125, -1.37939453125, -1.220458984375, -1.0615234375, -0.902587890625, -0.74365234375, -0.584716796875, -0.42578125, -0.266845703125, -0.10791015625, 0.051025390625, 0.2099609375, 0.368896484375, 0.52783203125, 0.686767578125, 0.845703125, 1.004638671875, 1.16357421875, 1.322509765625, 1.4814453125, 1.640380859375, 1.79931640625, 1.958251953125, 2.1171875, 2.276123046875, 2.43505859375, 2.593994140625, 2.7529296875, 2.911865234375, 3.07080078125, 3.229736328125, 3.388671875, 3.547607421875, 3.70654296875, 3.865478515625, 4.0244140625, 4.183349609375, 4.34228515625, 4.501220703125, 4.66015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 12.0, 20.0, 23.0, 29.0, 40.0, 46.0, 48.0, 69.0, 95.0, 100.0, 83.0, 63.0, 62.0, 44.0, 49.0, 32.0, 28.0, 16.0, 16.0, 7.0, 11.0, 12.0, 10.0, 6.0, 11.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.0007886886596679688, -0.0007663518190383911, -0.0007440149784088135, -0.0007216781377792358, -0.0006993412971496582, -0.0006770044565200806, -0.0006546676158905029, -0.0006323307752609253, -0.0006099939346313477, -0.00058765709400177, -0.0005653202533721924, -0.0005429834127426147, -0.0005206465721130371, -0.0004983097314834595, -0.00047597289085388184, -0.0004536360502243042, -0.00043129920959472656, -0.0004089623689651489, -0.0003866255283355713, -0.00036428868770599365, -0.000341951847076416, -0.0003196150064468384, -0.00029727816581726074, -0.0002749413251876831, -0.00025260448455810547, -0.00023026764392852783, -0.0002079308032989502, -0.00018559396266937256, -0.00016325712203979492, -0.00014092028141021729, -0.00011858344078063965, -9.624660015106201e-05, -7.390975952148438e-05, -5.157291889190674e-05, -2.92360782623291e-05, -6.899237632751465e-06, 1.5437602996826172e-05, 3.777444362640381e-05, 6.0111284255981445e-05, 8.244812488555908e-05, 0.00010478496551513672, 0.00012712180614471436, 0.000149458646774292, 0.00017179548740386963, 0.00019413232803344727, 0.0002164691686630249, 0.00023880600929260254, 0.0002611428499221802, 0.0002834796905517578, 0.00030581653118133545, 0.0003281533718109131, 0.0003504902124404907, 0.00037282705307006836, 0.000395163893699646, 0.00041750073432922363, 0.00043983757495880127, 0.0004621744155883789, 0.00048451125621795654, 0.0005068480968475342, 0.0005291849374771118, 0.0005515217781066895, 0.0005738586187362671, 0.0005961954593658447, 0.0006185322999954224, 0.000640869140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 11.0, 19.0, 28.0, 53.0, 72.0, 189.0, 376.0, 822.0, 2901.0, 18373.0, 704497.0, 304702.0, 12549.0, 2382.0, 827.0, 346.0, 158.0, 90.0, 59.0, 26.0, 20.0, 19.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.7017822265625, -6.477783203125, -6.2537841796875, -6.02978515625, -5.8057861328125, -5.581787109375, -5.3577880859375, -5.1337890625, -4.9097900390625, -4.685791015625, -4.4617919921875, -4.23779296875, -4.0137939453125, -3.789794921875, -3.5657958984375, -3.341796875, -3.1177978515625, -2.893798828125, -2.6697998046875, -2.44580078125, -2.2218017578125, -1.997802734375, -1.7738037109375, -1.5498046875, -1.3258056640625, -1.101806640625, -0.8778076171875, -0.65380859375, -0.4298095703125, -0.205810546875, 0.0181884765625, 0.2421875, 0.4661865234375, 0.690185546875, 0.9141845703125, 1.13818359375, 1.3621826171875, 1.586181640625, 1.8101806640625, 2.0341796875, 2.2581787109375, 2.482177734375, 2.7061767578125, 2.93017578125, 3.1541748046875, 3.378173828125, 3.6021728515625, 3.826171875, 4.0501708984375, 4.274169921875, 4.4981689453125, 4.72216796875, 4.9461669921875, 5.170166015625, 5.3941650390625, 5.6181640625, 5.8421630859375, 6.066162109375, 6.2901611328125, 6.51416015625, 6.7381591796875, 6.962158203125, 7.1861572265625, 7.41015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 11.0, 4.0, 3.0, 8.0, 11.0, 15.0, 23.0, 28.0, 41.0, 46.0, 58.0, 69.0, 100.0, 124.0, 97.0, 67.0, 64.0, 48.0, 36.0, 25.0, 21.0, 24.0, 21.0, 12.0, 15.0, 7.0, 9.0, 6.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.2427978515625, -3.110595703125, -2.9783935546875, -2.84619140625, -2.7139892578125, -2.581787109375, -2.4495849609375, -2.3173828125, -2.1851806640625, -2.052978515625, -1.9207763671875, -1.78857421875, -1.6563720703125, -1.524169921875, -1.3919677734375, -1.259765625, -1.1275634765625, -0.995361328125, -0.8631591796875, -0.73095703125, -0.5987548828125, -0.466552734375, -0.3343505859375, -0.2021484375, -0.0699462890625, 0.062255859375, 0.1944580078125, 0.32666015625, 0.4588623046875, 0.591064453125, 0.7232666015625, 0.85546875, 0.9876708984375, 1.119873046875, 1.2520751953125, 1.38427734375, 1.5164794921875, 1.648681640625, 1.7808837890625, 1.9130859375, 2.0452880859375, 2.177490234375, 2.3096923828125, 2.44189453125, 2.5740966796875, 2.706298828125, 2.8385009765625, 2.970703125, 3.1029052734375, 3.235107421875, 3.3673095703125, 3.49951171875, 3.6317138671875, 3.763916015625, 3.8961181640625, 4.0283203125, 4.1605224609375, 4.292724609375, 4.4249267578125, 4.55712890625, 4.6893310546875, 4.821533203125, 4.9537353515625, 5.0859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 18.0, 40.0, 93.0, 215.0, 309.0, 172.0, 76.0, 34.0, 18.0, 6.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.42596435546875, -160.3578338623047, -156.2897186279297, -152.22158813476562, -148.15347290039062, -144.08534240722656, -140.0172119140625, -135.9490966796875, -131.88096618652344, -127.8128433227539, -123.74472045898438, -119.67658996582031, -115.60846710205078, -111.54034423828125, -107.47221374511719, -103.40409088134766, -99.33596801757812, -95.2678451538086, -91.19972229003906, -87.131591796875, -83.06346893310547, -78.99534606933594, -74.92721557617188, -70.85909271240234, -66.79096984863281, -62.72284698486328, -58.654720306396484, -54.58659362792969, -50.518470764160156, -46.450347900390625, -42.38222122192383, -38.31409454345703, -34.24598693847656, -30.1778621673584, -26.109737396240234, -22.04161262512207, -17.973487854003906, -13.905363082885742, -9.837238311767578, -5.769113540649414, -1.70098876953125, 2.367136001586914, 6.435260772705078, 10.503385543823242, 14.571510314941406, 18.63963508605957, 22.707759857177734, 26.7758846282959, 30.844009399414062, 34.912132263183594, 38.98025894165039, 43.04838562011719, 47.11650848388672, 51.18463134765625, 55.25275802612305, 59.320884704589844, 63.389007568359375, 67.4571304321289, 71.52525329589844, 75.5933837890625, 79.66150665283203, 83.72962951660156, 87.79776000976562, 91.86588287353516, 95.93400573730469]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 10.0, 11.0, 13.0, 18.0, 17.0, 20.0, 14.0, 21.0, 27.0, 23.0, 34.0, 32.0, 33.0, 47.0, 41.0, 52.0, 53.0, 57.0, 80.0, 49.0, 40.0, 41.0, 33.0, 33.0, 28.0, 25.0, 20.0, 24.0, 18.0, 16.0, 14.0, 9.0, 6.0, 2.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.095027923583984, -49.467533111572266, -47.84003829956055, -46.21254348754883, -44.58504867553711, -42.957550048828125, -41.330055236816406, -39.70256042480469, -38.07506561279297, -36.44757080078125, -34.82007598876953, -33.19258117675781, -31.56508445739746, -29.937589645385742, -28.310094833374023, -26.682598114013672, -25.055105209350586, -23.427610397338867, -21.80011558532715, -20.172618865966797, -18.545124053955078, -16.91762924194336, -15.29013442993164, -13.662638664245605, -12.035143852233887, -10.407649040222168, -8.780153274536133, -7.152658462524414, -5.525163173675537, -3.89766788482666, -2.2701730728149414, -0.6426773071289062, 0.9848175048828125, 2.6123127937316895, 4.239808082580566, 5.867302894592285, 7.494798183441162, 9.122293472290039, 10.749788284301758, 12.377284049987793, 14.004778861999512, 15.63227367401123, 17.259769439697266, 18.887264251708984, 20.514759063720703, 22.142253875732422, 23.76974868774414, 25.397245407104492, 27.02474021911621, 28.65223503112793, 30.27972984313965, 31.9072265625, 33.53472137451172, 35.16221618652344, 36.789710998535156, 38.417205810546875, 40.044700622558594, 41.67219543457031, 43.29969024658203, 44.92718505859375, 46.55467987060547, 48.18217468261719, 49.809669494628906, 51.43716812133789, 53.06466293334961]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 11.0, 21.0, 41.0, 30.0, 83.0, 88.0, 187.0, 399.0, 1000.0, 2802.0, 9391.0, 40388.0, 425983.0, 3365041.0, 302893.0, 33149.0, 8289.0, 2760.0, 973.0, 367.0, 167.0, 77.0, 41.0, 26.0, 19.0, 8.0, 9.0, 10.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.211181640625, -5.98486328125, -5.758544921875, -5.5322265625, -5.305908203125, -5.07958984375, -4.853271484375, -4.626953125, -4.400634765625, -4.17431640625, -3.947998046875, -3.7216796875, -3.495361328125, -3.26904296875, -3.042724609375, -2.81640625, -2.590087890625, -2.36376953125, -2.137451171875, -1.9111328125, -1.684814453125, -1.45849609375, -1.232177734375, -1.005859375, -0.779541015625, -0.55322265625, -0.326904296875, -0.1005859375, 0.125732421875, 0.35205078125, 0.578369140625, 0.8046875, 1.031005859375, 1.25732421875, 1.483642578125, 1.7099609375, 1.936279296875, 2.16259765625, 2.388916015625, 2.615234375, 2.841552734375, 3.06787109375, 3.294189453125, 3.5205078125, 3.746826171875, 3.97314453125, 4.199462890625, 4.42578125, 4.652099609375, 4.87841796875, 5.104736328125, 5.3310546875, 5.557373046875, 5.78369140625, 6.010009765625, 6.236328125, 6.462646484375, 6.68896484375, 6.915283203125, 7.1416015625, 7.367919921875, 7.59423828125, 7.820556640625, 8.046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 8.0, 12.0, 11.0, 14.0, 21.0, 22.0, 36.0, 36.0, 40.0, 55.0, 50.0, 59.0, 63.0, 63.0, 58.0, 71.0, 68.0, 58.0, 48.0, 47.0, 29.0, 30.0, 25.0, 17.0, 18.0, 12.0, 4.0, 9.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.795440673828125, -2.65533447265625, -2.515228271484375, -2.3751220703125, -2.235015869140625, -2.09490966796875, -1.954803466796875, -1.814697265625, -1.674591064453125, -1.53448486328125, -1.394378662109375, -1.2542724609375, -1.114166259765625, -0.97406005859375, -0.833953857421875, -0.69384765625, -0.553741455078125, -0.41363525390625, -0.273529052734375, -0.1334228515625, 0.006683349609375, 0.14678955078125, 0.286895751953125, 0.427001953125, 0.567108154296875, 0.70721435546875, 0.847320556640625, 0.9874267578125, 1.127532958984375, 1.26763916015625, 1.407745361328125, 1.5478515625, 1.687957763671875, 1.82806396484375, 1.968170166015625, 2.1082763671875, 2.248382568359375, 2.38848876953125, 2.528594970703125, 2.668701171875, 2.808807373046875, 2.94891357421875, 3.089019775390625, 3.2291259765625, 3.369232177734375, 3.50933837890625, 3.649444580078125, 3.78955078125, 3.929656982421875, 4.06976318359375, 4.209869384765625, 4.3499755859375, 4.490081787109375, 4.63018798828125, 4.770294189453125, 4.910400390625, 5.050506591796875, 5.19061279296875, 5.330718994140625, 5.4708251953125, 5.610931396484375, 5.75103759765625, 5.891143798828125, 6.03125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 4.0, 15.0, 21.0, 26.0, 34.0, 63.0, 77.0, 146.0, 280.0, 564.0, 1180.0, 2822.0, 8534.0, 29941.0, 156047.0, 3286413.0, 623352.0, 61675.0, 14704.0, 4743.0, 1819.0, 842.0, 420.0, 205.0, 115.0, 71.0, 50.0, 25.0, 23.0, 23.0, 6.0, 8.0, 13.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.4609375, -9.216796875, -8.97265625, -8.728515625, -8.484375, -8.240234375, -7.99609375, -7.751953125, -7.5078125, -7.263671875, -7.01953125, -6.775390625, -6.53125, -6.287109375, -6.04296875, -5.798828125, -5.5546875, -5.310546875, -5.06640625, -4.822265625, -4.578125, -4.333984375, -4.08984375, -3.845703125, -3.6015625, -3.357421875, -3.11328125, -2.869140625, -2.625, -2.380859375, -2.13671875, -1.892578125, -1.6484375, -1.404296875, -1.16015625, -0.916015625, -0.671875, -0.427734375, -0.18359375, 0.060546875, 0.3046875, 0.548828125, 0.79296875, 1.037109375, 1.28125, 1.525390625, 1.76953125, 2.013671875, 2.2578125, 2.501953125, 2.74609375, 2.990234375, 3.234375, 3.478515625, 3.72265625, 3.966796875, 4.2109375, 4.455078125, 4.69921875, 4.943359375, 5.1875, 5.431640625, 5.67578125, 5.919921875, 6.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 5.0, 12.0, 14.0, 21.0, 27.0, 31.0, 41.0, 48.0, 72.0, 116.0, 210.0, 409.0, 729.0, 962.0, 608.0, 278.0, 163.0, 79.0, 59.0, 33.0, 33.0, 24.0, 20.0, 19.0, 13.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.61004638671875, -6.3489990234375, -6.08795166015625, -5.826904296875, -5.56585693359375, -5.3048095703125, -5.04376220703125, -4.78271484375, -4.52166748046875, -4.2606201171875, -3.99957275390625, -3.738525390625, -3.47747802734375, -3.2164306640625, -2.95538330078125, -2.6943359375, -2.43328857421875, -2.1722412109375, -1.91119384765625, -1.650146484375, -1.38909912109375, -1.1280517578125, -0.86700439453125, -0.60595703125, -0.34490966796875, -0.0838623046875, 0.17718505859375, 0.438232421875, 0.69927978515625, 0.9603271484375, 1.22137451171875, 1.482421875, 1.74346923828125, 2.0045166015625, 2.26556396484375, 2.526611328125, 2.78765869140625, 3.0487060546875, 3.30975341796875, 3.57080078125, 3.83184814453125, 4.0928955078125, 4.35394287109375, 4.614990234375, 4.87603759765625, 5.1370849609375, 5.39813232421875, 5.6591796875, 5.92022705078125, 6.1812744140625, 6.44232177734375, 6.703369140625, 6.96441650390625, 7.2254638671875, 7.48651123046875, 7.74755859375, 8.00860595703125, 8.2696533203125, 8.53070068359375, 8.791748046875, 9.05279541015625, 9.3138427734375, 9.57489013671875, 9.8359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 14.0, 21.0, 70.0, 176.0, 298.0, 262.0, 95.0, 29.0, 15.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.84140014648438, -127.27920532226562, -123.71701049804688, -120.15481567382812, -116.59262084960938, -113.03042602539062, -109.46823120117188, -105.90603637695312, -102.34384155273438, -98.78164672851562, -95.21945190429688, -91.65725708007812, -88.09506225585938, -84.53286743164062, -80.97067260742188, -77.40847778320312, -73.84628295898438, -70.28408813476562, -66.72189331054688, -63.159698486328125, -59.597503662109375, -56.035308837890625, -52.473114013671875, -48.910919189453125, -45.348716735839844, -41.786521911621094, -38.224327087402344, -34.662132263183594, -31.099937438964844, -27.53774070739746, -23.97554588317871, -20.41335105895996, -16.851158142089844, -13.288963317871094, -9.726768493652344, -6.164572715759277, -2.6023778915405273, 0.9598178863525391, 4.522012710571289, 8.084207534790039, 11.646402359008789, 15.208597183227539, 18.77079200744629, 22.332988739013672, 25.895183563232422, 29.457378387451172, 33.01957321166992, 36.58176803588867, 40.14396286010742, 43.70615768432617, 47.26835250854492, 50.83054733276367, 54.39274215698242, 57.95494079589844, 61.51713562011719, 65.07933044433594, 68.64152526855469, 72.20372009277344, 75.76591491699219, 79.32810974121094, 82.89030456542969, 86.45249938964844, 90.01469421386719, 93.57688903808594, 97.13908386230469]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 5.0, 8.0, 8.0, 4.0, 9.0, 13.0, 19.0, 16.0, 18.0, 36.0, 31.0, 28.0, 37.0, 31.0, 35.0, 36.0, 39.0, 37.0, 33.0, 30.0, 36.0, 35.0, 60.0, 45.0, 37.0, 32.0, 31.0, 24.0, 39.0, 41.0, 23.0, 25.0, 11.0, 9.0, 9.0, 19.0, 3.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.71070098876953, -25.708580017089844, -24.706457138061523, -23.704334259033203, -22.702213287353516, -21.700092315673828, -20.697969436645508, -19.695846557617188, -18.6937255859375, -17.691604614257812, -16.689481735229492, -15.687359809875488, -14.685237884521484, -13.68311595916748, -12.680994033813477, -11.678872108459473, -10.676750183105469, -9.674628257751465, -8.672506332397461, -7.670384407043457, -6.668262481689453, -5.666140556335449, -4.664018630981445, -3.6618967056274414, -2.6597747802734375, -1.6576528549194336, -0.6555309295654297, 0.3465909957885742, 1.3487129211425781, 2.350834846496582, 3.352956771850586, 4.35507869720459, 5.357204437255859, 6.359326362609863, 7.361448287963867, 8.363570213317871, 9.365692138671875, 10.367814064025879, 11.369935989379883, 12.372057914733887, 13.37417984008789, 14.376301765441895, 15.378423690795898, 16.38054656982422, 17.382667541503906, 18.384788513183594, 19.386911392211914, 20.389034271240234, 21.391155242919922, 22.39327621459961, 23.39539909362793, 24.39752197265625, 25.399642944335938, 26.401763916015625, 27.403886795043945, 28.406009674072266, 29.408130645751953, 30.41025161743164, 31.41237449645996, 32.41449737548828, 33.41661834716797, 34.418739318847656, 35.420860290527344, 36.4229850769043, 37.425106048583984]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 13.0, 28.0, 43.0, 69.0, 96.0, 152.0, 194.0, 340.0, 513.0, 840.0, 1408.0, 2483.0, 4651.0, 9277.0, 19484.0, 44672.0, 108266.0, 265571.0, 329507.0, 149408.0, 60336.0, 25833.0, 11961.0, 5860.0, 3069.0, 1679.0, 1074.0, 621.0, 404.0, 216.0, 163.0, 98.0, 64.0, 37.0, 32.0, 18.0, 17.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.6160888671875, -5.423583984375, -5.2310791015625, -5.03857421875, -4.8460693359375, -4.653564453125, -4.4610595703125, -4.2685546875, -4.0760498046875, -3.883544921875, -3.6910400390625, -3.49853515625, -3.3060302734375, -3.113525390625, -2.9210205078125, -2.728515625, -2.5360107421875, -2.343505859375, -2.1510009765625, -1.95849609375, -1.7659912109375, -1.573486328125, -1.3809814453125, -1.1884765625, -0.9959716796875, -0.803466796875, -0.6109619140625, -0.41845703125, -0.2259521484375, -0.033447265625, 0.1590576171875, 0.3515625, 0.5440673828125, 0.736572265625, 0.9290771484375, 1.12158203125, 1.3140869140625, 1.506591796875, 1.6990966796875, 1.8916015625, 2.0841064453125, 2.276611328125, 2.4691162109375, 2.66162109375, 2.8541259765625, 3.046630859375, 3.2391357421875, 3.431640625, 3.6241455078125, 3.816650390625, 4.0091552734375, 4.20166015625, 4.3941650390625, 4.586669921875, 4.7791748046875, 4.9716796875, 5.1641845703125, 5.356689453125, 5.5491943359375, 5.74169921875, 5.9342041015625, 6.126708984375, 6.3192138671875, 6.51171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 9.0, 7.0, 9.0, 12.0, 9.0, 18.0, 24.0, 34.0, 25.0, 38.0, 39.0, 57.0, 57.0, 66.0, 81.0, 62.0, 66.0, 52.0, 54.0, 57.0, 58.0, 27.0, 37.0, 23.0, 27.0, 14.0, 8.0, 9.0, 10.0, 11.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.946319580078125, -2.80865478515625, -2.670989990234375, -2.5333251953125, -2.395660400390625, -2.25799560546875, -2.120330810546875, -1.982666015625, -1.845001220703125, -1.70733642578125, -1.569671630859375, -1.4320068359375, -1.294342041015625, -1.15667724609375, -1.019012451171875, -0.88134765625, -0.743682861328125, -0.60601806640625, -0.468353271484375, -0.3306884765625, -0.193023681640625, -0.05535888671875, 0.082305908203125, 0.219970703125, 0.357635498046875, 0.49530029296875, 0.632965087890625, 0.7706298828125, 0.908294677734375, 1.04595947265625, 1.183624267578125, 1.3212890625, 1.458953857421875, 1.59661865234375, 1.734283447265625, 1.8719482421875, 2.009613037109375, 2.14727783203125, 2.284942626953125, 2.422607421875, 2.560272216796875, 2.69793701171875, 2.835601806640625, 2.9732666015625, 3.110931396484375, 3.24859619140625, 3.386260986328125, 3.52392578125, 3.661590576171875, 3.79925537109375, 3.936920166015625, 4.0745849609375, 4.212249755859375, 4.34991455078125, 4.487579345703125, 4.625244140625, 4.762908935546875, 4.90057373046875, 5.038238525390625, 5.1759033203125, 5.313568115234375, 5.45123291015625, 5.588897705078125, 5.7265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 14.0, 11.0, 15.0, 15.0, 22.0, 39.0, 43.0, 78.0, 115.0, 155.0, 257.0, 427.0, 685.0, 1328.0, 3038.0, 9083.0, 45794.0, 376058.0, 543750.0, 51319.0, 9773.0, 3191.0, 1369.0, 739.0, 397.0, 247.0, 184.0, 108.0, 82.0, 56.0, 43.0, 28.0, 25.0, 11.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.5032958984375, -12.100341796875, -11.6973876953125, -11.29443359375, -10.8914794921875, -10.488525390625, -10.0855712890625, -9.6826171875, -9.2796630859375, -8.876708984375, -8.4737548828125, -8.07080078125, -7.6678466796875, -7.264892578125, -6.8619384765625, -6.458984375, -6.0560302734375, -5.653076171875, -5.2501220703125, -4.84716796875, -4.4442138671875, -4.041259765625, -3.6383056640625, -3.2353515625, -2.8323974609375, -2.429443359375, -2.0264892578125, -1.62353515625, -1.2205810546875, -0.817626953125, -0.4146728515625, -0.01171875, 0.3912353515625, 0.794189453125, 1.1971435546875, 1.60009765625, 2.0030517578125, 2.406005859375, 2.8089599609375, 3.2119140625, 3.6148681640625, 4.017822265625, 4.4207763671875, 4.82373046875, 5.2266845703125, 5.629638671875, 6.0325927734375, 6.435546875, 6.8385009765625, 7.241455078125, 7.6444091796875, 8.04736328125, 8.4503173828125, 8.853271484375, 9.2562255859375, 9.6591796875, 10.0621337890625, 10.465087890625, 10.8680419921875, 11.27099609375, 11.6739501953125, 12.076904296875, 12.4798583984375, 12.8828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 11.0, 10.0, 10.0, 17.0, 13.0, 13.0, 19.0, 27.0, 27.0, 40.0, 43.0, 45.0, 49.0, 35.0, 40.0, 57.0, 48.0, 52.0, 46.0, 47.0, 40.0, 50.0, 19.0, 37.0, 40.0, 21.0, 21.0, 20.0, 20.0, 9.0, 11.0, 7.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.9921875, -13.5985107421875, -13.204833984375, -12.8111572265625, -12.41748046875, -12.0238037109375, -11.630126953125, -11.2364501953125, -10.8427734375, -10.4490966796875, -10.055419921875, -9.6617431640625, -9.26806640625, -8.8743896484375, -8.480712890625, -8.0870361328125, -7.693359375, -7.2996826171875, -6.906005859375, -6.5123291015625, -6.11865234375, -5.7249755859375, -5.331298828125, -4.9376220703125, -4.5439453125, -4.1502685546875, -3.756591796875, -3.3629150390625, -2.96923828125, -2.5755615234375, -2.181884765625, -1.7882080078125, -1.39453125, -1.0008544921875, -0.607177734375, -0.2135009765625, 0.18017578125, 0.5738525390625, 0.967529296875, 1.3612060546875, 1.7548828125, 2.1485595703125, 2.542236328125, 2.9359130859375, 3.32958984375, 3.7232666015625, 4.116943359375, 4.5106201171875, 4.904296875, 5.2979736328125, 5.691650390625, 6.0853271484375, 6.47900390625, 6.8726806640625, 7.266357421875, 7.6600341796875, 8.0537109375, 8.4473876953125, 8.841064453125, 9.2347412109375, 9.62841796875, 10.0220947265625, 10.415771484375, 10.8094482421875, 11.203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 11.0, 10.0, 13.0, 21.0, 17.0, 36.0, 48.0, 65.0, 108.0, 215.0, 423.0, 942.0, 2788.0, 12015.0, 85845.0, 744002.0, 175159.0, 20197.0, 4127.0, 1297.0, 558.0, 240.0, 142.0, 86.0, 49.0, 29.0, 30.0, 23.0, 10.0, 14.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.85546875, -3.74420166015625, -3.6329345703125, -3.52166748046875, -3.410400390625, -3.29913330078125, -3.1878662109375, -3.07659912109375, -2.96533203125, -2.85406494140625, -2.7427978515625, -2.63153076171875, -2.520263671875, -2.40899658203125, -2.2977294921875, -2.18646240234375, -2.0751953125, -1.96392822265625, -1.8526611328125, -1.74139404296875, -1.630126953125, -1.51885986328125, -1.4075927734375, -1.29632568359375, -1.18505859375, -1.07379150390625, -0.9625244140625, -0.85125732421875, -0.739990234375, -0.62872314453125, -0.5174560546875, -0.40618896484375, -0.294921875, -0.18365478515625, -0.0723876953125, 0.03887939453125, 0.150146484375, 0.26141357421875, 0.3726806640625, 0.48394775390625, 0.59521484375, 0.70648193359375, 0.8177490234375, 0.92901611328125, 1.040283203125, 1.15155029296875, 1.2628173828125, 1.37408447265625, 1.4853515625, 1.59661865234375, 1.7078857421875, 1.81915283203125, 1.930419921875, 2.04168701171875, 2.1529541015625, 2.26422119140625, 2.37548828125, 2.48675537109375, 2.5980224609375, 2.70928955078125, 2.820556640625, 2.93182373046875, 3.0430908203125, 3.15435791015625, 3.265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 10.0, 7.0, 18.0, 15.0, 18.0, 23.0, 26.0, 35.0, 39.0, 45.0, 60.0, 68.0, 64.0, 85.0, 69.0, 71.0, 70.0, 51.0, 38.0, 31.0, 30.0, 22.0, 15.0, 16.0, 11.0, 6.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006175041198730469, -0.0005973353981971741, -0.0005771666765213013, -0.0005569979548454285, -0.0005368292331695557, -0.0005166605114936829, -0.0004964917898178101, -0.00047632306814193726, -0.00045615434646606445, -0.00043598562479019165, -0.00041581690311431885, -0.00039564818143844604, -0.00037547945976257324, -0.00035531073808670044, -0.00033514201641082764, -0.00031497329473495483, -0.00029480457305908203, -0.00027463585138320923, -0.0002544671297073364, -0.00023429840803146362, -0.00021412968635559082, -0.00019396096467971802, -0.00017379224300384521, -0.0001536235213279724, -0.0001334547996520996, -0.0001132860779762268, -9.3117356300354e-05, -7.29486346244812e-05, -5.27799129486084e-05, -3.2611191272735596e-05, -1.2442469596862793e-05, 7.72625207901001e-06, 2.7894973754882812e-05, 4.8063695430755615e-05, 6.823241710662842e-05, 8.840113878250122e-05, 0.00010856986045837402, 0.00012873858213424683, 0.00014890730381011963, 0.00016907602548599243, 0.00018924474716186523, 0.00020941346883773804, 0.00022958219051361084, 0.00024975091218948364, 0.00026991963386535645, 0.00029008835554122925, 0.00031025707721710205, 0.00033042579889297485, 0.00035059452056884766, 0.00037076324224472046, 0.00039093196392059326, 0.00041110068559646606, 0.00043126940727233887, 0.00045143812894821167, 0.00047160685062408447, 0.0004917755722999573, 0.0005119442939758301, 0.0005321130156517029, 0.0005522817373275757, 0.0005724504590034485, 0.0005926191806793213, 0.0006127879023551941, 0.0006329566240310669, 0.0006531253457069397, 0.0006732940673828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 22.0, 40.0, 52.0, 96.0, 165.0, 324.0, 710.0, 1872.0, 6575.0, 42854.0, 708164.0, 260546.0, 20444.0, 4110.0, 1395.0, 534.0, 266.0, 162.0, 78.0, 53.0, 14.0, 31.0, 15.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.949951171875, -4.82568359375, -4.701416015625, -4.5771484375, -4.452880859375, -4.32861328125, -4.204345703125, -4.080078125, -3.955810546875, -3.83154296875, -3.707275390625, -3.5830078125, -3.458740234375, -3.33447265625, -3.210205078125, -3.0859375, -2.961669921875, -2.83740234375, -2.713134765625, -2.5888671875, -2.464599609375, -2.34033203125, -2.216064453125, -2.091796875, -1.967529296875, -1.84326171875, -1.718994140625, -1.5947265625, -1.470458984375, -1.34619140625, -1.221923828125, -1.09765625, -0.973388671875, -0.84912109375, -0.724853515625, -0.6005859375, -0.476318359375, -0.35205078125, -0.227783203125, -0.103515625, 0.020751953125, 0.14501953125, 0.269287109375, 0.3935546875, 0.517822265625, 0.64208984375, 0.766357421875, 0.890625, 1.014892578125, 1.13916015625, 1.263427734375, 1.3876953125, 1.511962890625, 1.63623046875, 1.760498046875, 1.884765625, 2.009033203125, 2.13330078125, 2.257568359375, 2.3818359375, 2.506103515625, 2.63037109375, 2.754638671875, 2.87890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 13.0, 12.0, 13.0, 22.0, 25.0, 17.0, 44.0, 53.0, 67.0, 76.0, 65.0, 70.0, 75.0, 72.0, 73.0, 57.0, 50.0, 33.0, 19.0, 22.0, 24.0, 26.0, 11.0, 8.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.5875244140625, -2.501220703125, -2.4149169921875, -2.32861328125, -2.2423095703125, -2.156005859375, -2.0697021484375, -1.9833984375, -1.8970947265625, -1.810791015625, -1.7244873046875, -1.63818359375, -1.5518798828125, -1.465576171875, -1.3792724609375, -1.29296875, -1.2066650390625, -1.120361328125, -1.0340576171875, -0.94775390625, -0.8614501953125, -0.775146484375, -0.6888427734375, -0.6025390625, -0.5162353515625, -0.429931640625, -0.3436279296875, -0.25732421875, -0.1710205078125, -0.084716796875, 0.0015869140625, 0.087890625, 0.1741943359375, 0.260498046875, 0.3468017578125, 0.43310546875, 0.5194091796875, 0.605712890625, 0.6920166015625, 0.7783203125, 0.8646240234375, 0.950927734375, 1.0372314453125, 1.12353515625, 1.2098388671875, 1.296142578125, 1.3824462890625, 1.46875, 1.5550537109375, 1.641357421875, 1.7276611328125, 1.81396484375, 1.9002685546875, 1.986572265625, 2.0728759765625, 2.1591796875, 2.2454833984375, 2.331787109375, 2.4180908203125, 2.50439453125, 2.5906982421875, 2.677001953125, 2.7633056640625, 2.849609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 27.0, 33.0, 67.0, 97.0, 189.0, 216.0, 141.0, 97.0, 52.0, 16.0, 16.0, 10.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.8323974609375, -93.44868469238281, -91.06497955322266, -88.68126678466797, -86.29756164550781, -83.91384887695312, -81.53013610839844, -79.14642333984375, -76.7627182006836, -74.3790054321289, -71.99530029296875, -69.61158752441406, -67.22787475585938, -64.84416961669922, -62.46045684814453, -60.07674789428711, -57.69303894042969, -55.309329986572266, -52.925621032714844, -50.541908264160156, -48.158199310302734, -45.77449035644531, -43.390777587890625, -41.0070686340332, -38.62335968017578, -36.23965072631836, -33.85594177246094, -31.47222900390625, -29.088520050048828, -26.704811096191406, -24.32110023498535, -21.937389373779297, -19.55368423461914, -17.16997528076172, -14.786264419555664, -12.402554512023926, -10.018844604492188, -7.635134696960449, -5.251424789428711, -2.8677139282226562, -0.4840049743652344, 1.899704933166504, 4.283414840698242, 6.6671247482299805, 9.050834655761719, 11.434544563293457, 13.818254470825195, 16.20196533203125, 18.585674285888672, 20.969383239746094, 23.35309410095215, 25.736804962158203, 28.120513916015625, 30.504222869873047, 32.88793182373047, 35.271644592285156, 37.65535354614258, 40.0390625, 42.42277526855469, 44.80648422241211, 47.19019317626953, 49.57390213012695, 51.957611083984375, 54.34132385253906, 56.725032806396484]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 10.0, 10.0, 8.0, 10.0, 12.0, 12.0, 16.0, 14.0, 23.0, 31.0, 34.0, 28.0, 28.0, 36.0, 46.0, 45.0, 74.0, 80.0, 77.0, 61.0, 57.0, 41.0, 36.0, 30.0, 36.0, 30.0, 24.0, 14.0, 9.0, 16.0, 10.0, 10.0, 7.0, 2.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.941307067871094, -39.22537612915039, -37.50944519042969, -35.79351043701172, -34.077579498291016, -32.36164855957031, -30.64571762084961, -28.929784774780273, -27.213851928710938, -25.497920989990234, -23.7819881439209, -22.066057205200195, -20.35012435913086, -18.634193420410156, -16.918262481689453, -15.202329635620117, -13.486398696899414, -11.770466804504395, -10.054534912109375, -8.338603973388672, -6.622671604156494, -4.906740188598633, -3.1908082962036133, -1.4748764038085938, 0.24105548858642578, 1.9569872617721558, 3.6729190349578857, 5.388850688934326, 7.104782581329346, 8.820713996887207, 10.536645889282227, 12.252577781677246, 13.968509674072266, 15.684441566467285, 17.400373458862305, 19.116304397583008, 20.832237243652344, 22.548168182373047, 24.26409912109375, 25.980031967163086, 27.695964813232422, 29.411895751953125, 31.12782859802246, 32.8437614440918, 34.5596923828125, 36.2756233215332, 37.991554260253906, 39.707489013671875, 41.42341613769531, 43.139347076416016, 44.85527801513672, 46.57121276855469, 48.28714370727539, 50.003074645996094, 51.7190055847168, 53.4349365234375, 55.15087127685547, 56.86680221557617, 58.582733154296875, 60.298667907714844, 62.01459884643555, 63.73052978515625, 65.44646453857422, 67.16239166259766, 68.87832641601562]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 23.0, 32.0, 54.0, 76.0, 131.0, 252.0, 562.0, 1283.0, 3990.0, 16042.0, 137193.0, 3246178.0, 739393.0, 37186.0, 7750.0, 2389.0, 900.0, 399.0, 186.0, 95.0, 50.0, 41.0, 22.0, 14.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.8057861328125, -8.572509765625, -8.3392333984375, -8.10595703125, -7.8726806640625, -7.639404296875, -7.4061279296875, -7.1728515625, -6.9395751953125, -6.706298828125, -6.4730224609375, -6.23974609375, -6.0064697265625, -5.773193359375, -5.5399169921875, -5.306640625, -5.0733642578125, -4.840087890625, -4.6068115234375, -4.37353515625, -4.1402587890625, -3.906982421875, -3.6737060546875, -3.4404296875, -3.2071533203125, -2.973876953125, -2.7406005859375, -2.50732421875, -2.2740478515625, -2.040771484375, -1.8074951171875, -1.57421875, -1.3409423828125, -1.107666015625, -0.8743896484375, -0.64111328125, -0.4078369140625, -0.174560546875, 0.0587158203125, 0.2919921875, 0.5252685546875, 0.758544921875, 0.9918212890625, 1.22509765625, 1.4583740234375, 1.691650390625, 1.9249267578125, 2.158203125, 2.3914794921875, 2.624755859375, 2.8580322265625, 3.09130859375, 3.3245849609375, 3.557861328125, 3.7911376953125, 4.0244140625, 4.2576904296875, 4.490966796875, 4.7242431640625, 4.95751953125, 5.1907958984375, 5.424072265625, 5.6573486328125, 5.890625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 8.0, 13.0, 9.0, 8.0, 27.0, 34.0, 28.0, 41.0, 35.0, 61.0, 82.0, 70.0, 79.0, 57.0, 77.0, 61.0, 60.0, 35.0, 31.0, 33.0, 37.0, 24.0, 25.0, 23.0, 8.0, 8.0, 5.0, 4.0, 3.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.030120849609375, -2.89422607421875, -2.758331298828125, -2.6224365234375, -2.486541748046875, -2.35064697265625, -2.214752197265625, -2.078857421875, -1.942962646484375, -1.80706787109375, -1.671173095703125, -1.5352783203125, -1.399383544921875, -1.26348876953125, -1.127593994140625, -0.99169921875, -0.855804443359375, -0.71990966796875, -0.584014892578125, -0.4481201171875, -0.312225341796875, -0.17633056640625, -0.040435791015625, 0.095458984375, 0.231353759765625, 0.36724853515625, 0.503143310546875, 0.6390380859375, 0.774932861328125, 0.91082763671875, 1.046722412109375, 1.1826171875, 1.318511962890625, 1.45440673828125, 1.590301513671875, 1.7261962890625, 1.862091064453125, 1.99798583984375, 2.133880615234375, 2.269775390625, 2.405670166015625, 2.54156494140625, 2.677459716796875, 2.8133544921875, 2.949249267578125, 3.08514404296875, 3.221038818359375, 3.35693359375, 3.492828369140625, 3.62872314453125, 3.764617919921875, 3.9005126953125, 4.036407470703125, 4.17230224609375, 4.308197021484375, 4.444091796875, 4.579986572265625, 4.71588134765625, 4.851776123046875, 4.9876708984375, 5.123565673828125, 5.25946044921875, 5.395355224609375, 5.53125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 4.0, 7.0, 18.0, 23.0, 50.0, 59.0, 108.0, 178.0, 335.0, 984.0, 3388.0, 15285.0, 141868.0, 3818038.0, 186903.0, 20206.0, 4357.0, 1292.0, 552.0, 269.0, 127.0, 68.0, 53.0, 21.0, 20.0, 20.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.46875, -9.15869140625, -8.8486328125, -8.53857421875, -8.228515625, -7.91845703125, -7.6083984375, -7.29833984375, -6.98828125, -6.67822265625, -6.3681640625, -6.05810546875, -5.748046875, -5.43798828125, -5.1279296875, -4.81787109375, -4.5078125, -4.19775390625, -3.8876953125, -3.57763671875, -3.267578125, -2.95751953125, -2.6474609375, -2.33740234375, -2.02734375, -1.71728515625, -1.4072265625, -1.09716796875, -0.787109375, -0.47705078125, -0.1669921875, 0.14306640625, 0.453125, 0.76318359375, 1.0732421875, 1.38330078125, 1.693359375, 2.00341796875, 2.3134765625, 2.62353515625, 2.93359375, 3.24365234375, 3.5537109375, 3.86376953125, 4.173828125, 4.48388671875, 4.7939453125, 5.10400390625, 5.4140625, 5.72412109375, 6.0341796875, 6.34423828125, 6.654296875, 6.96435546875, 7.2744140625, 7.58447265625, 7.89453125, 8.20458984375, 8.5146484375, 8.82470703125, 9.134765625, 9.44482421875, 9.7548828125, 10.06494140625, 10.375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 6.0, 15.0, 14.0, 28.0, 34.0, 50.0, 77.0, 177.0, 368.0, 811.0, 1154.0, 645.0, 267.0, 128.0, 79.0, 51.0, 49.0, 26.0, 26.0, 17.0, 9.0, 12.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.74591064453125, -6.4801025390625, -6.21429443359375, -5.948486328125, -5.68267822265625, -5.4168701171875, -5.15106201171875, -4.88525390625, -4.61944580078125, -4.3536376953125, -4.08782958984375, -3.822021484375, -3.55621337890625, -3.2904052734375, -3.02459716796875, -2.7587890625, -2.49298095703125, -2.2271728515625, -1.96136474609375, -1.695556640625, -1.42974853515625, -1.1639404296875, -0.89813232421875, -0.63232421875, -0.36651611328125, -0.1007080078125, 0.16510009765625, 0.430908203125, 0.69671630859375, 0.9625244140625, 1.22833251953125, 1.494140625, 1.75994873046875, 2.0257568359375, 2.29156494140625, 2.557373046875, 2.82318115234375, 3.0889892578125, 3.35479736328125, 3.62060546875, 3.88641357421875, 4.1522216796875, 4.41802978515625, 4.683837890625, 4.94964599609375, 5.2154541015625, 5.48126220703125, 5.7470703125, 6.01287841796875, 6.2786865234375, 6.54449462890625, 6.810302734375, 7.07611083984375, 7.3419189453125, 7.60772705078125, 7.87353515625, 8.13934326171875, 8.4051513671875, 8.67095947265625, 8.936767578125, 9.20257568359375, 9.4683837890625, 9.73419189453125, 10.0]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 18.0, 43.0, 236.0, 435.0, 187.0, 48.0, 21.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.50337982177734, -111.28587341308594, -107.06836700439453, -102.85086059570312, -98.63335418701172, -94.41584777832031, -90.19834899902344, -85.9808349609375, -81.76333618164062, -77.54582977294922, -73.32832336425781, -69.1108169555664, -64.893310546875, -60.675804138183594, -56.45830154418945, -52.24079513549805, -48.023284912109375, -43.80577850341797, -39.58827209472656, -35.370765686035156, -31.153261184692383, -26.935754776000977, -22.718250274658203, -18.500743865966797, -14.28323745727539, -10.065731048583984, -5.8482255935668945, -1.6307201385498047, 2.5867862701416016, 6.804292678833008, 11.021797180175781, 15.239303588867188, 19.456802368164062, 23.67430877685547, 27.891815185546875, 32.10932159423828, 36.32682800292969, 40.544334411621094, 44.761837005615234, 48.97934341430664, 53.19684982299805, 57.41435623168945, 61.63186264038086, 65.849365234375, 70.0668716430664, 74.28437805175781, 78.50188446044922, 82.71939086914062, 86.93689727783203, 91.15440368652344, 95.37191009521484, 99.58941650390625, 103.80692291259766, 108.02442932128906, 112.24192810058594, 116.45944213867188, 120.67694091796875, 124.89444732666016, 129.11195373535156, 133.32945251464844, 137.54696655273438, 141.76446533203125, 145.9819793701172, 150.19947814941406, 154.4169921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 5.0, 12.0, 8.0, 12.0, 18.0, 18.0, 23.0, 20.0, 32.0, 28.0, 35.0, 36.0, 36.0, 49.0, 50.0, 41.0, 57.0, 55.0, 50.0, 48.0, 54.0, 50.0, 42.0, 24.0, 30.0, 28.0, 32.0, 29.0, 15.0, 17.0, 8.0, 15.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.07742691040039, -29.08233642578125, -28.087244033813477, -27.092153549194336, -26.097061157226562, -25.101970672607422, -24.10688018798828, -23.11178970336914, -22.116697311401367, -21.121606826782227, -20.126514434814453, -19.131423950195312, -18.136333465576172, -17.1412410736084, -16.146150588989258, -15.1510591506958, -14.155967712402344, -13.160876274108887, -12.16578483581543, -11.170694351196289, -10.175602912902832, -9.180511474609375, -8.185420989990234, -7.190329551696777, -6.19523811340332, -5.200146675109863, -4.2050557136535645, -3.2099645137786865, -2.2148733139038086, -1.2197818756103516, -0.22469091415405273, 0.7704000473022461, 1.7654914855957031, 2.760582685470581, 3.755673885345459, 4.750764846801758, 5.745856285095215, 6.740947723388672, 7.736038684844971, 8.73112964630127, 9.726221084594727, 10.721312522888184, 11.71640396118164, 12.711494445800781, 13.706585884094238, 14.701677322387695, 15.696767807006836, 16.69186019897461, 17.68695068359375, 18.68204116821289, 19.677133560180664, 20.672224044799805, 21.667316436767578, 22.66240692138672, 23.65749740600586, 24.652587890625, 25.647680282592773, 26.642770767211914, 27.637863159179688, 28.632953643798828, 29.62804412841797, 30.623136520385742, 31.618227005004883, 32.613319396972656, 33.6084098815918]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 15.0, 35.0, 38.0, 75.0, 154.0, 255.0, 451.0, 844.0, 1967.0, 5257.0, 16404.0, 66648.0, 302156.0, 481431.0, 129521.0, 29593.0, 8268.0, 2897.0, 1201.0, 563.0, 331.0, 169.0, 92.0, 49.0, 32.0, 27.0, 18.0, 12.0, 13.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34375, -6.0582275390625, -5.772705078125, -5.4871826171875, -5.20166015625, -4.9161376953125, -4.630615234375, -4.3450927734375, -4.0595703125, -3.7740478515625, -3.488525390625, -3.2030029296875, -2.91748046875, -2.6319580078125, -2.346435546875, -2.0609130859375, -1.775390625, -1.4898681640625, -1.204345703125, -0.9188232421875, -0.63330078125, -0.3477783203125, -0.062255859375, 0.2232666015625, 0.5087890625, 0.7943115234375, 1.079833984375, 1.3653564453125, 1.65087890625, 1.9364013671875, 2.221923828125, 2.5074462890625, 2.79296875, 3.0784912109375, 3.364013671875, 3.6495361328125, 3.93505859375, 4.2205810546875, 4.506103515625, 4.7916259765625, 5.0771484375, 5.3626708984375, 5.648193359375, 5.9337158203125, 6.21923828125, 6.5047607421875, 6.790283203125, 7.0758056640625, 7.361328125, 7.6468505859375, 7.932373046875, 8.2178955078125, 8.50341796875, 8.7889404296875, 9.074462890625, 9.3599853515625, 9.6455078125, 9.9310302734375, 10.216552734375, 10.5020751953125, 10.78759765625, 11.0731201171875, 11.358642578125, 11.6441650390625, 11.9296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 11.0, 12.0, 11.0, 18.0, 19.0, 30.0, 39.0, 39.0, 41.0, 54.0, 62.0, 71.0, 76.0, 66.0, 54.0, 65.0, 62.0, 45.0, 37.0, 38.0, 26.0, 21.0, 25.0, 21.0, 16.0, 10.0, 5.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.0794677734375, -2.947998046875, -2.8165283203125, -2.68505859375, -2.5535888671875, -2.422119140625, -2.2906494140625, -2.1591796875, -2.0277099609375, -1.896240234375, -1.7647705078125, -1.63330078125, -1.5018310546875, -1.370361328125, -1.2388916015625, -1.107421875, -0.9759521484375, -0.844482421875, -0.7130126953125, -0.58154296875, -0.4500732421875, -0.318603515625, -0.1871337890625, -0.0556640625, 0.0758056640625, 0.207275390625, 0.3387451171875, 0.47021484375, 0.6016845703125, 0.733154296875, 0.8646240234375, 0.99609375, 1.1275634765625, 1.259033203125, 1.3905029296875, 1.52197265625, 1.6534423828125, 1.784912109375, 1.9163818359375, 2.0478515625, 2.1793212890625, 2.310791015625, 2.4422607421875, 2.57373046875, 2.7052001953125, 2.836669921875, 2.9681396484375, 3.099609375, 3.2310791015625, 3.362548828125, 3.4940185546875, 3.62548828125, 3.7569580078125, 3.888427734375, 4.0198974609375, 4.1513671875, 4.2828369140625, 4.414306640625, 4.5457763671875, 4.67724609375, 4.8087158203125, 4.940185546875, 5.0716552734375, 5.203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 9.0, 13.0, 20.0, 28.0, 28.0, 38.0, 63.0, 78.0, 137.0, 311.0, 710.0, 2326.0, 9989.0, 57557.0, 575968.0, 343345.0, 46332.0, 8250.0, 2006.0, 624.0, 263.0, 148.0, 97.0, 59.0, 40.0, 33.0, 17.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.4058837890625, -10.069580078125, -9.7332763671875, -9.39697265625, -9.0606689453125, -8.724365234375, -8.3880615234375, -8.0517578125, -7.7154541015625, -7.379150390625, -7.0428466796875, -6.70654296875, -6.3702392578125, -6.033935546875, -5.6976318359375, -5.361328125, -5.0250244140625, -4.688720703125, -4.3524169921875, -4.01611328125, -3.6798095703125, -3.343505859375, -3.0072021484375, -2.6708984375, -2.3345947265625, -1.998291015625, -1.6619873046875, -1.32568359375, -0.9893798828125, -0.653076171875, -0.3167724609375, 0.01953125, 0.3558349609375, 0.692138671875, 1.0284423828125, 1.36474609375, 1.7010498046875, 2.037353515625, 2.3736572265625, 2.7099609375, 3.0462646484375, 3.382568359375, 3.7188720703125, 4.05517578125, 4.3914794921875, 4.727783203125, 5.0640869140625, 5.400390625, 5.7366943359375, 6.072998046875, 6.4093017578125, 6.74560546875, 7.0819091796875, 7.418212890625, 7.7545166015625, 8.0908203125, 8.4271240234375, 8.763427734375, 9.0997314453125, 9.43603515625, 9.7723388671875, 10.108642578125, 10.4449462890625, 10.78125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 12.0, 21.0, 19.0, 22.0, 28.0, 34.0, 28.0, 32.0, 37.0, 38.0, 41.0, 49.0, 53.0, 49.0, 44.0, 54.0, 43.0, 60.0, 44.0, 22.0, 32.0, 32.0, 31.0, 27.0, 29.0, 22.0, 9.0, 11.0, 14.0, 4.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.7127685546875, -10.378662109375, -10.0445556640625, -9.71044921875, -9.3763427734375, -9.042236328125, -8.7081298828125, -8.3740234375, -8.0399169921875, -7.705810546875, -7.3717041015625, -7.03759765625, -6.7034912109375, -6.369384765625, -6.0352783203125, -5.701171875, -5.3670654296875, -5.032958984375, -4.6988525390625, -4.36474609375, -4.0306396484375, -3.696533203125, -3.3624267578125, -3.0283203125, -2.6942138671875, -2.360107421875, -2.0260009765625, -1.69189453125, -1.3577880859375, -1.023681640625, -0.6895751953125, -0.35546875, -0.0213623046875, 0.312744140625, 0.6468505859375, 0.98095703125, 1.3150634765625, 1.649169921875, 1.9832763671875, 2.3173828125, 2.6514892578125, 2.985595703125, 3.3197021484375, 3.65380859375, 3.9879150390625, 4.322021484375, 4.6561279296875, 4.990234375, 5.3243408203125, 5.658447265625, 5.9925537109375, 6.32666015625, 6.6607666015625, 6.994873046875, 7.3289794921875, 7.6630859375, 7.9971923828125, 8.331298828125, 8.6654052734375, 8.99951171875, 9.3336181640625, 9.667724609375, 10.0018310546875, 10.3359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 15.0, 12.0, 32.0, 24.0, 33.0, 53.0, 101.0, 218.0, 401.0, 873.0, 2374.0, 7634.0, 31454.0, 166415.0, 658059.0, 142798.0, 27318.0, 6855.0, 2204.0, 857.0, 355.0, 190.0, 103.0, 59.0, 31.0, 16.0, 12.0, 11.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.671875, -2.6005401611328125, -2.529205322265625, -2.4578704833984375, -2.38653564453125, -2.3152008056640625, -2.243865966796875, -2.1725311279296875, -2.1011962890625, -2.0298614501953125, -1.958526611328125, -1.8871917724609375, -1.81585693359375, -1.7445220947265625, -1.673187255859375, -1.6018524169921875, -1.530517578125, -1.4591827392578125, -1.387847900390625, -1.3165130615234375, -1.24517822265625, -1.1738433837890625, -1.102508544921875, -1.0311737060546875, -0.9598388671875, -0.8885040283203125, -0.817169189453125, -0.7458343505859375, -0.67449951171875, -0.6031646728515625, -0.531829833984375, -0.4604949951171875, -0.38916015625, -0.3178253173828125, -0.246490478515625, -0.1751556396484375, -0.10382080078125, -0.0324859619140625, 0.038848876953125, 0.1101837158203125, 0.1815185546875, 0.2528533935546875, 0.324188232421875, 0.3955230712890625, 0.46685791015625, 0.5381927490234375, 0.609527587890625, 0.6808624267578125, 0.752197265625, 0.8235321044921875, 0.894866943359375, 0.9662017822265625, 1.03753662109375, 1.1088714599609375, 1.180206298828125, 1.2515411376953125, 1.3228759765625, 1.3942108154296875, 1.465545654296875, 1.5368804931640625, 1.60821533203125, 1.6795501708984375, 1.750885009765625, 1.8222198486328125, 1.8935546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 12.0, 15.0, 27.0, 43.0, 39.0, 72.0, 57.0, 87.0, 125.0, 114.0, 95.0, 81.0, 40.0, 61.0, 27.0, 18.0, 20.0, 16.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007195472717285156, -0.0006956607103347778, -0.00067177414894104, -0.0006478875875473022, -0.0006240010261535645, -0.0006001144647598267, -0.0005762279033660889, -0.0005523413419723511, -0.0005284547805786133, -0.0005045682191848755, -0.0004806816577911377, -0.0004567950963973999, -0.0004329085350036621, -0.0004090219736099243, -0.0003851354122161865, -0.00036124885082244873, -0.00033736228942871094, -0.00031347572803497314, -0.00028958916664123535, -0.00026570260524749756, -0.00024181604385375977, -0.00021792948246002197, -0.00019404292106628418, -0.0001701563596725464, -0.0001462697982788086, -0.0001223832368850708, -9.849667549133301e-05, -7.461011409759521e-05, -5.072355270385742e-05, -2.683699131011963e-05, -2.950429916381836e-06, 2.0936131477355957e-05, 4.482269287109375e-05, 6.870925426483154e-05, 9.259581565856934e-05, 0.00011648237705230713, 0.00014036893844604492, 0.00016425549983978271, 0.0001881420612335205, 0.0002120286226272583, 0.0002359151840209961, 0.0002598017454147339, 0.0002836883068084717, 0.00030757486820220947, 0.00033146142959594727, 0.00035534799098968506, 0.00037923455238342285, 0.00040312111377716064, 0.00042700767517089844, 0.00045089423656463623, 0.000474780797958374, 0.0004986673593521118, 0.0005225539207458496, 0.0005464404821395874, 0.0005703270435333252, 0.000594213604927063, 0.0006181001663208008, 0.0006419867277145386, 0.0006658732891082764, 0.0006897598505020142, 0.000713646411895752, 0.0007375329732894897, 0.0007614195346832275, 0.0007853060960769653, 0.0008091926574707031]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 10.0, 12.0, 13.0, 26.0, 28.0, 46.0, 99.0, 163.0, 283.0, 607.0, 1380.0, 3802.0, 13584.0, 70420.0, 581732.0, 311907.0, 48908.0, 10218.0, 3002.0, 1148.0, 513.0, 251.0, 119.0, 86.0, 50.0, 37.0, 24.0, 15.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9453125, -1.8671875, -1.7890625, -1.7109375, -1.6328125, -1.5546875, -1.4765625, -1.3984375, -1.3203125, -1.2421875, -1.1640625, -1.0859375, -1.0078125, -0.9296875, -0.8515625, -0.7734375, -0.6953125, -0.6171875, -0.5390625, -0.4609375, -0.3828125, -0.3046875, -0.2265625, -0.1484375, -0.0703125, 0.0078125, 0.0859375, 0.1640625, 0.2421875, 0.3203125, 0.3984375, 0.4765625, 0.5546875, 0.6328125, 0.7109375, 0.7890625, 0.8671875, 0.9453125, 1.0234375, 1.1015625, 1.1796875, 1.2578125, 1.3359375, 1.4140625, 1.4921875, 1.5703125, 1.6484375, 1.7265625, 1.8046875, 1.8828125, 1.9609375, 2.0390625, 2.1171875, 2.1953125, 2.2734375, 2.3515625, 2.4296875, 2.5078125, 2.5859375, 2.6640625, 2.7421875, 2.8203125, 2.8984375, 2.9765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 8.0, 14.0, 8.0, 31.0, 33.0, 40.0, 38.0, 72.0, 70.0, 76.0, 89.0, 110.0, 98.0, 70.0, 54.0, 38.0, 45.0, 30.0, 16.0, 12.0, 9.0, 9.0, 10.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.94378662109375, -1.8582763671875, -1.77276611328125, -1.687255859375, -1.60174560546875, -1.5162353515625, -1.43072509765625, -1.34521484375, -1.25970458984375, -1.1741943359375, -1.08868408203125, -1.003173828125, -0.91766357421875, -0.8321533203125, -0.74664306640625, -0.6611328125, -0.57562255859375, -0.4901123046875, -0.40460205078125, -0.319091796875, -0.23358154296875, -0.1480712890625, -0.06256103515625, 0.02294921875, 0.10845947265625, 0.1939697265625, 0.27947998046875, 0.364990234375, 0.45050048828125, 0.5360107421875, 0.62152099609375, 0.70703125, 0.79254150390625, 0.8780517578125, 0.96356201171875, 1.049072265625, 1.13458251953125, 1.2200927734375, 1.30560302734375, 1.39111328125, 1.47662353515625, 1.5621337890625, 1.64764404296875, 1.733154296875, 1.81866455078125, 1.9041748046875, 1.98968505859375, 2.0751953125, 2.16070556640625, 2.2462158203125, 2.33172607421875, 2.417236328125, 2.50274658203125, 2.5882568359375, 2.67376708984375, 2.75927734375, 2.84478759765625, 2.9302978515625, 3.01580810546875, 3.101318359375, 3.18682861328125, 3.2723388671875, 3.35784912109375, 3.443359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 22.0, 32.0, 78.0, 111.0, 269.0, 210.0, 130.0, 56.0, 30.0, 16.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.42835235595703, -76.17144775390625, -73.91454315185547, -71.65763854980469, -69.4007339477539, -67.14382934570312, -64.88692474365234, -62.63002395629883, -60.37311935424805, -58.116214752197266, -55.859310150146484, -53.6024055480957, -51.34550476074219, -49.088600158691406, -46.831695556640625, -44.574790954589844, -42.31788635253906, -40.06098175048828, -37.8040771484375, -35.54717254638672, -33.29026794433594, -31.03336524963379, -28.77646255493164, -26.51955795288086, -24.262653350830078, -22.005748748779297, -19.748844146728516, -17.491941452026367, -15.235036849975586, -12.978132247924805, -10.72122859954834, -8.464324951171875, -6.2074127197265625, -3.9505085945129395, -1.6936044692993164, 0.5632996559143066, 2.8202037811279297, 5.077108383178711, 7.334012031555176, 9.59091567993164, 11.847820281982422, 14.104724884033203, 16.361629486083984, 18.618532180786133, 20.875436782836914, 23.132341384887695, 25.389244079589844, 27.646148681640625, 29.903053283691406, 32.15995788574219, 34.41686248779297, 36.67376708984375, 38.93067169189453, 41.18757629394531, 43.44447708129883, 45.70138168334961, 47.95828628540039, 50.21519088745117, 52.47209548950195, 54.729000091552734, 56.98590087890625, 59.24280548095703, 61.49971008300781, 63.756614685058594, 66.01351928710938]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 12.0, 8.0, 9.0, 11.0, 7.0, 24.0, 19.0, 25.0, 12.0, 27.0, 28.0, 38.0, 29.0, 31.0, 40.0, 46.0, 61.0, 64.0, 90.0, 65.0, 51.0, 33.0, 26.0, 42.0, 22.0, 28.0, 31.0, 25.0, 18.0, 12.0, 11.0, 9.0, 9.0, 8.0, 8.0, 4.0, 5.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.709571838378906, -40.51557159423828, -39.321571350097656, -38.12757110595703, -36.933570861816406, -35.73957061767578, -34.545570373535156, -33.35157012939453, -32.157569885253906, -30.96356964111328, -29.769569396972656, -28.57556915283203, -27.381568908691406, -26.18756866455078, -24.993568420410156, -23.79956817626953, -22.605566024780273, -21.41156578063965, -20.217565536499023, -19.0235652923584, -17.829565048217773, -16.63556480407715, -15.441563606262207, -14.247563362121582, -13.053563117980957, -11.859562873840332, -10.665562629699707, -9.471561431884766, -8.27756118774414, -7.083561420440674, -5.889560699462891, -4.695560455322266, -3.5015602111816406, -2.3075599670410156, -1.1135594844818115, 0.08044099807739258, 1.2744412422180176, 2.4684414863586426, 3.662442207336426, 4.856442451477051, 6.050442695617676, 7.244442939758301, 8.438443183898926, 9.632444381713867, 10.826444625854492, 12.020444869995117, 13.214445114135742, 14.408445358276367, 15.602445602416992, 16.796445846557617, 17.990446090698242, 19.184446334838867, 20.378446578979492, 21.572446823120117, 22.766448974609375, 23.96044921875, 25.154449462890625, 26.34844970703125, 27.542449951171875, 28.7364501953125, 29.930450439453125, 31.12445068359375, 32.318450927734375, 33.512451171875, 34.706451416015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 10.0, 17.0, 30.0, 25.0, 49.0, 94.0, 149.0, 270.0, 468.0, 880.0, 2055.0, 5785.0, 24010.0, 240099.0, 3051608.0, 797516.0, 55876.0, 9560.0, 3043.0, 1306.0, 645.0, 315.0, 190.0, 121.0, 61.0, 41.0, 25.0, 13.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.37890625, -6.21826171875, -6.0576171875, -5.89697265625, -5.736328125, -5.57568359375, -5.4150390625, -5.25439453125, -5.09375, -4.93310546875, -4.7724609375, -4.61181640625, -4.451171875, -4.29052734375, -4.1298828125, -3.96923828125, -3.80859375, -3.64794921875, -3.4873046875, -3.32666015625, -3.166015625, -3.00537109375, -2.8447265625, -2.68408203125, -2.5234375, -2.36279296875, -2.2021484375, -2.04150390625, -1.880859375, -1.72021484375, -1.5595703125, -1.39892578125, -1.23828125, -1.07763671875, -0.9169921875, -0.75634765625, -0.595703125, -0.43505859375, -0.2744140625, -0.11376953125, 0.046875, 0.20751953125, 0.3681640625, 0.52880859375, 0.689453125, 0.85009765625, 1.0107421875, 1.17138671875, 1.33203125, 1.49267578125, 1.6533203125, 1.81396484375, 1.974609375, 2.13525390625, 2.2958984375, 2.45654296875, 2.6171875, 2.77783203125, 2.9384765625, 3.09912109375, 3.259765625, 3.42041015625, 3.5810546875, 3.74169921875, 3.90234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 4.0, 2.0, 6.0, 10.0, 13.0, 19.0, 18.0, 21.0, 30.0, 45.0, 45.0, 47.0, 47.0, 59.0, 67.0, 64.0, 62.0, 77.0, 58.0, 40.0, 44.0, 44.0, 39.0, 27.0, 31.0, 22.0, 14.0, 13.0, 8.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.692230224609375, -2.57000732421875, -2.447784423828125, -2.3255615234375, -2.203338623046875, -2.08111572265625, -1.958892822265625, -1.836669921875, -1.714447021484375, -1.59222412109375, -1.470001220703125, -1.3477783203125, -1.225555419921875, -1.10333251953125, -0.981109619140625, -0.85888671875, -0.736663818359375, -0.61444091796875, -0.492218017578125, -0.3699951171875, -0.247772216796875, -0.12554931640625, -0.003326416015625, 0.118896484375, 0.241119384765625, 0.36334228515625, 0.485565185546875, 0.6077880859375, 0.730010986328125, 0.85223388671875, 0.974456787109375, 1.0966796875, 1.218902587890625, 1.34112548828125, 1.463348388671875, 1.5855712890625, 1.707794189453125, 1.83001708984375, 1.952239990234375, 2.074462890625, 2.196685791015625, 2.31890869140625, 2.441131591796875, 2.5633544921875, 2.685577392578125, 2.80780029296875, 2.930023193359375, 3.05224609375, 3.174468994140625, 3.29669189453125, 3.418914794921875, 3.5411376953125, 3.663360595703125, 3.78558349609375, 3.907806396484375, 4.030029296875, 4.152252197265625, 4.27447509765625, 4.396697998046875, 4.5189208984375, 4.641143798828125, 4.76336669921875, 4.885589599609375, 5.0078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 14.0, 29.0, 39.0, 77.0, 131.0, 343.0, 926.0, 3490.0, 24366.0, 3194503.0, 949630.0, 16621.0, 2692.0, 802.0, 294.0, 121.0, 46.0, 48.0, 29.0, 18.0, 9.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4765625, -12.0975341796875, -11.718505859375, -11.3394775390625, -10.96044921875, -10.5814208984375, -10.202392578125, -9.8233642578125, -9.4443359375, -9.0653076171875, -8.686279296875, -8.3072509765625, -7.92822265625, -7.5491943359375, -7.170166015625, -6.7911376953125, -6.412109375, -6.0330810546875, -5.654052734375, -5.2750244140625, -4.89599609375, -4.5169677734375, -4.137939453125, -3.7589111328125, -3.3798828125, -3.0008544921875, -2.621826171875, -2.2427978515625, -1.86376953125, -1.4847412109375, -1.105712890625, -0.7266845703125, -0.34765625, 0.0313720703125, 0.410400390625, 0.7894287109375, 1.16845703125, 1.5474853515625, 1.926513671875, 2.3055419921875, 2.6845703125, 3.0635986328125, 3.442626953125, 3.8216552734375, 4.20068359375, 4.5797119140625, 4.958740234375, 5.3377685546875, 5.716796875, 6.0958251953125, 6.474853515625, 6.8538818359375, 7.23291015625, 7.6119384765625, 7.990966796875, 8.3699951171875, 8.7490234375, 9.1280517578125, 9.507080078125, 9.8861083984375, 10.26513671875, 10.6441650390625, 11.023193359375, 11.4022216796875, 11.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 26.0, 41.0, 67.0, 149.0, 330.0, 842.0, 1311.0, 673.0, 282.0, 118.0, 77.0, 27.0, 21.0, 17.0, 13.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0390625, -9.77032470703125, -9.5015869140625, -9.23284912109375, -8.964111328125, -8.69537353515625, -8.4266357421875, -8.15789794921875, -7.88916015625, -7.62042236328125, -7.3516845703125, -7.08294677734375, -6.814208984375, -6.54547119140625, -6.2767333984375, -6.00799560546875, -5.7392578125, -5.47052001953125, -5.2017822265625, -4.93304443359375, -4.664306640625, -4.39556884765625, -4.1268310546875, -3.85809326171875, -3.58935546875, -3.32061767578125, -3.0518798828125, -2.78314208984375, -2.514404296875, -2.24566650390625, -1.9769287109375, -1.70819091796875, -1.439453125, -1.17071533203125, -0.9019775390625, -0.63323974609375, -0.364501953125, -0.09576416015625, 0.1729736328125, 0.44171142578125, 0.71044921875, 0.97918701171875, 1.2479248046875, 1.51666259765625, 1.785400390625, 2.05413818359375, 2.3228759765625, 2.59161376953125, 2.8603515625, 3.12908935546875, 3.3978271484375, 3.66656494140625, 3.935302734375, 4.20404052734375, 4.4727783203125, 4.74151611328125, 5.01025390625, 5.27899169921875, 5.5477294921875, 5.81646728515625, 6.085205078125, 6.35394287109375, 6.6226806640625, 6.89141845703125, 7.16015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 23.0, 54.0, 142.0, 220.0, 225.0, 169.0, 65.0, 53.0, 19.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.946502685546875, -23.998870849609375, -22.051239013671875, -20.103609085083008, -18.155977249145508, -16.208345413208008, -14.260714530944824, -12.31308364868164, -10.36545181274414, -8.41781997680664, -6.470189094543457, -4.522557735443115, -2.5749263763427734, -0.6272945404052734, 1.3203363418579102, 3.2679672241210938, 5.215599060058594, 7.1632304191589355, 9.110861778259277, 11.058492660522461, 13.006124496459961, 14.953756332397461, 16.901386260986328, 18.849018096923828, 20.796649932861328, 22.744281768798828, 24.691913604736328, 26.639543533325195, 28.587175369262695, 30.534807205200195, 32.48243713378906, 34.43006896972656, 36.37770080566406, 38.32533264160156, 40.27296447753906, 42.22059631347656, 44.16822814941406, 46.11585998535156, 48.0634880065918, 50.0111198425293, 51.9587516784668, 53.9063835144043, 55.8540153503418, 57.8016471862793, 59.74927520751953, 61.69690704345703, 63.64453887939453, 65.59217071533203, 67.53980255126953, 69.48743438720703, 71.43506622314453, 73.38269805908203, 75.33032989501953, 77.27796173095703, 79.22559356689453, 81.1732177734375, 83.120849609375, 85.0684814453125, 87.01611328125, 88.9637451171875, 90.911376953125, 92.8590087890625, 94.806640625, 96.7542724609375, 98.701904296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 9.0, 15.0, 8.0, 21.0, 12.0, 21.0, 23.0, 32.0, 32.0, 31.0, 39.0, 43.0, 47.0, 48.0, 55.0, 55.0, 40.0, 57.0, 55.0, 49.0, 35.0, 37.0, 38.0, 29.0, 32.0, 16.0, 20.0, 19.0, 16.0, 9.0, 10.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.020801544189453, -25.223102569580078, -24.425405502319336, -23.62770652770996, -22.83000946044922, -22.032310485839844, -21.23461151123047, -20.436912536621094, -19.63921546936035, -18.841516494750977, -18.043819427490234, -17.24612045288086, -16.448421478271484, -15.650724411010742, -14.853025436401367, -14.055327415466309, -13.25762939453125, -12.459931373596191, -11.662233352661133, -10.864534378051758, -10.0668363571167, -9.26913833618164, -8.471439361572266, -7.673741340637207, -6.876043319702148, -6.07834529876709, -5.280646800994873, -4.482948303222656, -3.6852502822875977, -2.88755202293396, -2.0898537635803223, -1.2921552658081055, -0.4944572448730469, 0.3032410144805908, 1.1009392738342285, 1.8986375331878662, 2.696335792541504, 3.4940340518951416, 4.291732311248779, 5.089430809020996, 5.887128829956055, 6.684826850891113, 7.48252534866333, 8.280223846435547, 9.077921867370605, 9.875619888305664, 10.673318862915039, 11.471016883850098, 12.268714904785156, 13.066412925720215, 13.864110946655273, 14.661809921264648, 15.459507942199707, 16.257205963134766, 17.05490493774414, 17.852603912353516, 18.650300979614258, 19.447999954223633, 20.245697021484375, 21.04339599609375, 21.841094970703125, 22.638792037963867, 23.436491012573242, 24.234188079833984, 25.03188705444336]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 6.0, 12.0, 13.0, 20.0, 48.0, 65.0, 85.0, 152.0, 247.0, 429.0, 868.0, 1642.0, 3408.0, 7548.0, 17427.0, 44776.0, 129635.0, 360961.0, 311307.0, 105381.0, 37199.0, 14877.0, 6269.0, 2977.0, 1466.0, 747.0, 414.0, 213.0, 134.0, 66.0, 53.0, 26.0, 24.0, 11.0, 13.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.06640625, -3.90313720703125, -3.7398681640625, -3.57659912109375, -3.413330078125, -3.25006103515625, -3.0867919921875, -2.92352294921875, -2.76025390625, -2.59698486328125, -2.4337158203125, -2.27044677734375, -2.107177734375, -1.94390869140625, -1.7806396484375, -1.61737060546875, -1.4541015625, -1.29083251953125, -1.1275634765625, -0.96429443359375, -0.801025390625, -0.63775634765625, -0.4744873046875, -0.31121826171875, -0.14794921875, 0.01531982421875, 0.1785888671875, 0.34185791015625, 0.505126953125, 0.66839599609375, 0.8316650390625, 0.99493408203125, 1.158203125, 1.32147216796875, 1.4847412109375, 1.64801025390625, 1.811279296875, 1.97454833984375, 2.1378173828125, 2.30108642578125, 2.46435546875, 2.62762451171875, 2.7908935546875, 2.95416259765625, 3.117431640625, 3.28070068359375, 3.4439697265625, 3.60723876953125, 3.7705078125, 3.93377685546875, 4.0970458984375, 4.26031494140625, 4.423583984375, 4.58685302734375, 4.7501220703125, 4.91339111328125, 5.07666015625, 5.23992919921875, 5.4031982421875, 5.56646728515625, 5.729736328125, 5.89300537109375, 6.0562744140625, 6.21954345703125, 6.3828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 8.0, 8.0, 22.0, 26.0, 24.0, 26.0, 42.0, 48.0, 60.0, 59.0, 68.0, 62.0, 56.0, 71.0, 63.0, 44.0, 53.0, 40.0, 35.0, 32.0, 33.0, 30.0, 22.0, 9.0, 10.0, 10.0, 5.0, 3.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.15777587890625, -3.0343017578125, -2.91082763671875, -2.787353515625, -2.66387939453125, -2.5404052734375, -2.41693115234375, -2.29345703125, -2.16998291015625, -2.0465087890625, -1.92303466796875, -1.799560546875, -1.67608642578125, -1.5526123046875, -1.42913818359375, -1.3056640625, -1.18218994140625, -1.0587158203125, -0.93524169921875, -0.811767578125, -0.68829345703125, -0.5648193359375, -0.44134521484375, -0.31787109375, -0.19439697265625, -0.0709228515625, 0.05255126953125, 0.176025390625, 0.29949951171875, 0.4229736328125, 0.54644775390625, 0.669921875, 0.79339599609375, 0.9168701171875, 1.04034423828125, 1.163818359375, 1.28729248046875, 1.4107666015625, 1.53424072265625, 1.65771484375, 1.78118896484375, 1.9046630859375, 2.02813720703125, 2.151611328125, 2.27508544921875, 2.3985595703125, 2.52203369140625, 2.6455078125, 2.76898193359375, 2.8924560546875, 3.01593017578125, 3.139404296875, 3.26287841796875, 3.3863525390625, 3.50982666015625, 3.63330078125, 3.75677490234375, 3.8802490234375, 4.00372314453125, 4.127197265625, 4.25067138671875, 4.3741455078125, 4.49761962890625, 4.62109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 11.0, 17.0, 18.0, 23.0, 36.0, 44.0, 71.0, 91.0, 151.0, 255.0, 385.0, 686.0, 1436.0, 3280.0, 9254.0, 33470.0, 164231.0, 679783.0, 116711.0, 25451.0, 7490.0, 2742.0, 1240.0, 672.0, 339.0, 207.0, 134.0, 72.0, 73.0, 38.0, 26.0, 36.0, 20.0, 12.0, 9.0, 10.0, 6.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.5911865234375, -5.362060546875, -5.1329345703125, -4.90380859375, -4.6746826171875, -4.445556640625, -4.2164306640625, -3.9873046875, -3.7581787109375, -3.529052734375, -3.2999267578125, -3.07080078125, -2.8416748046875, -2.612548828125, -2.3834228515625, -2.154296875, -1.9251708984375, -1.696044921875, -1.4669189453125, -1.23779296875, -1.0086669921875, -0.779541015625, -0.5504150390625, -0.3212890625, -0.0921630859375, 0.136962890625, 0.3660888671875, 0.59521484375, 0.8243408203125, 1.053466796875, 1.2825927734375, 1.51171875, 1.7408447265625, 1.969970703125, 2.1990966796875, 2.42822265625, 2.6573486328125, 2.886474609375, 3.1156005859375, 3.3447265625, 3.5738525390625, 3.802978515625, 4.0321044921875, 4.26123046875, 4.4903564453125, 4.719482421875, 4.9486083984375, 5.177734375, 5.4068603515625, 5.635986328125, 5.8651123046875, 6.09423828125, 6.3233642578125, 6.552490234375, 6.7816162109375, 7.0107421875, 7.2398681640625, 7.468994140625, 7.6981201171875, 7.92724609375, 8.1563720703125, 8.385498046875, 8.6146240234375, 8.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 9.0, 4.0, 15.0, 10.0, 8.0, 14.0, 24.0, 31.0, 37.0, 39.0, 47.0, 45.0, 66.0, 68.0, 74.0, 73.0, 56.0, 68.0, 51.0, 47.0, 39.0, 32.0, 36.0, 16.0, 19.0, 12.0, 14.0, 15.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.5078125, -14.104736328125, -13.70166015625, -13.298583984375, -12.8955078125, -12.492431640625, -12.08935546875, -11.686279296875, -11.283203125, -10.880126953125, -10.47705078125, -10.073974609375, -9.6708984375, -9.267822265625, -8.86474609375, -8.461669921875, -8.05859375, -7.655517578125, -7.25244140625, -6.849365234375, -6.4462890625, -6.043212890625, -5.64013671875, -5.237060546875, -4.833984375, -4.430908203125, -4.02783203125, -3.624755859375, -3.2216796875, -2.818603515625, -2.41552734375, -2.012451171875, -1.609375, -1.206298828125, -0.80322265625, -0.400146484375, 0.0029296875, 0.406005859375, 0.80908203125, 1.212158203125, 1.615234375, 2.018310546875, 2.42138671875, 2.824462890625, 3.2275390625, 3.630615234375, 4.03369140625, 4.436767578125, 4.83984375, 5.242919921875, 5.64599609375, 6.049072265625, 6.4521484375, 6.855224609375, 7.25830078125, 7.661376953125, 8.064453125, 8.467529296875, 8.87060546875, 9.273681640625, 9.6767578125, 10.079833984375, 10.48291015625, 10.885986328125, 11.2890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 14.0, 15.0, 22.0, 19.0, 36.0, 61.0, 85.0, 147.0, 243.0, 406.0, 788.0, 1623.0, 3881.0, 11133.0, 39075.0, 187065.0, 668095.0, 98998.0, 23931.0, 7349.0, 2834.0, 1227.0, 638.0, 325.0, 204.0, 99.0, 67.0, 35.0, 32.0, 29.0, 11.0, 11.0, 8.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0718536376953125, -2.014801025390625, -1.9577484130859375, -1.90069580078125, -1.8436431884765625, -1.786590576171875, -1.7295379638671875, -1.6724853515625, -1.6154327392578125, -1.558380126953125, -1.5013275146484375, -1.44427490234375, -1.3872222900390625, -1.330169677734375, -1.2731170654296875, -1.216064453125, -1.1590118408203125, -1.101959228515625, -1.0449066162109375, -0.98785400390625, -0.9308013916015625, -0.873748779296875, -0.8166961669921875, -0.7596435546875, -0.7025909423828125, -0.645538330078125, -0.5884857177734375, -0.53143310546875, -0.4743804931640625, -0.417327880859375, -0.3602752685546875, -0.30322265625, -0.2461700439453125, -0.189117431640625, -0.1320648193359375, -0.07501220703125, -0.0179595947265625, 0.039093017578125, 0.0961456298828125, 0.1531982421875, 0.2102508544921875, 0.267303466796875, 0.3243560791015625, 0.38140869140625, 0.4384613037109375, 0.495513916015625, 0.5525665283203125, 0.609619140625, 0.6666717529296875, 0.723724365234375, 0.7807769775390625, 0.83782958984375, 0.8948822021484375, 0.951934814453125, 1.0089874267578125, 1.0660400390625, 1.1230926513671875, 1.180145263671875, 1.2371978759765625, 1.29425048828125, 1.3513031005859375, 1.408355712890625, 1.4654083251953125, 1.5224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 8.0, 9.0, 17.0, 18.0, 16.0, 31.0, 32.0, 33.0, 55.0, 61.0, 76.0, 75.0, 79.0, 109.0, 73.0, 60.0, 46.0, 36.0, 36.0, 23.0, 22.0, 11.0, 16.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0003807544708251953, -0.0003657899796962738, -0.0003508254885673523, -0.0003358609974384308, -0.0003208965063095093, -0.00030593201518058777, -0.00029096752405166626, -0.00027600303292274475, -0.00026103854179382324, -0.00024607405066490173, -0.00023110955953598022, -0.00021614506840705872, -0.0002011805772781372, -0.0001862160861492157, -0.0001712515950202942, -0.00015628710389137268, -0.00014132261276245117, -0.00012635812163352966, -0.00011139363050460815, -9.642913937568665e-05, -8.146464824676514e-05, -6.650015711784363e-05, -5.153566598892212e-05, -3.657117486000061e-05, -2.16066837310791e-05, -6.642192602157593e-06, 8.322298526763916e-06, 2.3286789655685425e-05, 3.8251280784606934e-05, 5.321577191352844e-05, 6.818026304244995e-05, 8.314475417137146e-05, 9.810924530029297e-05, 0.00011307373642921448, 0.00012803822755813599, 0.0001430027186870575, 0.000157967209815979, 0.0001729317009449005, 0.00018789619207382202, 0.00020286068320274353, 0.00021782517433166504, 0.00023278966546058655, 0.00024775415658950806, 0.00026271864771842957, 0.0002776831388473511, 0.0002926476299762726, 0.0003076121211051941, 0.0003225766122341156, 0.0003375411033630371, 0.0003525055944919586, 0.0003674700856208801, 0.00038243457674980164, 0.00039739906787872314, 0.00041236355900764465, 0.00042732805013656616, 0.00044229254126548767, 0.0004572570323944092, 0.0004722215235233307, 0.0004871860146522522, 0.0005021505057811737, 0.0005171149969100952, 0.0005320794880390167, 0.0005470439791679382, 0.0005620084702968597, 0.0005769729614257812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 15.0, 13.0, 17.0, 23.0, 44.0, 60.0, 76.0, 106.0, 155.0, 263.0, 419.0, 666.0, 1273.0, 2602.0, 5349.0, 12760.0, 35274.0, 122521.0, 611377.0, 177724.0, 47963.0, 16508.0, 6574.0, 3054.0, 1499.0, 873.0, 438.0, 288.0, 178.0, 130.0, 82.0, 53.0, 54.0, 21.0, 26.0, 16.0, 7.0, 9.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.4892578125, -1.444976806640625, -1.40069580078125, -1.356414794921875, -1.3121337890625, -1.267852783203125, -1.22357177734375, -1.179290771484375, -1.135009765625, -1.090728759765625, -1.04644775390625, -1.002166748046875, -0.9578857421875, -0.913604736328125, -0.86932373046875, -0.825042724609375, -0.78076171875, -0.736480712890625, -0.69219970703125, -0.647918701171875, -0.6036376953125, -0.559356689453125, -0.51507568359375, -0.470794677734375, -0.426513671875, -0.382232666015625, -0.33795166015625, -0.293670654296875, -0.2493896484375, -0.205108642578125, -0.16082763671875, -0.116546630859375, -0.072265625, -0.027984619140625, 0.01629638671875, 0.060577392578125, 0.1048583984375, 0.149139404296875, 0.19342041015625, 0.237701416015625, 0.281982421875, 0.326263427734375, 0.37054443359375, 0.414825439453125, 0.4591064453125, 0.503387451171875, 0.54766845703125, 0.591949462890625, 0.63623046875, 0.680511474609375, 0.72479248046875, 0.769073486328125, 0.8133544921875, 0.857635498046875, 0.90191650390625, 0.946197509765625, 0.990478515625, 1.034759521484375, 1.07904052734375, 1.123321533203125, 1.1676025390625, 1.211883544921875, 1.25616455078125, 1.300445556640625, 1.3447265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 9.0, 6.0, 5.0, 15.0, 15.0, 15.0, 26.0, 22.0, 28.0, 44.0, 41.0, 89.0, 73.0, 77.0, 78.0, 72.0, 63.0, 44.0, 47.0, 37.0, 43.0, 23.0, 20.0, 12.0, 13.0, 8.0, 11.0, 6.0, 9.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.79296875, -1.7374420166015625, -1.681915283203125, -1.6263885498046875, -1.57086181640625, -1.5153350830078125, -1.459808349609375, -1.4042816162109375, -1.3487548828125, -1.2932281494140625, -1.237701416015625, -1.1821746826171875, -1.12664794921875, -1.0711212158203125, -1.015594482421875, -0.9600677490234375, -0.904541015625, -0.8490142822265625, -0.793487548828125, -0.7379608154296875, -0.68243408203125, -0.6269073486328125, -0.571380615234375, -0.5158538818359375, -0.4603271484375, -0.4048004150390625, -0.349273681640625, -0.2937469482421875, -0.23822021484375, -0.1826934814453125, -0.127166748046875, -0.0716400146484375, -0.01611328125, 0.0394134521484375, 0.094940185546875, 0.1504669189453125, 0.20599365234375, 0.2615203857421875, 0.317047119140625, 0.3725738525390625, 0.4281005859375, 0.4836273193359375, 0.539154052734375, 0.5946807861328125, 0.65020751953125, 0.7057342529296875, 0.761260986328125, 0.8167877197265625, 0.872314453125, 0.9278411865234375, 0.983367919921875, 1.0388946533203125, 1.09442138671875, 1.1499481201171875, 1.205474853515625, 1.2610015869140625, 1.3165283203125, 1.3720550537109375, 1.427581787109375, 1.4831085205078125, 1.53863525390625, 1.5941619873046875, 1.649688720703125, 1.7052154541015625, 1.7607421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 28.0, 42.0, 91.0, 173.0, 327.0, 143.0, 78.0, 39.0, 16.0, 13.0, 9.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.86172485351562, -66.86456298828125, -64.86739349365234, -62.87023162841797, -60.87306594848633, -58.87590026855469, -56.87873840332031, -54.88157272338867, -52.88440704345703, -50.88724136352539, -48.89007568359375, -46.892913818359375, -44.895748138427734, -42.898582458496094, -40.90142059326172, -38.90425491333008, -36.90708923339844, -34.9099235534668, -32.912757873535156, -30.91559600830078, -28.91843032836914, -26.9212646484375, -24.924100875854492, -22.926937103271484, -20.929771423339844, -18.932605743408203, -16.935441970825195, -14.938277244567871, -12.941112518310547, -10.943947792053223, -8.946783065795898, -6.949618339538574, -4.95245361328125, -2.955288887023926, -0.9581241607666016, 1.0390405654907227, 3.036205291748047, 5.033370018005371, 7.030534744262695, 9.02769947052002, 11.024864196777344, 13.022028923034668, 15.019193649291992, 17.016357421875, 19.01352310180664, 21.01068878173828, 23.00785255432129, 25.005016326904297, 27.002182006835938, 28.999347686767578, 30.996511459350586, 32.993675231933594, 34.990840911865234, 36.988006591796875, 38.98516845703125, 40.98233413696289, 42.97949981689453, 44.97666549682617, 46.97383117675781, 48.97099304199219, 50.96815872192383, 52.96532440185547, 54.962486267089844, 56.959651947021484, 58.956817626953125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 10.0, 6.0, 18.0, 28.0, 6.0, 19.0, 23.0, 22.0, 30.0, 32.0, 38.0, 32.0, 49.0, 77.0, 108.0, 81.0, 68.0, 41.0, 35.0, 20.0, 31.0, 17.0, 22.0, 21.0, 23.0, 11.0, 12.0, 13.0, 20.0, 8.0, 6.0, 7.0, 7.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.4849853515625, -36.410030364990234, -35.33507537841797, -34.26012420654297, -33.1851692199707, -32.11021423339844, -31.035259246826172, -29.960304260253906, -28.885351181030273, -27.810396194458008, -26.735443115234375, -25.66048812866211, -24.585533142089844, -23.51058006286621, -22.435625076293945, -21.360671997070312, -20.285717010498047, -19.21076202392578, -18.13580894470215, -17.060853958129883, -15.985899925231934, -14.910945892333984, -13.835990905761719, -12.76103687286377, -11.68608283996582, -10.611128807067871, -9.536174774169922, -8.461219787597656, -7.386265754699707, -6.311311721801758, -5.23635721206665, -4.161402702331543, -3.086444854736328, -2.0114905834198, -0.9365363121032715, 0.13841795921325684, 1.2133722305297852, 2.2883262634277344, 3.363280773162842, 4.438235282897949, 5.513189315795898, 6.588143348693848, 7.663097858428955, 8.738052368164062, 9.813006401062012, 10.887960433959961, 11.962915420532227, 13.037869453430176, 14.112823486328125, 15.187777519226074, 16.262731552124023, 17.33768653869629, 18.412639617919922, 19.487594604492188, 20.562549591064453, 21.63750457763672, 22.71245765686035, 23.787412643432617, 24.86236572265625, 25.937320709228516, 27.01227569580078, 28.087228775024414, 29.16218376159668, 30.237136840820312, 31.312091827392578]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 9.0, 9.0, 15.0, 22.0, 45.0, 53.0, 83.0, 141.0, 247.0, 439.0, 941.0, 2212.0, 7312.0, 39327.0, 517621.0, 3177604.0, 403807.0, 33849.0, 6387.0, 2163.0, 961.0, 431.0, 237.0, 134.0, 63.0, 57.0, 32.0, 17.0, 10.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.7083740234375, -6.533935546875, -6.3594970703125, -6.18505859375, -6.0106201171875, -5.836181640625, -5.6617431640625, -5.4873046875, -5.3128662109375, -5.138427734375, -4.9639892578125, -4.78955078125, -4.6151123046875, -4.440673828125, -4.2662353515625, -4.091796875, -3.9173583984375, -3.742919921875, -3.5684814453125, -3.39404296875, -3.2196044921875, -3.045166015625, -2.8707275390625, -2.6962890625, -2.5218505859375, -2.347412109375, -2.1729736328125, -1.99853515625, -1.8240966796875, -1.649658203125, -1.4752197265625, -1.30078125, -1.1263427734375, -0.951904296875, -0.7774658203125, -0.60302734375, -0.4285888671875, -0.254150390625, -0.0797119140625, 0.0947265625, 0.2691650390625, 0.443603515625, 0.6180419921875, 0.79248046875, 0.9669189453125, 1.141357421875, 1.3157958984375, 1.490234375, 1.6646728515625, 1.839111328125, 2.0135498046875, 2.18798828125, 2.3624267578125, 2.536865234375, 2.7113037109375, 2.8857421875, 3.0601806640625, 3.234619140625, 3.4090576171875, 3.58349609375, 3.7579345703125, 3.932373046875, 4.1068115234375, 4.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 6.0, 16.0, 23.0, 25.0, 23.0, 33.0, 28.0, 59.0, 52.0, 62.0, 61.0, 47.0, 71.0, 63.0, 48.0, 54.0, 50.0, 47.0, 29.0, 37.0, 30.0, 35.0, 22.0, 16.0, 12.0, 5.0, 5.0, 8.0, 5.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.790435791015625, -2.67266845703125, -2.554901123046875, -2.4371337890625, -2.319366455078125, -2.20159912109375, -2.083831787109375, -1.966064453125, -1.848297119140625, -1.73052978515625, -1.612762451171875, -1.4949951171875, -1.377227783203125, -1.25946044921875, -1.141693115234375, -1.02392578125, -0.906158447265625, -0.78839111328125, -0.670623779296875, -0.5528564453125, -0.435089111328125, -0.31732177734375, -0.199554443359375, -0.081787109375, 0.035980224609375, 0.15374755859375, 0.271514892578125, 0.3892822265625, 0.507049560546875, 0.62481689453125, 0.742584228515625, 0.8603515625, 0.978118896484375, 1.09588623046875, 1.213653564453125, 1.3314208984375, 1.449188232421875, 1.56695556640625, 1.684722900390625, 1.802490234375, 1.920257568359375, 2.03802490234375, 2.155792236328125, 2.2735595703125, 2.391326904296875, 2.50909423828125, 2.626861572265625, 2.74462890625, 2.862396240234375, 2.98016357421875, 3.097930908203125, 3.2156982421875, 3.333465576171875, 3.45123291015625, 3.569000244140625, 3.686767578125, 3.804534912109375, 3.92230224609375, 4.040069580078125, 4.1578369140625, 4.275604248046875, 4.39337158203125, 4.511138916015625, 4.62890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 12.0, 18.0, 19.0, 30.0, 63.0, 146.0, 341.0, 995.0, 5011.0, 96898.0, 4044440.0, 41735.0, 3290.0, 736.0, 267.0, 140.0, 49.0, 29.0, 21.0, 12.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.921875, -16.44384765625, -15.9658203125, -15.48779296875, -15.009765625, -14.53173828125, -14.0537109375, -13.57568359375, -13.09765625, -12.61962890625, -12.1416015625, -11.66357421875, -11.185546875, -10.70751953125, -10.2294921875, -9.75146484375, -9.2734375, -8.79541015625, -8.3173828125, -7.83935546875, -7.361328125, -6.88330078125, -6.4052734375, -5.92724609375, -5.44921875, -4.97119140625, -4.4931640625, -4.01513671875, -3.537109375, -3.05908203125, -2.5810546875, -2.10302734375, -1.625, -1.14697265625, -0.6689453125, -0.19091796875, 0.287109375, 0.76513671875, 1.2431640625, 1.72119140625, 2.19921875, 2.67724609375, 3.1552734375, 3.63330078125, 4.111328125, 4.58935546875, 5.0673828125, 5.54541015625, 6.0234375, 6.50146484375, 6.9794921875, 7.45751953125, 7.935546875, 8.41357421875, 8.8916015625, 9.36962890625, 9.84765625, 10.32568359375, 10.8037109375, 11.28173828125, 11.759765625, 12.23779296875, 12.7158203125, 13.19384765625, 13.671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 11.0, 23.0, 16.0, 41.0, 88.0, 136.0, 418.0, 1032.0, 1305.0, 567.0, 220.0, 93.0, 41.0, 28.0, 13.0, 14.0, 9.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.5755615234375, -13.229248046875, -12.8829345703125, -12.53662109375, -12.1903076171875, -11.843994140625, -11.4976806640625, -11.1513671875, -10.8050537109375, -10.458740234375, -10.1124267578125, -9.76611328125, -9.4197998046875, -9.073486328125, -8.7271728515625, -8.380859375, -8.0345458984375, -7.688232421875, -7.3419189453125, -6.99560546875, -6.6492919921875, -6.302978515625, -5.9566650390625, -5.6103515625, -5.2640380859375, -4.917724609375, -4.5714111328125, -4.22509765625, -3.8787841796875, -3.532470703125, -3.1861572265625, -2.83984375, -2.4935302734375, -2.147216796875, -1.8009033203125, -1.45458984375, -1.1082763671875, -0.761962890625, -0.4156494140625, -0.0693359375, 0.2769775390625, 0.623291015625, 0.9696044921875, 1.31591796875, 1.6622314453125, 2.008544921875, 2.3548583984375, 2.701171875, 3.0474853515625, 3.393798828125, 3.7401123046875, 4.08642578125, 4.4327392578125, 4.779052734375, 5.1253662109375, 5.4716796875, 5.8179931640625, 6.164306640625, 6.5106201171875, 6.85693359375, 7.2032470703125, 7.549560546875, 7.8958740234375, 8.2421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 5.0, 8.0, 14.0, 22.0, 18.0, 43.0, 53.0, 86.0, 115.0, 137.0, 180.0, 128.0, 75.0, 47.0, 28.0, 13.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.12649154663086, -55.70967483520508, -54.29285430908203, -52.87603759765625, -51.45922088623047, -50.04240417480469, -48.62558364868164, -47.20876693725586, -45.79194641113281, -44.37512969970703, -42.958309173583984, -41.5414924621582, -40.12467575073242, -38.707855224609375, -37.291038513183594, -35.87422180175781, -34.45740509033203, -33.04058837890625, -31.623769760131836, -30.206951141357422, -28.79013442993164, -27.373315811157227, -25.956497192382812, -24.53968048095703, -23.122861862182617, -21.706043243408203, -20.289226531982422, -18.872407913208008, -17.455589294433594, -16.038772583007812, -14.621953964233398, -13.2051362991333, -11.788314819335938, -10.37149715423584, -8.954679489135742, -7.537860870361328, -6.1210432052612305, -4.704225540161133, -3.2874069213867188, -1.870589256286621, -0.45377159118652344, 0.9630463123321533, 2.37986421585083, 3.796682357788086, 5.213500022888184, 6.630317687988281, 8.047136306762695, 9.463953971862793, 10.88077163696289, 12.297589302062988, 13.714406967163086, 15.1312255859375, 16.54804229736328, 17.964860916137695, 19.38167953491211, 20.79849624633789, 22.215314865112305, 23.63213348388672, 25.0489501953125, 26.465768814086914, 27.882587432861328, 29.29940414428711, 30.716222763061523, 32.13304138183594, 33.54985809326172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 10.0, 9.0, 10.0, 13.0, 12.0, 23.0, 17.0, 19.0, 20.0, 23.0, 23.0, 24.0, 31.0, 40.0, 39.0, 30.0, 34.0, 38.0, 41.0, 42.0, 40.0, 46.0, 54.0, 37.0, 33.0, 36.0, 32.0, 24.0, 27.0, 18.0, 17.0, 18.0, 15.0, 18.0, 14.0, 17.0, 11.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.05431365966797, -26.233734130859375, -25.41315269470215, -24.592573165893555, -23.77199363708496, -22.951412200927734, -22.13083267211914, -21.310253143310547, -20.48967170715332, -19.669092178344727, -18.8485107421875, -18.027931213378906, -17.207351684570312, -16.386770248413086, -15.566190719604492, -14.745610237121582, -13.925030708312988, -13.104450225830078, -12.283870697021484, -11.463290214538574, -10.642709732055664, -9.82213020324707, -9.00154972076416, -8.18096923828125, -7.360389232635498, -6.539809226989746, -5.719228744506836, -4.898648738861084, -4.078068733215332, -3.257488250732422, -2.43690824508667, -1.6163277626037598, -0.7957477569580078, 0.024832427501678467, 0.8454126119613647, 1.6659927368164062, 2.4865729808807373, 3.3071532249450684, 4.12773323059082, 4.9483137130737305, 5.768893718719482, 6.589473724365234, 7.4100542068481445, 8.230634689331055, 9.051214218139648, 9.871794700622559, 10.692375183105469, 11.512954711914062, 12.333535194396973, 13.154115676879883, 13.974695205688477, 14.795275688171387, 15.615856170654297, 16.43643569946289, 17.257015228271484, 18.07759666442871, 18.898176193237305, 19.7187557220459, 20.539337158203125, 21.35991668701172, 22.180496215820312, 23.00107765197754, 23.821657180786133, 24.64223861694336, 25.462818145751953]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 18.0, 27.0, 42.0, 69.0, 133.0, 212.0, 329.0, 674.0, 1221.0, 2262.0, 4624.0, 9992.0, 23085.0, 63817.0, 217312.0, 473976.0, 164647.0, 50186.0, 19214.0, 8275.0, 3957.0, 2029.0, 1093.0, 565.0, 313.0, 182.0, 106.0, 52.0, 42.0, 32.0, 14.0, 13.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.80078125, -7.5921630859375, -7.383544921875, -7.1749267578125, -6.96630859375, -6.7576904296875, -6.549072265625, -6.3404541015625, -6.1318359375, -5.9232177734375, -5.714599609375, -5.5059814453125, -5.29736328125, -5.0887451171875, -4.880126953125, -4.6715087890625, -4.462890625, -4.2542724609375, -4.045654296875, -3.8370361328125, -3.62841796875, -3.4197998046875, -3.211181640625, -3.0025634765625, -2.7939453125, -2.5853271484375, -2.376708984375, -2.1680908203125, -1.95947265625, -1.7508544921875, -1.542236328125, -1.3336181640625, -1.125, -0.9163818359375, -0.707763671875, -0.4991455078125, -0.29052734375, -0.0819091796875, 0.126708984375, 0.3353271484375, 0.5439453125, 0.7525634765625, 0.961181640625, 1.1697998046875, 1.37841796875, 1.5870361328125, 1.795654296875, 2.0042724609375, 2.212890625, 2.4215087890625, 2.630126953125, 2.8387451171875, 3.04736328125, 3.2559814453125, 3.464599609375, 3.6732177734375, 3.8818359375, 4.0904541015625, 4.299072265625, 4.5076904296875, 4.71630859375, 4.9249267578125, 5.133544921875, 5.3421630859375, 5.55078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 8.0, 7.0, 16.0, 24.0, 21.0, 21.0, 26.0, 35.0, 36.0, 50.0, 53.0, 63.0, 65.0, 59.0, 56.0, 43.0, 51.0, 57.0, 50.0, 43.0, 36.0, 28.0, 31.0, 21.0, 22.0, 13.0, 10.0, 20.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.117767333984375, -2.99920654296875, -2.880645751953125, -2.7620849609375, -2.643524169921875, -2.52496337890625, -2.406402587890625, -2.287841796875, -2.169281005859375, -2.05072021484375, -1.932159423828125, -1.8135986328125, -1.695037841796875, -1.57647705078125, -1.457916259765625, -1.33935546875, -1.220794677734375, -1.10223388671875, -0.983673095703125, -0.8651123046875, -0.746551513671875, -0.62799072265625, -0.509429931640625, -0.390869140625, -0.272308349609375, -0.15374755859375, -0.035186767578125, 0.0833740234375, 0.201934814453125, 0.32049560546875, 0.439056396484375, 0.5576171875, 0.676177978515625, 0.79473876953125, 0.913299560546875, 1.0318603515625, 1.150421142578125, 1.26898193359375, 1.387542724609375, 1.506103515625, 1.624664306640625, 1.74322509765625, 1.861785888671875, 1.9803466796875, 2.098907470703125, 2.21746826171875, 2.336029052734375, 2.45458984375, 2.573150634765625, 2.69171142578125, 2.810272216796875, 2.9288330078125, 3.047393798828125, 3.16595458984375, 3.284515380859375, 3.403076171875, 3.521636962890625, 3.64019775390625, 3.758758544921875, 3.8773193359375, 3.995880126953125, 4.11444091796875, 4.233001708984375, 4.3515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 4.0, 4.0, 10.0, 16.0, 17.0, 23.0, 51.0, 61.0, 127.0, 182.0, 323.0, 642.0, 1321.0, 3552.0, 16770.0, 220225.0, 766802.0, 29886.0, 5220.0, 1649.0, 716.0, 380.0, 221.0, 122.0, 93.0, 52.0, 28.0, 19.0, 14.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.5792236328125, -10.158447265625, -9.7376708984375, -9.31689453125, -8.8961181640625, -8.475341796875, -8.0545654296875, -7.6337890625, -7.2130126953125, -6.792236328125, -6.3714599609375, -5.95068359375, -5.5299072265625, -5.109130859375, -4.6883544921875, -4.267578125, -3.8468017578125, -3.426025390625, -3.0052490234375, -2.58447265625, -2.1636962890625, -1.742919921875, -1.3221435546875, -0.9013671875, -0.4805908203125, -0.059814453125, 0.3609619140625, 0.78173828125, 1.2025146484375, 1.623291015625, 2.0440673828125, 2.46484375, 2.8856201171875, 3.306396484375, 3.7271728515625, 4.14794921875, 4.5687255859375, 4.989501953125, 5.4102783203125, 5.8310546875, 6.2518310546875, 6.672607421875, 7.0933837890625, 7.51416015625, 7.9349365234375, 8.355712890625, 8.7764892578125, 9.197265625, 9.6180419921875, 10.038818359375, 10.4595947265625, 10.88037109375, 11.3011474609375, 11.721923828125, 12.1427001953125, 12.5634765625, 12.9842529296875, 13.405029296875, 13.8258056640625, 14.24658203125, 14.6673583984375, 15.088134765625, 15.5089111328125, 15.9296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 8.0, 2.0, 7.0, 7.0, 12.0, 22.0, 26.0, 26.0, 34.0, 44.0, 54.0, 73.0, 93.0, 82.0, 82.0, 85.0, 69.0, 60.0, 59.0, 39.0, 23.0, 24.0, 12.0, 11.0, 6.0, 10.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.46875, -18.97119140625, -18.4736328125, -17.97607421875, -17.478515625, -16.98095703125, -16.4833984375, -15.98583984375, -15.48828125, -14.99072265625, -14.4931640625, -13.99560546875, -13.498046875, -13.00048828125, -12.5029296875, -12.00537109375, -11.5078125, -11.01025390625, -10.5126953125, -10.01513671875, -9.517578125, -9.02001953125, -8.5224609375, -8.02490234375, -7.52734375, -7.02978515625, -6.5322265625, -6.03466796875, -5.537109375, -5.03955078125, -4.5419921875, -4.04443359375, -3.546875, -3.04931640625, -2.5517578125, -2.05419921875, -1.556640625, -1.05908203125, -0.5615234375, -0.06396484375, 0.43359375, 0.93115234375, 1.4287109375, 1.92626953125, 2.423828125, 2.92138671875, 3.4189453125, 3.91650390625, 4.4140625, 4.91162109375, 5.4091796875, 5.90673828125, 6.404296875, 6.90185546875, 7.3994140625, 7.89697265625, 8.39453125, 8.89208984375, 9.3896484375, 9.88720703125, 10.384765625, 10.88232421875, 11.3798828125, 11.87744140625, 12.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 12.0, 14.0, 17.0, 26.0, 32.0, 46.0, 52.0, 81.0, 127.0, 200.0, 285.0, 530.0, 890.0, 1873.0, 4759.0, 15161.0, 65905.0, 659554.0, 239317.0, 41909.0, 10576.0, 3614.0, 1542.0, 797.0, 367.0, 268.0, 164.0, 124.0, 63.0, 58.0, 45.0, 33.0, 25.0, 22.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.9091796875, -1.85107421875, -1.79296875, -1.73486328125, -1.6767578125, -1.61865234375, -1.560546875, -1.50244140625, -1.4443359375, -1.38623046875, -1.328125, -1.27001953125, -1.2119140625, -1.15380859375, -1.095703125, -1.03759765625, -0.9794921875, -0.92138671875, -0.86328125, -0.80517578125, -0.7470703125, -0.68896484375, -0.630859375, -0.57275390625, -0.5146484375, -0.45654296875, -0.3984375, -0.34033203125, -0.2822265625, -0.22412109375, -0.166015625, -0.10791015625, -0.0498046875, 0.00830078125, 0.06640625, 0.12451171875, 0.1826171875, 0.24072265625, 0.298828125, 0.35693359375, 0.4150390625, 0.47314453125, 0.53125, 0.58935546875, 0.6474609375, 0.70556640625, 0.763671875, 0.82177734375, 0.8798828125, 0.93798828125, 0.99609375, 1.05419921875, 1.1123046875, 1.17041015625, 1.228515625, 1.28662109375, 1.3447265625, 1.40283203125, 1.4609375, 1.51904296875, 1.5771484375, 1.63525390625, 1.693359375, 1.75146484375, 1.8095703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 13.0, 10.0, 10.0, 11.0, 17.0, 19.0, 25.0, 30.0, 51.0, 54.0, 92.0, 103.0, 104.0, 107.0, 75.0, 73.0, 44.0, 38.0, 19.0, 20.0, 17.0, 14.0, 15.0, 4.0, 2.0, 3.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006914138793945312, -0.0006729662418365479, -0.0006545186042785645, -0.0006360709667205811, -0.0006176233291625977, -0.0005991756916046143, -0.0005807280540466309, -0.0005622804164886475, -0.0005438327789306641, -0.0005253851413726807, -0.0005069375038146973, -0.0004884898662567139, -0.00047004222869873047, -0.00045159459114074707, -0.00043314695358276367, -0.0004146993160247803, -0.0003962516784667969, -0.0003778040409088135, -0.0003593564033508301, -0.0003409087657928467, -0.0003224611282348633, -0.0003040134906768799, -0.0002855658531188965, -0.0002671182155609131, -0.0002486705780029297, -0.0002302229404449463, -0.0002117753028869629, -0.0001933276653289795, -0.0001748800277709961, -0.0001564323902130127, -0.0001379847526550293, -0.0001195371150970459, -0.0001010894775390625, -8.26418399810791e-05, -6.41942024230957e-05, -4.5746564865112305e-05, -2.7298927307128906e-05, -8.851289749145508e-06, 9.59634780883789e-06, 2.804398536682129e-05, 4.649162292480469e-05, 6.493926048278809e-05, 8.338689804077148e-05, 0.00010183453559875488, 0.00012028217315673828, 0.00013872981071472168, 0.00015717744827270508, 0.00017562508583068848, 0.00019407272338867188, 0.00021252036094665527, 0.00023096799850463867, 0.00024941563606262207, 0.00026786327362060547, 0.00028631091117858887, 0.00030475854873657227, 0.00032320618629455566, 0.00034165382385253906, 0.00036010146141052246, 0.00037854909896850586, 0.00039699673652648926, 0.00041544437408447266, 0.00043389201164245605, 0.00045233964920043945, 0.00047078728675842285, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 15.0, 22.0, 47.0, 77.0, 127.0, 223.0, 498.0, 1051.0, 2964.0, 10951.0, 81139.0, 847685.0, 86914.0, 11443.0, 3177.0, 1164.0, 468.0, 243.0, 124.0, 77.0, 50.0, 21.0, 19.0, 10.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.2890625, -3.201385498046875, -3.11370849609375, -3.026031494140625, -2.9383544921875, -2.850677490234375, -2.76300048828125, -2.675323486328125, -2.587646484375, -2.499969482421875, -2.41229248046875, -2.324615478515625, -2.2369384765625, -2.149261474609375, -2.06158447265625, -1.973907470703125, -1.88623046875, -1.798553466796875, -1.71087646484375, -1.623199462890625, -1.5355224609375, -1.447845458984375, -1.36016845703125, -1.272491455078125, -1.184814453125, -1.097137451171875, -1.00946044921875, -0.921783447265625, -0.8341064453125, -0.746429443359375, -0.65875244140625, -0.571075439453125, -0.4833984375, -0.395721435546875, -0.30804443359375, -0.220367431640625, -0.1326904296875, -0.045013427734375, 0.04266357421875, 0.130340576171875, 0.218017578125, 0.305694580078125, 0.39337158203125, 0.481048583984375, 0.5687255859375, 0.656402587890625, 0.74407958984375, 0.831756591796875, 0.91943359375, 1.007110595703125, 1.09478759765625, 1.182464599609375, 1.2701416015625, 1.357818603515625, 1.44549560546875, 1.533172607421875, 1.620849609375, 1.708526611328125, 1.79620361328125, 1.883880615234375, 1.9715576171875, 2.059234619140625, 2.14691162109375, 2.234588623046875, 2.322265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 10.0, 6.0, 6.0, 19.0, 22.0, 22.0, 36.0, 42.0, 76.0, 91.0, 129.0, 128.0, 109.0, 81.0, 51.0, 55.0, 37.0, 29.0, 21.0, 11.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0625, -2.975555419921875, -2.88861083984375, -2.801666259765625, -2.7147216796875, -2.627777099609375, -2.54083251953125, -2.453887939453125, -2.366943359375, -2.279998779296875, -2.19305419921875, -2.106109619140625, -2.0191650390625, -1.932220458984375, -1.84527587890625, -1.758331298828125, -1.67138671875, -1.584442138671875, -1.49749755859375, -1.410552978515625, -1.3236083984375, -1.236663818359375, -1.14971923828125, -1.062774658203125, -0.975830078125, -0.888885498046875, -0.80194091796875, -0.714996337890625, -0.6280517578125, -0.541107177734375, -0.45416259765625, -0.367218017578125, -0.2802734375, -0.193328857421875, -0.10638427734375, -0.019439697265625, 0.0675048828125, 0.154449462890625, 0.24139404296875, 0.328338623046875, 0.415283203125, 0.502227783203125, 0.58917236328125, 0.676116943359375, 0.7630615234375, 0.850006103515625, 0.93695068359375, 1.023895263671875, 1.11083984375, 1.197784423828125, 1.28472900390625, 1.371673583984375, 1.4586181640625, 1.545562744140625, 1.63250732421875, 1.719451904296875, 1.806396484375, 1.893341064453125, 1.98028564453125, 2.067230224609375, 2.1541748046875, 2.241119384765625, 2.32806396484375, 2.415008544921875, 2.501953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 20.0, 43.0, 101.0, 280.0, 298.0, 118.0, 65.0, 32.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.96814727783203, -79.55622863769531, -77.1443099975586, -74.7323989868164, -72.32048034667969, -69.90856170654297, -67.49664306640625, -65.08473205566406, -62.672813415527344, -60.260894775390625, -57.84897994995117, -55.43706130981445, -53.025146484375, -50.61322784423828, -48.20130920410156, -45.78939437866211, -43.37747573852539, -40.96555709838867, -38.55364227294922, -36.1417236328125, -33.72980880737305, -31.317890167236328, -28.905973434448242, -26.494056701660156, -24.08213996887207, -21.670223236083984, -19.2583065032959, -16.846389770507812, -14.43447208404541, -12.022555351257324, -9.610637664794922, -7.198720932006836, -4.78680419921875, -2.374887228012085, 0.03702974319458008, 2.448946952819824, 4.86086368560791, 7.272780418395996, 9.684698104858398, 12.096614837646484, 14.50853157043457, 16.920448303222656, 19.332365036010742, 21.744281768798828, 24.156200408935547, 26.568115234375, 28.98003387451172, 31.391950607299805, 33.80386734008789, 36.21578598022461, 38.62770080566406, 41.03961944580078, 43.451534271240234, 45.86345291137695, 48.275367736816406, 50.687286376953125, 53.099205017089844, 55.51112365722656, 57.923038482666016, 60.334957122802734, 62.74687194824219, 65.1587905883789, 67.57070922851562, 69.98262023925781, 72.39453887939453]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 5.0, 13.0, 10.0, 12.0, 14.0, 16.0, 10.0, 23.0, 25.0, 22.0, 19.0, 25.0, 39.0, 33.0, 46.0, 93.0, 128.0, 111.0, 51.0, 42.0, 31.0, 30.0, 17.0, 22.0, 22.0, 15.0, 23.0, 8.0, 21.0, 15.0, 7.0, 2.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.72791290283203, -37.50796127319336, -36.28800582885742, -35.06805419921875, -33.84809875488281, -32.62814712524414, -31.408191680908203, -30.18824005126953, -28.968284606933594, -27.74833106994629, -26.528377532958984, -25.30842399597168, -24.088470458984375, -22.86851692199707, -21.648563385009766, -20.428611755371094, -19.20865821838379, -17.988704681396484, -16.76875114440918, -15.548797607421875, -14.32884407043457, -13.108890533447266, -11.888937950134277, -10.668984413146973, -9.449030876159668, -8.229077339172363, -7.009123802185059, -5.789170742034912, -4.569217205047607, -3.3492636680603027, -2.1293106079101562, -0.9093570709228516, 0.3105964660644531, 1.5305498838424683, 2.7505033016204834, 3.970456600189209, 5.190410137176514, 6.410363674163818, 7.630316734313965, 8.85027027130127, 10.070223808288574, 11.290177345275879, 12.510130882263184, 13.730083465576172, 14.950037002563477, 16.16999053955078, 17.389944076538086, 18.60989761352539, 19.829851150512695, 21.0498046875, 22.269758224487305, 23.48971176147461, 24.709665298461914, 25.92961883544922, 27.14957046508789, 28.369525909423828, 29.5894775390625, 30.809431076049805, 32.02938461303711, 33.24933624267578, 34.46929168701172, 35.68924331665039, 36.90919876098633, 38.129150390625, 39.34910583496094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 10.0, 6.0, 18.0, 23.0, 56.0, 78.0, 138.0, 301.0, 602.0, 1692.0, 5366.0, 29384.0, 672991.0, 3288345.0, 175650.0, 14293.0, 3361.0, 1103.0, 451.0, 205.0, 76.0, 54.0, 31.0, 25.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9749755859375, -11.645263671875, -11.3155517578125, -10.98583984375, -10.6561279296875, -10.326416015625, -9.9967041015625, -9.6669921875, -9.3372802734375, -9.007568359375, -8.6778564453125, -8.34814453125, -8.0184326171875, -7.688720703125, -7.3590087890625, -7.029296875, -6.6995849609375, -6.369873046875, -6.0401611328125, -5.71044921875, -5.3807373046875, -5.051025390625, -4.7213134765625, -4.3916015625, -4.0618896484375, -3.732177734375, -3.4024658203125, -3.07275390625, -2.7430419921875, -2.413330078125, -2.0836181640625, -1.75390625, -1.4241943359375, -1.094482421875, -0.7647705078125, -0.43505859375, -0.1053466796875, 0.224365234375, 0.5540771484375, 0.8837890625, 1.2135009765625, 1.543212890625, 1.8729248046875, 2.20263671875, 2.5323486328125, 2.862060546875, 3.1917724609375, 3.521484375, 3.8511962890625, 4.180908203125, 4.5106201171875, 4.84033203125, 5.1700439453125, 5.499755859375, 5.8294677734375, 6.1591796875, 6.4888916015625, 6.818603515625, 7.1483154296875, 7.47802734375, 7.8077392578125, 8.137451171875, 8.4671630859375, 8.796875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 13.0, 17.0, 20.0, 17.0, 16.0, 29.0, 35.0, 45.0, 47.0, 46.0, 52.0, 51.0, 62.0, 68.0, 61.0, 48.0, 58.0, 52.0, 54.0, 31.0, 39.0, 32.0, 20.0, 16.0, 15.0, 11.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.09423828125, -2.9775390625, -2.86083984375, -2.744140625, -2.62744140625, -2.5107421875, -2.39404296875, -2.27734375, -2.16064453125, -2.0439453125, -1.92724609375, -1.810546875, -1.69384765625, -1.5771484375, -1.46044921875, -1.34375, -1.22705078125, -1.1103515625, -0.99365234375, -0.876953125, -0.76025390625, -0.6435546875, -0.52685546875, -0.41015625, -0.29345703125, -0.1767578125, -0.06005859375, 0.056640625, 0.17333984375, 0.2900390625, 0.40673828125, 0.5234375, 0.64013671875, 0.7568359375, 0.87353515625, 0.990234375, 1.10693359375, 1.2236328125, 1.34033203125, 1.45703125, 1.57373046875, 1.6904296875, 1.80712890625, 1.923828125, 2.04052734375, 2.1572265625, 2.27392578125, 2.390625, 2.50732421875, 2.6240234375, 2.74072265625, 2.857421875, 2.97412109375, 3.0908203125, 3.20751953125, 3.32421875, 3.44091796875, 3.5576171875, 3.67431640625, 3.791015625, 3.90771484375, 4.0244140625, 4.14111328125, 4.2578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 12.0, 19.0, 26.0, 50.0, 104.0, 166.0, 368.0, 816.0, 2005.0, 6926.0, 80892.0, 4015915.0, 77049.0, 6406.0, 1920.0, 726.0, 367.0, 197.0, 107.0, 68.0, 35.0, 21.0, 17.0, 15.0, 9.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0625, -13.510986328125, -12.95947265625, -12.407958984375, -11.8564453125, -11.304931640625, -10.75341796875, -10.201904296875, -9.650390625, -9.098876953125, -8.54736328125, -7.995849609375, -7.4443359375, -6.892822265625, -6.34130859375, -5.789794921875, -5.23828125, -4.686767578125, -4.13525390625, -3.583740234375, -3.0322265625, -2.480712890625, -1.92919921875, -1.377685546875, -0.826171875, -0.274658203125, 0.27685546875, 0.828369140625, 1.3798828125, 1.931396484375, 2.48291015625, 3.034423828125, 3.5859375, 4.137451171875, 4.68896484375, 5.240478515625, 5.7919921875, 6.343505859375, 6.89501953125, 7.446533203125, 7.998046875, 8.549560546875, 9.10107421875, 9.652587890625, 10.2041015625, 10.755615234375, 11.30712890625, 11.858642578125, 12.41015625, 12.961669921875, 13.51318359375, 14.064697265625, 14.6162109375, 15.167724609375, 15.71923828125, 16.270751953125, 16.822265625, 17.373779296875, 17.92529296875, 18.476806640625, 19.0283203125, 19.579833984375, 20.13134765625, 20.682861328125, 21.234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 8.0, 14.0, 11.0, 26.0, 28.0, 48.0, 73.0, 96.0, 156.0, 298.0, 516.0, 813.0, 849.0, 492.0, 233.0, 167.0, 85.0, 59.0, 34.0, 20.0, 16.0, 15.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.181884765625, -13.80908203125, -13.436279296875, -13.0634765625, -12.690673828125, -12.31787109375, -11.945068359375, -11.572265625, -11.199462890625, -10.82666015625, -10.453857421875, -10.0810546875, -9.708251953125, -9.33544921875, -8.962646484375, -8.58984375, -8.217041015625, -7.84423828125, -7.471435546875, -7.0986328125, -6.725830078125, -6.35302734375, -5.980224609375, -5.607421875, -5.234619140625, -4.86181640625, -4.489013671875, -4.1162109375, -3.743408203125, -3.37060546875, -2.997802734375, -2.625, -2.252197265625, -1.87939453125, -1.506591796875, -1.1337890625, -0.760986328125, -0.38818359375, -0.015380859375, 0.357421875, 0.730224609375, 1.10302734375, 1.475830078125, 1.8486328125, 2.221435546875, 2.59423828125, 2.967041015625, 3.33984375, 3.712646484375, 4.08544921875, 4.458251953125, 4.8310546875, 5.203857421875, 5.57666015625, 5.949462890625, 6.322265625, 6.695068359375, 7.06787109375, 7.440673828125, 7.8134765625, 8.186279296875, 8.55908203125, 8.931884765625, 9.3046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 9.0, 14.0, 21.0, 45.0, 80.0, 167.0, 243.0, 192.0, 108.0, 49.0, 25.0, 15.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.19721984863281, -110.23877716064453, -106.28034210205078, -102.3218994140625, -98.36346435546875, -94.40502166748047, -90.44657897949219, -86.48814392089844, -82.52970886230469, -78.5712661743164, -74.61283111572266, -70.65438842773438, -66.69595336914062, -62.737510681152344, -58.77907180786133, -54.82063293457031, -50.86219024658203, -46.903751373291016, -42.9453125, -38.98686981201172, -35.02843475341797, -31.06999397277832, -27.111553192138672, -23.153114318847656, -19.19467544555664, -15.236236572265625, -11.277796745300293, -7.319356918334961, -3.3609180450439453, 0.5975208282470703, 4.555961608886719, 8.514400482177734, 12.47283935546875, 16.431278228759766, 20.38971710205078, 24.34815788269043, 28.306596755981445, 32.265037536621094, 36.22347640991211, 40.181915283203125, 44.14035415649414, 48.098793029785156, 52.05723190307617, 56.01567077636719, 59.97411346435547, 63.93254852294922, 67.8909912109375, 71.84942626953125, 75.80786895751953, 79.76631164550781, 83.72474670410156, 87.68318939208984, 91.6416244506836, 95.60006713867188, 99.55850219726562, 103.5169448852539, 107.47538757324219, 111.43383026123047, 115.39226531982422, 119.3507080078125, 123.30914306640625, 127.26758575439453, 131.2260284423828, 135.18446350097656, 139.1428985595703]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 15.0, 11.0, 23.0, 19.0, 20.0, 21.0, 31.0, 27.0, 39.0, 42.0, 40.0, 60.0, 60.0, 57.0, 60.0, 41.0, 45.0, 29.0, 46.0, 43.0, 39.0, 36.0, 38.0, 32.0, 24.0, 19.0, 15.0, 14.0, 12.0, 8.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96317672729492, -43.280418395996094, -41.59765625, -39.91489791870117, -38.232139587402344, -36.54937744140625, -34.86661911010742, -33.183860778808594, -31.5010986328125, -29.81833839416504, -28.135578155517578, -26.45281982421875, -24.77005958557129, -23.087299346923828, -21.404541015625, -19.72178077697754, -18.039020538330078, -16.356260299682617, -14.673501014709473, -12.990741729736328, -11.307981491088867, -9.625221252441406, -7.942461967468262, -6.259702682495117, -4.576942443847656, -2.8941826820373535, -1.2114229202270508, 0.47133684158325195, 2.1540966033935547, 3.8368568420410156, 5.51961612701416, 7.202375411987305, 8.885139465332031, 10.567899703979492, 12.250658988952637, 13.933418273925781, 15.616178512573242, 17.298938751220703, 18.98169708251953, 20.664457321166992, 22.347217559814453, 24.029977798461914, 25.712738037109375, 27.395496368408203, 29.078256607055664, 30.761016845703125, 32.44377517700195, 34.12653350830078, 35.809295654296875, 37.4920539855957, 39.1748161315918, 40.857574462890625, 42.54033660888672, 44.22309494018555, 45.905853271484375, 47.58861541748047, 49.2713737487793, 50.954132080078125, 52.63689422607422, 54.31965255737305, 56.002410888671875, 57.68517303466797, 59.3679313659668, 61.050689697265625, 62.73345184326172]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 6.0, 12.0, 11.0, 8.0, 22.0, 35.0, 36.0, 53.0, 69.0, 105.0, 150.0, 229.0, 345.0, 545.0, 895.0, 1334.0, 2320.0, 4357.0, 8130.0, 16160.0, 37479.0, 104100.0, 515827.0, 239263.0, 64865.0, 25819.0, 12023.0, 5974.0, 3381.0, 1860.0, 1065.0, 703.0, 440.0, 280.0, 189.0, 121.0, 99.0, 72.0, 44.0, 33.0, 26.0, 20.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.14453125, -4.9774169921875, -4.810302734375, -4.6431884765625, -4.47607421875, -4.3089599609375, -4.141845703125, -3.9747314453125, -3.8076171875, -3.6405029296875, -3.473388671875, -3.3062744140625, -3.13916015625, -2.9720458984375, -2.804931640625, -2.6378173828125, -2.470703125, -2.3035888671875, -2.136474609375, -1.9693603515625, -1.80224609375, -1.6351318359375, -1.468017578125, -1.3009033203125, -1.1337890625, -0.9666748046875, -0.799560546875, -0.6324462890625, -0.46533203125, -0.2982177734375, -0.131103515625, 0.0360107421875, 0.203125, 0.3702392578125, 0.537353515625, 0.7044677734375, 0.87158203125, 1.0386962890625, 1.205810546875, 1.3729248046875, 1.5400390625, 1.7071533203125, 1.874267578125, 2.0413818359375, 2.20849609375, 2.3756103515625, 2.542724609375, 2.7098388671875, 2.876953125, 3.0440673828125, 3.211181640625, 3.3782958984375, 3.54541015625, 3.7125244140625, 3.879638671875, 4.0467529296875, 4.2138671875, 4.3809814453125, 4.548095703125, 4.7152099609375, 4.88232421875, 5.0494384765625, 5.216552734375, 5.3836669921875, 5.55078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 8.0, 11.0, 18.0, 21.0, 22.0, 41.0, 31.0, 45.0, 54.0, 52.0, 68.0, 50.0, 67.0, 60.0, 64.0, 56.0, 47.0, 53.0, 42.0, 33.0, 40.0, 23.0, 14.0, 17.0, 14.0, 7.0, 10.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.58331298828125, -4.4439697265625, -4.30462646484375, -4.165283203125, -4.02593994140625, -3.8865966796875, -3.74725341796875, -3.60791015625, -3.46856689453125, -3.3292236328125, -3.18988037109375, -3.050537109375, -2.91119384765625, -2.7718505859375, -2.63250732421875, -2.4931640625, -2.35382080078125, -2.2144775390625, -2.07513427734375, -1.935791015625, -1.79644775390625, -1.6571044921875, -1.51776123046875, -1.37841796875, -1.23907470703125, -1.0997314453125, -0.96038818359375, -0.821044921875, -0.68170166015625, -0.5423583984375, -0.40301513671875, -0.263671875, -0.12432861328125, 0.0150146484375, 0.15435791015625, 0.293701171875, 0.43304443359375, 0.5723876953125, 0.71173095703125, 0.85107421875, 0.99041748046875, 1.1297607421875, 1.26910400390625, 1.408447265625, 1.54779052734375, 1.6871337890625, 1.82647705078125, 1.9658203125, 2.10516357421875, 2.2445068359375, 2.38385009765625, 2.523193359375, 2.66253662109375, 2.8018798828125, 2.94122314453125, 3.08056640625, 3.21990966796875, 3.3592529296875, 3.49859619140625, 3.637939453125, 3.77728271484375, 3.9166259765625, 4.05596923828125, 4.1953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 14.0, 12.0, 21.0, 32.0, 50.0, 98.0, 120.0, 160.0, 304.0, 528.0, 1068.0, 2493.0, 8873.0, 59851.0, 910397.0, 51697.0, 8202.0, 2373.0, 986.0, 474.0, 276.0, 171.0, 103.0, 65.0, 42.0, 34.0, 28.0, 13.0, 13.0, 9.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-13.6328125, -13.2784423828125, -12.924072265625, -12.5697021484375, -12.21533203125, -11.8609619140625, -11.506591796875, -11.1522216796875, -10.7978515625, -10.4434814453125, -10.089111328125, -9.7347412109375, -9.38037109375, -9.0260009765625, -8.671630859375, -8.3172607421875, -7.962890625, -7.6085205078125, -7.254150390625, -6.8997802734375, -6.54541015625, -6.1910400390625, -5.836669921875, -5.4822998046875, -5.1279296875, -4.7735595703125, -4.419189453125, -4.0648193359375, -3.71044921875, -3.3560791015625, -3.001708984375, -2.6473388671875, -2.29296875, -1.9385986328125, -1.584228515625, -1.2298583984375, -0.87548828125, -0.5211181640625, -0.166748046875, 0.1876220703125, 0.5419921875, 0.8963623046875, 1.250732421875, 1.6051025390625, 1.95947265625, 2.3138427734375, 2.668212890625, 3.0225830078125, 3.376953125, 3.7313232421875, 4.085693359375, 4.4400634765625, 4.79443359375, 5.1488037109375, 5.503173828125, 5.8575439453125, 6.2119140625, 6.5662841796875, 6.920654296875, 7.2750244140625, 7.62939453125, 7.9837646484375, 8.338134765625, 8.6925048828125, 9.046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 13.0, 17.0, 14.0, 14.0, 17.0, 20.0, 25.0, 36.0, 44.0, 49.0, 57.0, 69.0, 75.0, 75.0, 80.0, 53.0, 57.0, 39.0, 33.0, 26.0, 22.0, 15.0, 17.0, 16.0, 13.0, 15.0, 5.0, 6.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.21875, -14.72998046875, -14.2412109375, -13.75244140625, -13.263671875, -12.77490234375, -12.2861328125, -11.79736328125, -11.30859375, -10.81982421875, -10.3310546875, -9.84228515625, -9.353515625, -8.86474609375, -8.3759765625, -7.88720703125, -7.3984375, -6.90966796875, -6.4208984375, -5.93212890625, -5.443359375, -4.95458984375, -4.4658203125, -3.97705078125, -3.48828125, -2.99951171875, -2.5107421875, -2.02197265625, -1.533203125, -1.04443359375, -0.5556640625, -0.06689453125, 0.421875, 0.91064453125, 1.3994140625, 1.88818359375, 2.376953125, 2.86572265625, 3.3544921875, 3.84326171875, 4.33203125, 4.82080078125, 5.3095703125, 5.79833984375, 6.287109375, 6.77587890625, 7.2646484375, 7.75341796875, 8.2421875, 8.73095703125, 9.2197265625, 9.70849609375, 10.197265625, 10.68603515625, 11.1748046875, 11.66357421875, 12.15234375, 12.64111328125, 13.1298828125, 13.61865234375, 14.107421875, 14.59619140625, 15.0849609375, 15.57373046875, 16.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 18.0, 19.0, 25.0, 40.0, 54.0, 69.0, 107.0, 156.0, 257.0, 398.0, 598.0, 1169.0, 2352.0, 5536.0, 14720.0, 52654.0, 767057.0, 154516.0, 30807.0, 9843.0, 3954.0, 1730.0, 886.0, 539.0, 339.0, 207.0, 152.0, 90.0, 54.0, 58.0, 29.0, 19.0, 22.0, 9.0, 14.0, 4.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.6689453125, -1.618072509765625, -1.56719970703125, -1.516326904296875, -1.4654541015625, -1.414581298828125, -1.36370849609375, -1.312835693359375, -1.261962890625, -1.211090087890625, -1.16021728515625, -1.109344482421875, -1.0584716796875, -1.007598876953125, -0.95672607421875, -0.905853271484375, -0.85498046875, -0.804107666015625, -0.75323486328125, -0.702362060546875, -0.6514892578125, -0.600616455078125, -0.54974365234375, -0.498870849609375, -0.447998046875, -0.397125244140625, -0.34625244140625, -0.295379638671875, -0.2445068359375, -0.193634033203125, -0.14276123046875, -0.091888427734375, -0.041015625, 0.009857177734375, 0.06072998046875, 0.111602783203125, 0.1624755859375, 0.213348388671875, 0.26422119140625, 0.315093994140625, 0.365966796875, 0.416839599609375, 0.46771240234375, 0.518585205078125, 0.5694580078125, 0.620330810546875, 0.67120361328125, 0.722076416015625, 0.77294921875, 0.823822021484375, 0.87469482421875, 0.925567626953125, 0.9764404296875, 1.027313232421875, 1.07818603515625, 1.129058837890625, 1.179931640625, 1.230804443359375, 1.28167724609375, 1.332550048828125, 1.3834228515625, 1.434295654296875, 1.48516845703125, 1.536041259765625, 1.5869140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 7.0, 6.0, 12.0, 11.0, 21.0, 26.0, 18.0, 39.0, 41.0, 79.0, 98.0, 123.0, 130.0, 98.0, 69.0, 65.0, 28.0, 29.0, 24.0, 18.0, 8.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005211830139160156, -0.0005010738968849182, -0.0004809647798538208, -0.0004608556628227234, -0.000440746545791626, -0.00042063742876052856, -0.00040052831172943115, -0.00038041919469833374, -0.00036031007766723633, -0.0003402009606361389, -0.0003200918436050415, -0.0002999827265739441, -0.0002798736095428467, -0.00025976449251174927, -0.00023965537548065186, -0.00021954625844955444, -0.00019943714141845703, -0.00017932802438735962, -0.0001592189073562622, -0.0001391097903251648, -0.00011900067329406738, -9.889155626296997e-05, -7.878243923187256e-05, -5.8673322200775146e-05, -3.8564205169677734e-05, -1.8455088138580322e-05, 1.6540288925170898e-06, 2.1763145923614502e-05, 4.1872262954711914e-05, 6.198137998580933e-05, 8.209049701690674e-05, 0.00010219961404800415, 0.00012230873107910156, 0.00014241784811019897, 0.0001625269651412964, 0.0001826360821723938, 0.0002027451992034912, 0.00022285431623458862, 0.00024296343326568604, 0.00026307255029678345, 0.00028318166732788086, 0.00030329078435897827, 0.0003233999013900757, 0.0003435090184211731, 0.0003636181354522705, 0.0003837272524833679, 0.00040383636951446533, 0.00042394548654556274, 0.00044405460357666016, 0.00046416372060775757, 0.000484272837638855, 0.0005043819546699524, 0.0005244910717010498, 0.0005446001887321472, 0.0005647093057632446, 0.000584818422794342, 0.0006049275398254395, 0.0006250366568565369, 0.0006451457738876343, 0.0006652548909187317, 0.0006853640079498291, 0.0007054731249809265, 0.0007255822420120239, 0.0007456913590431213, 0.0007658004760742188]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 18.0, 8.0, 36.0, 40.0, 51.0, 85.0, 125.0, 234.0, 396.0, 724.0, 1492.0, 3424.0, 9933.0, 38180.0, 728788.0, 219597.0, 30842.0, 8574.0, 3045.0, 1331.0, 680.0, 356.0, 215.0, 128.0, 66.0, 49.0, 35.0, 28.0, 24.0, 15.0, 4.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.0143585205078125, -0.970123291015625, -0.9258880615234375, -0.88165283203125, -0.8374176025390625, -0.793182373046875, -0.7489471435546875, -0.7047119140625, -0.6604766845703125, -0.616241455078125, -0.5720062255859375, -0.52777099609375, -0.4835357666015625, -0.439300537109375, -0.3950653076171875, -0.350830078125, -0.3065948486328125, -0.262359619140625, -0.2181243896484375, -0.17388916015625, -0.1296539306640625, -0.085418701171875, -0.0411834716796875, 0.0030517578125, 0.0472869873046875, 0.091522216796875, 0.1357574462890625, 0.17999267578125, 0.2242279052734375, 0.268463134765625, 0.3126983642578125, 0.35693359375, 0.4011688232421875, 0.445404052734375, 0.4896392822265625, 0.53387451171875, 0.5781097412109375, 0.622344970703125, 0.6665802001953125, 0.7108154296875, 0.7550506591796875, 0.799285888671875, 0.8435211181640625, 0.88775634765625, 0.9319915771484375, 0.976226806640625, 1.0204620361328125, 1.064697265625, 1.1089324951171875, 1.153167724609375, 1.1974029541015625, 1.24163818359375, 1.2858734130859375, 1.330108642578125, 1.3743438720703125, 1.4185791015625, 1.4628143310546875, 1.507049560546875, 1.5512847900390625, 1.59552001953125, 1.6397552490234375, 1.683990478515625, 1.7282257080078125, 1.7724609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 7.0, 10.0, 8.0, 5.0, 7.0, 9.0, 12.0, 17.0, 17.0, 16.0, 18.0, 30.0, 34.0, 43.0, 41.0, 55.0, 67.0, 76.0, 66.0, 77.0, 78.0, 55.0, 41.0, 36.0, 28.0, 38.0, 24.0, 19.0, 13.0, 7.0, 10.0, 4.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3066253662109375, -1.252899169921875, -1.1991729736328125, -1.14544677734375, -1.0917205810546875, -1.037994384765625, -0.9842681884765625, -0.9305419921875, -0.8768157958984375, -0.823089599609375, -0.7693634033203125, -0.71563720703125, -0.6619110107421875, -0.608184814453125, -0.5544586181640625, -0.500732421875, -0.4470062255859375, -0.393280029296875, -0.3395538330078125, -0.28582763671875, -0.2321014404296875, -0.178375244140625, -0.1246490478515625, -0.0709228515625, -0.0171966552734375, 0.036529541015625, 0.0902557373046875, 0.14398193359375, 0.1977081298828125, 0.251434326171875, 0.3051605224609375, 0.35888671875, 0.4126129150390625, 0.466339111328125, 0.5200653076171875, 0.57379150390625, 0.6275177001953125, 0.681243896484375, 0.7349700927734375, 0.7886962890625, 0.8424224853515625, 0.896148681640625, 0.9498748779296875, 1.00360107421875, 1.0573272705078125, 1.111053466796875, 1.1647796630859375, 1.218505859375, 1.2722320556640625, 1.325958251953125, 1.3796844482421875, 1.43341064453125, 1.4871368408203125, 1.540863037109375, 1.5945892333984375, 1.6483154296875, 1.7020416259765625, 1.755767822265625, 1.8094940185546875, 1.86322021484375, 1.9169464111328125, 1.970672607421875, 2.0243988037109375, 2.078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 12.0, 36.0, 39.0, 58.0, 105.0, 526.0, 93.0, 58.0, 23.0, 23.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.39476013183594, -70.82308959960938, -68.25141143798828, -65.67974090576172, -63.108062744140625, -60.53639221191406, -57.964717864990234, -55.393043518066406, -52.82136917114258, -50.24969482421875, -47.67802047729492, -45.106346130371094, -42.53467559814453, -39.96299743652344, -37.391326904296875, -34.81965255737305, -32.24797821044922, -29.67630386352539, -27.104629516601562, -24.532957077026367, -21.96128273010254, -19.38960838317871, -16.817935943603516, -14.246261596679688, -11.67458724975586, -9.102912902832031, -6.5312395095825195, -3.9595656394958496, -1.3878917694091797, 1.1837825775146484, 3.75545597076416, 6.327129364013672, 8.898796081542969, 11.470470428466797, 14.042143821716309, 16.61381721496582, 19.18549156188965, 21.757165908813477, 24.328838348388672, 26.9005126953125, 29.472187042236328, 32.043861389160156, 34.615535736083984, 37.18721008300781, 39.758880615234375, 42.33055877685547, 44.90222930908203, 47.47390365600586, 50.04557800292969, 52.617252349853516, 55.188926696777344, 57.76060104370117, 60.332275390625, 62.90394592285156, 65.47562408447266, 68.04729461669922, 70.61897277832031, 73.19064331054688, 75.76232147216797, 78.33399200439453, 80.90567016601562, 83.47734069824219, 86.04901885986328, 88.62068939208984, 91.1923599243164]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 16.0, 12.0, 21.0, 25.0, 25.0, 25.0, 27.0, 39.0, 93.0, 232.0, 185.0, 39.0, 24.0, 27.0, 27.0, 26.0, 29.0, 18.0, 18.0, 5.0, 4.0, 8.0, 7.0, 8.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.49089431762695, -39.99684143066406, -38.50278854370117, -37.00873565673828, -35.514678955078125, -34.020626068115234, -32.526573181152344, -31.032520294189453, -29.53846549987793, -28.04441261291504, -26.550357818603516, -25.056304931640625, -23.562252044677734, -22.06819725036621, -20.57414436340332, -19.080089569091797, -17.586036682128906, -16.091983795166016, -14.597929000854492, -13.103876113891602, -11.609822273254395, -10.115768432617188, -8.621715545654297, -7.12766170501709, -5.633607864379883, -4.139554023742676, -2.645500659942627, -1.1514472961425781, 0.3426065444946289, 1.836660385131836, 3.3307132720947266, 4.824767112731934, 6.318817138671875, 7.812870979309082, 9.306924819946289, 10.80097770690918, 12.295031547546387, 13.789085388183594, 15.283138275146484, 16.777191162109375, 18.2712459564209, 19.76529884338379, 21.259353637695312, 22.753406524658203, 24.247459411621094, 25.741514205932617, 27.235567092895508, 28.72962188720703, 30.223674774169922, 31.717727661132812, 33.2117805480957, 34.705833435058594, 36.19989013671875, 37.69394302368164, 39.18799591064453, 40.68204879760742, 42.17610168457031, 43.6701545715332, 45.164207458496094, 46.65826416015625, 48.15231704711914, 49.64636993408203, 51.14042282104492, 52.63447570800781, 54.12853240966797]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 11.0, 24.0, 16.0, 28.0, 35.0, 44.0, 48.0, 52.0, 150.0, 285.0, 64.0, 46.0, 32.0, 28.0, 24.0, 22.0, 28.0, 10.0, 15.0, 8.0, 2.0, 8.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.79156494140625, -4.6378173828125, -4.48406982421875, -4.330322265625, -4.17657470703125, -4.0228271484375, -3.86907958984375, -3.71533203125, -3.56158447265625, -3.4078369140625, -3.25408935546875, -3.100341796875, -2.94659423828125, -2.7928466796875, -2.63909912109375, -2.4853515625, -2.33160400390625, -2.1778564453125, -2.02410888671875, -1.870361328125, -1.71661376953125, -1.5628662109375, -1.40911865234375, -1.25537109375, -1.10162353515625, -0.9478759765625, -0.79412841796875, -0.640380859375, -0.48663330078125, -0.3328857421875, -0.17913818359375, -0.025390625, 0.12835693359375, 0.2821044921875, 0.43585205078125, 0.589599609375, 0.74334716796875, 0.8970947265625, 1.05084228515625, 1.20458984375, 1.35833740234375, 1.5120849609375, 1.66583251953125, 1.819580078125, 1.97332763671875, 2.1270751953125, 2.28082275390625, 2.4345703125, 2.58831787109375, 2.7420654296875, 2.89581298828125, 3.049560546875, 3.20330810546875, 3.3570556640625, 3.51080322265625, 3.66455078125, 3.81829833984375, 3.9720458984375, 4.12579345703125, 4.279541015625, 4.43328857421875, 4.5870361328125, 4.74078369140625, 4.89453125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 4.0, 8.0, 5.0, 18.0, 7.0, 17.0, 44.0, 55.0, 115.0, 214.0, 556.0, 2101.0, 17332.0, 8356451.0, 9291.0, 1541.0, 441.0, 153.0, 92.0, 45.0, 18.0, 21.0, 8.0, 15.0, 9.0, 12.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.30021667480469, -35.83097457885742, -34.36172866821289, -32.892486572265625, -31.423240661621094, -29.953998565673828, -28.48475456237793, -27.01551055908203, -25.546266555786133, -24.077022552490234, -22.607778549194336, -21.138534545898438, -19.669292449951172, -18.20004653930664, -16.730804443359375, -15.261560440063477, -13.792316436767578, -12.32307243347168, -10.853828430175781, -9.3845853805542, -7.915341377258301, -6.446097373962402, -4.97685432434082, -3.507610321044922, -2.0383663177490234, -0.5691225528717041, 0.9001212120056152, 2.3693647384643555, 3.838608741760254, 5.307852745056152, 6.777095794677734, 8.246339797973633, 9.715579986572266, 11.184823989868164, 12.654067993164062, 14.123311042785645, 15.592555046081543, 17.061798095703125, 18.531042098999023, 20.000286102294922, 21.46953010559082, 22.93877410888672, 24.408018112182617, 25.877262115478516, 27.34650421142578, 28.815750122070312, 30.284992218017578, 31.754236221313477, 33.223480224609375, 34.69272232055664, 36.16196823120117, 37.63121032714844, 39.10045623779297, 40.569698333740234, 42.0389404296875, 43.50818634033203, 44.97743225097656, 46.44667434692383, 47.91592025756836, 49.385162353515625, 50.854408264160156, 52.32365036010742, 53.79289245605469, 55.26213836669922, 56.731380462646484]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 6.0, 0.0, 4.0, 1.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 12.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.37743377685547, -82.17849731445312, -78.97956085205078, -75.78062438964844, -72.58169555664062, -69.38275909423828, -66.18382263183594, -62.984886169433594, -59.78594970703125, -56.587013244628906, -53.38807678222656, -50.189144134521484, -46.99020767211914, -43.7912712097168, -40.59233856201172, -37.393402099609375, -34.19446563720703, -30.995529174804688, -27.796594619750977, -24.597660064697266, -21.398723602294922, -18.199787139892578, -15.000852584838867, -11.801918029785156, -8.602981567382812, -5.404046058654785, -2.205110549926758, 0.9938249588012695, 4.192760467529297, 7.391695976257324, 10.590631484985352, 13.789566040039062, 16.988494873046875, 20.18743133544922, 23.38636589050293, 26.58530044555664, 29.784236907958984, 32.98317337036133, 36.182106018066406, 39.38104248046875, 42.579978942871094, 45.77891540527344, 48.97785186767578, 52.17678451538086, 55.3757209777832, 58.57465744018555, 61.773590087890625, 64.97252655029297, 68.17146301269531, 71.37039947509766, 74.5693359375, 77.76827239990234, 80.96720886230469, 84.1661376953125, 87.36507415771484, 90.56401062011719, 93.76294708251953, 96.96188354492188, 100.16082000732422, 103.35975646972656, 106.55868530273438, 109.75762176513672, 112.95655822753906, 116.1554946899414, 119.35443115234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 10.0, 18.0, 19.0, 29.0, 36.0, 68.0, 95.0, 160.0, 235.0, 451.0, 863.0, 1545.0, 3145.0, 6289.0, 14220.0, 33376.0, 83394.0, 169613.0, 123058.0, 49839.0, 20120.0, 8843.0, 4147.0, 2054.0, 1119.0, 592.0, 315.0, 221.0, 126.0, 85.0, 53.0, 41.0, 22.0, 10.0, 16.0, 7.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.0517578125, -18.431640625, -17.8115234375, -17.19140625, -16.5712890625, -15.951171875, -15.3310546875, -14.7109375, -14.0908203125, -13.470703125, -12.8505859375, -12.23046875, -11.6103515625, -10.990234375, -10.3701171875, -9.75, -9.1298828125, -8.509765625, -7.8896484375, -7.26953125, -6.6494140625, -6.029296875, -5.4091796875, -4.7890625, -4.1689453125, -3.548828125, -2.9287109375, -2.30859375, -1.6884765625, -1.068359375, -0.4482421875, 0.171875, 0.7919921875, 1.412109375, 2.0322265625, 2.65234375, 3.2724609375, 3.892578125, 4.5126953125, 5.1328125, 5.7529296875, 6.373046875, 6.9931640625, 7.61328125, 8.2333984375, 8.853515625, 9.4736328125, 10.09375, 10.7138671875, 11.333984375, 11.9541015625, 12.57421875, 13.1943359375, 13.814453125, 14.4345703125, 15.0546875, 15.6748046875, 16.294921875, 16.9150390625, 17.53515625, 18.1552734375, 18.775390625, 19.3955078125, 20.015625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 14.0, 23.0, 24.0, 18.0, 42.0, 36.0, 41.0, 50.0, 80.0, 84.0, 75.0, 71.0, 77.0, 72.0, 50.0, 42.0, 40.0, 36.0, 22.0, 25.0, 14.0, 14.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.206512451171875, -5.06146240234375, -4.916412353515625, -4.7713623046875, -4.626312255859375, -4.48126220703125, -4.336212158203125, -4.191162109375, -4.046112060546875, -3.90106201171875, -3.756011962890625, -3.6109619140625, -3.465911865234375, -3.32086181640625, -3.175811767578125, -3.03076171875, -2.885711669921875, -2.74066162109375, -2.595611572265625, -2.4505615234375, -2.305511474609375, -2.16046142578125, -2.015411376953125, -1.870361328125, -1.725311279296875, -1.58026123046875, -1.435211181640625, -1.2901611328125, -1.145111083984375, -1.00006103515625, -0.855010986328125, -0.7099609375, -0.564910888671875, -0.41986083984375, -0.274810791015625, -0.1297607421875, 0.015289306640625, 0.16033935546875, 0.305389404296875, 0.450439453125, 0.595489501953125, 0.74053955078125, 0.885589599609375, 1.0306396484375, 1.175689697265625, 1.32073974609375, 1.465789794921875, 1.61083984375, 1.755889892578125, 1.90093994140625, 2.045989990234375, 2.1910400390625, 2.336090087890625, 2.48114013671875, 2.626190185546875, 2.771240234375, 2.916290283203125, 3.06134033203125, 3.206390380859375, 3.3514404296875, 3.496490478515625, 3.64154052734375, 3.786590576171875, 3.931640625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 13.0, 13.0, 25.0, 70.0, 88.0, 87.0, 72.0, 42.0, 13.0, 6.0, 12.0, 10.0, 9.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.99530029296875, -35.039794921875, -34.08428955078125, -33.1287841796875, -32.17327880859375, -31.217775344848633, -30.262269973754883, -29.306764602661133, -28.351259231567383, -27.395753860473633, -26.440248489379883, -25.484745025634766, -24.529239654541016, -23.573734283447266, -22.618228912353516, -21.662723541259766, -20.707218170166016, -19.751712799072266, -18.796207427978516, -17.840702056884766, -16.88519859313965, -15.929693222045898, -14.974187850952148, -14.018682479858398, -13.063179016113281, -12.107673645019531, -11.152169227600098, -10.196663856506348, -9.241158485412598, -8.285654067993164, -7.330148696899414, -6.374643325805664, -5.419137954711914, -4.463633060455322, -3.5081276893615723, -2.5526227951049805, -1.5971176624298096, -0.6416125297546387, 0.3138923645019531, 1.2693977355957031, 2.224902629852295, 3.180407762527466, 4.135912895202637, 5.0914177894592285, 6.04692268371582, 7.00242805480957, 7.957932949066162, 8.91343879699707, 9.868943214416504, 10.824448585510254, 11.779953002929688, 12.735458374023438, 13.690963745117188, 14.646469116210938, 15.601973533630371, 16.557479858398438, 17.512983322143555, 18.468488693237305, 19.423994064331055, 20.379497528076172, 21.335002899169922, 22.290508270263672, 23.246013641357422, 24.201519012451172, 25.157024383544922]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 11.0, 14.0, 13.0, 45.0, 71.0, 84.0, 70.0, 45.0, 31.0, 20.0, 12.0, 6.0, 8.0, 4.0, 1.0, 4.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.503015518188477, -17.868295669555664, -17.23357391357422, -16.598854064941406, -15.964132308959961, -15.329411506652832, -14.694690704345703, -14.05997085571289, -13.425249099731445, -12.790528297424316, -12.155807495117188, -11.521086692810059, -10.88636589050293, -10.2516450881958, -9.616924285888672, -8.98220443725586, -8.34748363494873, -7.712762832641602, -7.078042030334473, -6.443321228027344, -5.808600425720215, -5.173879623413086, -4.539159297943115, -3.9044384956359863, -3.2697176933288574, -2.6349968910217285, -2.0002760887145996, -1.3655555248260498, -0.7308347225189209, -0.09611392021179199, 0.5386066436767578, 1.1733274459838867, 1.8080482482910156, 2.4427690505981445, 3.0774898529052734, 3.7122104167938232, 4.346931457519531, 4.98165225982666, 5.616372585296631, 6.25109338760376, 6.885814189910889, 7.520534992218018, 8.155255317687988, 8.789976119995117, 9.424696922302246, 10.059417724609375, 10.694138526916504, 11.328859329223633, 11.963580131530762, 12.59830093383789, 13.23302173614502, 13.867742538452148, 14.502463340759277, 15.137184143066406, 15.771903991699219, 16.406625747680664, 17.041345596313477, 17.67606544494629, 18.310787200927734, 18.945507049560547, 19.580228805541992, 20.214948654174805, 20.84967041015625, 21.484390258789062, 22.119112014770508]}, "eval/loss": 4.330733299255371, "eval/wer": 1.92959143197144, "eval/runtime": 943.0842, "eval/samples_per_second": 2.801, "eval/steps_per_second": 0.351, "train/train_runtime": 8505.8878, "train/train_samples_per_second": 3.355, "train/train_steps_per_second": 0.21, "train/total_flos": 0.0, "train/train_loss": 4.4116124524129345} \ No newline at end of file